Merge pull request #601 from knocte/sock_improvements
[mono.git] / mcs / class / System / Test / System.Net / WebUtilityTest.cs
1 //
2 // System.Net.WebUtilityTest.cs
3 //
4 // copied and edited from System.Web.HttpUtilityTest.cs
5 //
6 // Author:
7 //      Sebastien Pouliot  <sebastien@ximian.com>
8 //      Mike Kestner <mkestner@novell.com>
9 //
10 // Copyright (C) 2005, 2010 Novell, Inc (http://www.novell.com)
11 //
12 // Permission is hereby granted, free of charge, to any person obtaining
13 // a copy of this software and associated documentation files (the
14 // "Software"), to deal in the Software without restriction, including
15 // without limitation the rights to use, copy, modify, merge, publish,
16 // distribute, sublicense, and/or sell copies of the Software, and to
17 // permit persons to whom the Software is furnished to do so, subject to
18 // the following conditions:
19 // 
20 // The above copyright notice and this permission notice shall be
21 // included in all copies or substantial portions of the Software.
22 // 
23 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 // EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 // MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 // NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
27 // LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
28 // OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
29 // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
30 //
31
32 #if NET_4_0 && !MOBILE
33
34 using System;
35 using System.Text;
36 using System.Net;
37 using System.IO;
38 using System.Collections.Specialized;
39
40 using NUnit.Framework;
41
42 namespace MonoTests.System.Net {
43
44         [TestFixture]
45         public class WebUtilityTest {
46
47                 [Test]
48                 public void HtmlEncode_LtGt ()
49                 {
50                         Assert.AreEqual ("&lt;script&gt;", WebUtility.HtmlEncode ("<script>"));
51                 }
52
53                 // Notes:
54                 // * this is to avoid a regression that would cause Mono to 
55                 //   fail item #3 of the XSS vulnerabilities listed at:
56                 //   http://it-project.ru/andir/docs/aspxvuln/aspxvuln.en.xml
57                 //   we didn't fall the first time so let's ensure we never will
58                 // * The author notes that Microsoft has decided not to fix 
59                 //   this issue (hence the NotDotNet category).
60
61                 [Test]
62                 [Category ("NotDotNet")]
63 #if TARGET_JVM
64                 [Ignore ("TD #6954")]
65 #endif
66                 public void HtmlEncode_XSS ()
67                 {
68                         string problem = "\xff1cscript\xff1e";  // unicode looks alike <script>
69                         byte[] utf8data = Encoding.UTF8.GetBytes (problem);
70                         Encoding win1251 = Encoding.GetEncoding ("windows-1251");
71                         byte[] windata = Encoding.Convert (Encoding.UTF8, win1251, utf8data);
72                         // now it's a real problem
73                         Assert.AreEqual ("<script>", Encoding.ASCII.GetString (windata), "<script>");
74
75                         string encoded = WebUtility.HtmlEncode (problem);
76                         Assert.AreEqual ("&#65308;script&#65310;", encoded, "&#65308;script&#65310;");
77                         
78                         utf8data = Encoding.UTF8.GetBytes (encoded);
79                         windata = Encoding.Convert (Encoding.UTF8, win1251, utf8data);
80                         Assert.AreEqual ("&#65308;script&#65310;", Encoding.ASCII.GetString (windata), "ok");
81                 }
82
83                 [Test]
84 #if !TARGET_JVM
85                 [Category ("NotWorking")]
86 #endif
87                 public void HtmlEncode () {
88                         for (char c = char.MinValue; c < char.MaxValue; c++) {
89                                 String exp = HtmlEncode (c.ToString ());
90                                 String act = WebUtility.HtmlEncode (c.ToString ());
91                                 Assert.AreEqual (exp, act, "HtmlEncode " + c.ToString () + " [" + (int) c + "]");
92                         }
93                 }
94                 
95                 string HtmlEncode (string s) {
96                         if (s == null)
97                                 return null;
98
99                         bool needEncode = false;
100                         for (int i = 0; i < s.Length; i++) {
101                                 char c = s [i];
102                                 if (c == '&' || c == '"' || c == '<' || c == '>' || c > 159) {
103                                         needEncode = true;
104                                         break;
105                                 }
106                         }
107
108                         if (!needEncode)
109                                 return s;
110
111                         StringBuilder output = new StringBuilder ();
112
113                         int len = s.Length;
114                         for (int i = 0; i < len; i++)
115                                 switch (s [i]) {
116                                 case '&':
117                                         output.Append ("&amp;");
118                                         break;
119                                 case '>':
120                                         output.Append ("&gt;");
121                                         break;
122                                 case '<':
123                                         output.Append ("&lt;");
124                                         break;
125                                 case '"':
126                                         output.Append ("&quot;");
127                                         break;
128                                 default:
129                                         // MS starts encoding with &# from 160 and stops at 255.
130                                         // We don't do that. One reason is the 65308/65310 unicode
131                                         // characters that look like '<' and '>'.
132                                         if (s [i] > 159 && s [i] < 256) {
133                                                 output.Append ("&#");
134                                                 output.Append (((int) s [i]).ToString ());
135                                                 output.Append (";");
136                                         }
137                                         else {
138                                                 output.Append (s [i]);
139                                         }
140                                         break;
141                                 }
142                         return output.ToString ();
143                 }
144
145                 
146                 [Test]
147                 public void EscapedCharacters ()
148                 {
149                         for (int i = 0; i < 256; i++) {
150                                 string str = new string ((char) i, 1);
151                                 string encoded = WebUtility.HtmlEncode (str);
152                                 if ((i > 159 && i < 256 ) || i == '&' || i == '<' || i == '>' || i == '"') {
153                                         if (encoded [0] != '&' || encoded [encoded.Length - 1] != ';')
154                                                 Assert.Fail ("Failed for i = " + i);
155                                 } else if (encoded.Length != 1) {
156                                         Assert.Fail ("Wrong length for i = " + i);
157                                 }
158                         }
159                 }
160
161                 [Test]
162                 public void Decode1 ()
163                 {
164                         Assert.AreEqual ("\xE9", WebUtility.HtmlDecode ("&#233;"));
165                 }
166
167                 [Test]
168                 public void RoundTrip ()
169                 {
170                         string x = "<html>& hello+= world!";
171                         string y = WebUtility.HtmlEncode (x);
172                         string z = WebUtility.HtmlDecode (y);
173                         Assert.AreEqual (x, z);
174                 }
175
176                 [Test]
177                 public void LooksLikeEntity ()
178                 {
179                         string str = "<%# \"hola\" + \"/somepage.aspx?ItemID=\" + DataBinder.Eval(Container.DataItem,\"Country\")" +
180                                         " + \"&mid=\" + ModuleID + \"&pageindex=\" + Request.Params.Get(\"pageindex\") %>";
181                         Assert.AreEqual (str, WebUtility.HtmlDecode (str));
182                 }
183
184                 [Test]
185                 public void EntityEncoding ()
186                 {
187                         var expected = "\u00A0\u00A1\u00A2\u00A3\u00A4\u00A5\u00A6\u00A7\u00A8\u00A9\u00AA\u00AB\u00AC\u00AD\u00AE\u00AF\u00B0\u00B1\u00B2\u00B3\u00B4\u00B5\u00B6\u00B7\u00B8\u00B9\u00BA\u00BB\u00BC\u00BD\u00BE\u00BF\u00C0\u00C1\u00C2\u00C3\u00C4\u00C5\u00C6\u00C7\u00C8\u00C9\u00CA\u00CB\u00CC\u00CD\u00CE\u00CF\u00D0\u00D1\u00D2\u00D3\u00D4\u00D5\u00D6\u00D7\u00D8\u00D9\u00DA\u00DB\u00DC\u00DD\u00DE\u00DF\u00E0\u00E1\u00E2\u00E3\u00E4\u00E5\u00E6\u00E7\u00E8\u00E9\u00EA\u00EB\u00EC\u00ED\u00EE\u00EF\u00F0\u00F1\u00F2\u00F3\u00F4\u00F5\u00F6\u00F7\u00F8\u00F9\u00FA\u00FB\u00FC\u00FD\u00FE\u00FF\u0192\u0391\u0392\u0393\u0394\u0395\u0396\u0397\u0398\u0399\u039A\u039B\u039C\u039D\u039E\u039F\u03A0\u03A1\u03A3\u03A4\u03A5\u03A6\u03A7\u03A8\u03A9\u03B1\u03B2\u03B3\u03B4\u03B5\u03B6\u03B7\u03B8\u03B9\u03BA\u03BB\u03BC\u03BD\u03BE\u03BF\u03C0\u03C1\u03C2\u03C3\u03C4\u03C5\u03C6\u03C7\u03C8\u03C9\u03D1\u03D2\u03D6\u2022\u2026\u2032\u2033\u203E\u2044\u2118\u2111\u211C\u2122\u2135\u2190\u2191\u2192\u2193\u2194\u21B5\u21D0\u21D1\u21D2\u21D3\u21D4\u2200\u2202\u2203\u2205\u2207\u2208\u2209\u220B\u220F\u2211\u2212\u2217\u221A\u221D\u221E\u2220\u2227\u2228\u2229\u222A\u222B\u2234\u223C\u2245\u2248\u2260\u2261\u2264\u2265\u2282\u2283\u2284\u2286\u2287\u2295\u2297\u22A5\u22C5\u2308\u2309\u230A\u230B\u2329\u232A\u25CA\u2660\u2663\u2665\u2666\u0022\u0026\u003C\u003E\u0152\u0153\u0160\u0161\u0178\u02C6\u02DC\u2002\u2003\u2009\u200C\u200D\u200E\u200F\u2013\u2014\u2018\u2019\u201A\u201C\u201D\u201E\u2020\u2021\u2030\u2039\u203A\u20AC";
188
189                         var htmlDecoded = WebUtility.HtmlDecode ("&nbsp;&iexcl;&cent;&pound;&curren;&yen;&brvbar;&sect;&uml;&copy;&ordf;&laquo;&not;&shy;&reg;&macr;&deg;&plusmn;&sup2;&sup3;&acute;&micro;&para;&middot;&cedil;&sup1;&ordm;&raquo;&frac14;&frac12;&frac34;&iquest;&Agrave;&Aacute;&Acirc;&Atilde;&Auml;&Aring;&AElig;&Ccedil;&Egrave;&Eacute;&Ecirc;&Euml;&Igrave;&Iacute;&Icirc;&Iuml;&ETH;&Ntilde;&Ograve;&Oacute;&Ocirc;&Otilde;&Ouml;&times;&Oslash;&Ugrave;&Uacute;&Ucirc;&Uuml;&Yacute;&THORN;&szlig;&agrave;&aacute;&acirc;&atilde;&auml;&aring;&aelig;&ccedil;&egrave;&eacute;&ecirc;&euml;&igrave;&iacute;&icirc;&iuml;&eth;&ntilde;&ograve;&oacute;&ocirc;&otilde;&ouml;&divide;&oslash;&ugrave;&uacute;&ucirc;&uuml;&yacute;&thorn;&yuml;&fnof;&Alpha;&Beta;&Gamma;&Delta;&Epsilon;&Zeta;&Eta;&Theta;&Iota;&Kappa;&Lambda;&Mu;&Nu;&Xi;&Omicron;&Pi;&Rho;&Sigma;&Tau;&Upsilon;&Phi;&Chi;&Psi;&Omega;&alpha;&beta;&gamma;&delta;&epsilon;&zeta;&eta;&theta;&iota;&kappa;&lambda;&mu;&nu;&xi;&omicron;&pi;&rho;&sigmaf;&sigma;&tau;&upsilon;&phi;&chi;&psi;&omega;&thetasym;&upsih;&piv;&bull;&hellip;&prime;&Prime;&oline;&frasl;&weierp;&image;&real;&trade;&alefsym;&larr;&uarr;&rarr;&darr;&harr;&crarr;&lArr;&uArr;&rArr;&dArr;&hArr;&forall;&part;&exist;&empty;&nabla;&isin;&notin;&ni;&prod;&sum;&minus;&lowast;&radic;&prop;&infin;&ang;&and;&or;&cap;&cup;&int;&there4;&sim;&cong;&asymp;&ne;&equiv;&le;&ge;&sub;&sup;&nsub;&sube;&supe;&oplus;&otimes;&perp;&sdot;&lceil;&rceil;&lfloor;&rfloor;&lang;&rang;&loz;&spades;&clubs;&hearts;&diams;&quot;&amp;&lt;&gt;&OElig;&oelig;&Scaron;&scaron;&Yuml;&circ;&tilde;&ensp;&emsp;&thinsp;&zwnj;&zwj;&lrm;&rlm;&ndash;&mdash;&lsquo;&rsquo;&sbquo;&ldquo;&rdquo;&bdquo;&dagger;&Dagger;&permil;&lsaquo;&rsaquo;&euro;");
190                         
191                         Assert.AreEqual (expected, htmlDecoded);
192                 }
193         }
194 }
195 #endif
196