Add new test
[mono.git] / mcs / mcs / cs-tokenizer.cs
1 //\r
2 // cs-tokenizer.cs: The Tokenizer for the C# compiler\r
3 //                  This also implements the preprocessor\r
4 //\r
5 // Author: Miguel de Icaza (miguel@gnu.org)\r
6 //\r
7 // Licensed under the terms of the GNU GPL\r
8 //\r
9 // (C) 2001 Ximian, Inc (http://www.ximian.com)\r
10 //\r
11 \r
12 /*\r
13  * TODO:\r
14  *   Make sure we accept the proper Unicode ranges, per the spec.\r
15  *   Report error 1032\r
16 */\r
17 \r
18 using System;\r
19 using System.Text;\r
20 using System.Collections;\r
21 using System.IO;\r
22 using System.Globalization;\r
23 \r
24 namespace Mono.CSharp\r
25 {\r
26         /// <summary>\r
27         ///    Tokenizer for C# source code. \r
28         /// </summary>\r
29 \r
30         public class Tokenizer : yyParser.yyInput\r
31         {\r
32                 StreamReader reader;\r
33                 public string ref_name;\r
34                 public int ref_line = 1;\r
35                 public int line = 1;\r
36                 public int col = 1;\r
37                 public int current_token;\r
38                 bool handle_get_set = false;\r
39                 bool handle_remove_add = false;\r
40                 bool handle_assembly = false;\r
41 \r
42                 //\r
43                 // Whether tokens have been seen on this line\r
44                 //\r
45                 bool tokens_seen = false;\r
46                 \r
47                 //\r
48                 // Returns a verbose representation of the current location\r
49                 //\r
public string location {
        get {
                // Error details are only reported while the current token is
                // Token.ERROR; otherwise the trailing part stays empty.
                string details = (current_token == Token.ERROR)
                        ? "detail: " + error_details
                        : "";

                // Physical position inside the input, as "(line,col)".
                string position = "(" + line + "," + col + ")";

                return ref_name + " " + position + ", Token:" + current_token + " " + details;
        }
}
66 \r
//
// Exposes the handle_get_set flag.  is_keyword () reports `get' and
// `set' as keywords only while this flag is true.
//
public bool PropertyParsing {
        get { return this.handle_get_set; }
        set { this.handle_get_set = value; }
}
76 \r
//
// Exposes the handle_assembly flag.  is_keyword () reports `assembly'
// as a keyword only while this flag is true.
//
public bool AssemblyTargetParsing {
        get { return this.handle_assembly; }
        set { this.handle_assembly = value; }
}
86 \r
//
// Exposes the handle_remove_add flag.  is_keyword () reports `remove'
// and `add' as keywords only while this flag is true.
//
public bool EventParsing {
        get { return this.handle_remove_add; }
        set { this.handle_remove_add = value; }
}
96                 \r
97                 //\r
98                 // Class variables\r
99                 // \r
100                 static Hashtable keywords;\r
101                 static NumberStyles styles;\r
102                 static NumberFormatInfo csharp_format_info;\r
103                 \r
104                 //\r
105                 // Values for the associated token returned\r
106                 //\r
107                 System.Text.StringBuilder number;\r
108                 int putback_char;\r
109                 Object val;\r
110 \r
111                 //\r
112                 // Pre-processor\r
113                 //\r
114                 Hashtable defines;\r
115 \r
116                 const int TAKING        = 1;\r
117                 const int TAKEN_BEFORE  = 2;\r
118                 const int ELSE_SEEN     = 4;\r
119                 const int PARENT_TAKING = 8;\r
120                 \r
121                 //\r
122                 // pre-processor if stack state:\r
123                 //\r
124                 Stack ifstack;\r
125                 \r
126                 //\r
127                 // Details about the error encoutered by the tokenizer\r
128                 //\r
129                 string error_details;\r
130                 \r
//
// Read-only view of the error_details field.
//
public string error {
        get { return this.error_details; }
}
136                 \r
//
// Read-only view of the `line' field.
//
public int Line {
        get { return this.line; }
}
142 \r
//
// Read-only view of the `col' field.
//
public int Col {
        get { return this.col; }
}
148                 \r
//
// Builds the static `keywords' table, which maps every keyword
// spelling to its Token constant.
//
static void InitTokens ()
{
        // Flat list of (spelling, token) pairs, registered in this order.
        object [] pairs = {
                "abstract", Token.ABSTRACT,
                "as", Token.AS,
                "add", Token.ADD,
                "assembly", Token.ASSEMBLY,
                "base", Token.BASE,
                "bool", Token.BOOL,
                "break", Token.BREAK,
                "byte", Token.BYTE,
                "case", Token.CASE,
                "catch", Token.CATCH,
                "char", Token.CHAR,
                "checked", Token.CHECKED,
                "class", Token.CLASS,
                "const", Token.CONST,
                "continue", Token.CONTINUE,
                "decimal", Token.DECIMAL,
                "default", Token.DEFAULT,
                "delegate", Token.DELEGATE,
                "do", Token.DO,
                "double", Token.DOUBLE,
                "else", Token.ELSE,
                "enum", Token.ENUM,
                "event", Token.EVENT,
                "explicit", Token.EXPLICIT,
                "extern", Token.EXTERN,
                "false", Token.FALSE,
                "finally", Token.FINALLY,
                "fixed", Token.FIXED,
                "float", Token.FLOAT,
                "for", Token.FOR,
                "foreach", Token.FOREACH,
                "goto", Token.GOTO,
                "get", Token.GET,
                "if", Token.IF,
                "implicit", Token.IMPLICIT,
                "in", Token.IN,
                "int", Token.INT,
                "interface", Token.INTERFACE,
                "internal", Token.INTERNAL,
                "is", Token.IS,
                "lock", Token.LOCK,
                "long", Token.LONG,
                "namespace", Token.NAMESPACE,
                "new", Token.NEW,
                "null", Token.NULL,
                "object", Token.OBJECT,
                "operator", Token.OPERATOR,
                "out", Token.OUT,
                "override", Token.OVERRIDE,
                "params", Token.PARAMS,
                "private", Token.PRIVATE,
                "protected", Token.PROTECTED,
                "public", Token.PUBLIC,
                "readonly", Token.READONLY,
                "ref", Token.REF,
                "remove", Token.REMOVE,
                "return", Token.RETURN,
                "sbyte", Token.SBYTE,
                "sealed", Token.SEALED,
                "set", Token.SET,
                "short", Token.SHORT,
                "sizeof", Token.SIZEOF,
                "stackalloc", Token.STACKALLOC,
                "static", Token.STATIC,
                "string", Token.STRING,
                "struct", Token.STRUCT,
                "switch", Token.SWITCH,
                "this", Token.THIS,
                "throw", Token.THROW,
                "true", Token.TRUE,
                "try", Token.TRY,
                "typeof", Token.TYPEOF,
                "uint", Token.UINT,
                "ulong", Token.ULONG,
                "unchecked", Token.UNCHECKED,
                "unsafe", Token.UNSAFE,
                "ushort", Token.USHORT,
                "using", Token.USING,
                "virtual", Token.VIRTUAL,
                "void", Token.VOID,
                "volatile", Token.VOLATILE,
                "while", Token.WHILE
        };

        Hashtable table = new Hashtable ();
        for (int i = 0; i < pairs.Length; i += 2)
                table.Add (pairs [i], pairs [i + 1]);

        keywords = table;
}
236 \r
237                 //\r
238                 // Class initializer\r
239                 // \r
static Tokenizer ()
{
        InitTokens ();

        //
        // Real literals are parsed with `styles' below.  AllowDecimalPoint
        // is matched against NumberDecimalSeparator; the currency
        // separator only applies when a currency symbol is allowed and
        // present.  Pin the number separator to "." and keep the currency
        // one as it was.
        //
        csharp_format_info = new NumberFormatInfo ();
        csharp_format_info.NumberDecimalSeparator = ".";
        csharp_format_info.CurrencyDecimalSeparator = ".";

        styles = NumberStyles.AllowExponent | NumberStyles.AllowDecimalPoint;
}
247 \r
//
// Tells whether `name' is currently a keyword.  The words get/set,
// remove/add and assembly are only keywords while the matching
// handle_* flag is on; everything else is decided by the `keywords'
// table.
//
bool is_keyword (string name)
{
        if (!handle_get_set && (name == "get" || name == "set"))
                return false;

        if (!handle_remove_add && (name == "remove" || name == "add"))
                return false;

        if (!handle_assembly && name == "assembly")
                return false;

        return keywords.Contains (name);
}
261 \r
//
// Returns the Token constant stored in the `keywords' table for `name'.
// The unboxing cast throws if `name' has no entry in the table.
//
int GetKeyword (string name)
{
        object token = keywords [name];

        return (int) token;
}
266 \r
//
// Builds a new Location from the current value of ref_line.
//
public Location Location {
        get { return new Location (this.ref_line); }
}
272                 \r
//
// Creates a tokenizer that reads from `input' through a StreamReader.
// `fname' becomes the reference name and is pushed onto
// Mono.CSharp.Location.  When `defs' is not null, each of its strings
// is entered in the `defines' table.
//
public Tokenizer (System.IO.Stream input, string fname, ArrayList defs)
{
        ref_name = fname;
        reader = new StreamReader (input);

        // -1 marks "no character has been put back".
        putback_char = -1;

        if (defs != null){
                defines = new Hashtable ();

                foreach (string symbol in defs)
                        defines [symbol] = true;
        }

        //
        // FIXME: a plain `Location.Push' could be used here, but we
        // first have to find out why the MS compiler allows it.
        //
        Mono.CSharp.Location.Push (fname);
}
291 \r
//
// Tells whether `c' may start an identifier: an underscore, or a
// character of Unicode class Lu, Ll, Lt, Lm, Lo or Nl.
//
bool is_identifier_start_character (char c)
{
        if (c == '_' || Char.IsLetter (c))
                return true;

        // Char.IsLetter does not cover the letter-number class (Nl),
        // for example U+2163 ROMAN NUMERAL FOUR.
        return Char.GetUnicodeCategory (c) == UnicodeCategory.LetterNumber;
}
296 \r
//
// Tells whether `c' may appear after the first character of an
// identifier: an underscore, a letter, a decimal digit, or a character
// of Unicode class Nl, Mn, Mc or Pc.
//
// Formatting characters (Cf) are not accepted here.  The language
// specification wants them removed from the identifier, which a plain
// predicate cannot do.
//
bool is_identifier_part_character (char c)
{
        if (c == '_' || Char.IsLetter (c) || Char.IsDigit (c))
                return true;

        switch (Char.GetUnicodeCategory (c)){
        case UnicodeCategory.LetterNumber:
        case UnicodeCategory.NonSpacingMark:
        case UnicodeCategory.SpacingCombiningMark:
        case UnicodeCategory.ConnectorPunctuation:
                return true;

        default:
                return false;
        }
}
301 \r
//
// Classifies the punctuation or operator token that begins with `c'.
//
// `doread' is cleared on entry and set to true when the returned token
// also includes the character that peekChar () currently reports; that
// character is not consumed here (presumably the caller reads it).
// For the shift operators the second `<' or `>' is consumed here with
// getChar ().
//
// Returns Token.ERROR when `c' does not begin any known token.
//
int is_punct (char c, ref bool doread)
{
        doread = false;

        // Tokens that are fully determined by their first character.
        switch (c){
        case '{': return Token.OPEN_BRACE;
        case '}': return Token.CLOSE_BRACE;
        case '[': return Token.OPEN_BRACKET;
        case ']': return Token.CLOSE_BRACKET;
        case '(': return Token.OPEN_PARENS;
        case ')': return Token.CLOSE_PARENS;
        case ',': return Token.COMMA;
        case ':': return Token.COLON;
        case ';': return Token.SEMICOLON;
        case '~': return Token.TILDE;
        case '?': return Token.INTERR;
        }

        // Everything else needs one character of lookahead.
        int next = peekChar ();

        switch (c){
        case '+':
                if (next == '+'){
                        doread = true;
                        return Token.OP_INC;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_ADD_ASSIGN;
                }
                return Token.PLUS;

        case '-':
                if (next == '-'){
                        doread = true;
                        return Token.OP_DEC;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_SUB_ASSIGN;
                }
                if (next == '>'){
                        doread = true;
                        return Token.OP_PTR;
                }
                return Token.MINUS;

        case '!':
                if (next == '='){
                        doread = true;
                        return Token.OP_NE;
                }
                return Token.BANG;

        case '=':
                if (next == '='){
                        doread = true;
                        return Token.OP_EQ;
                }
                return Token.ASSIGN;

        case '&':
                if (next == '&'){
                        doread = true;
                        return Token.OP_AND;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_AND_ASSIGN;
                }
                return Token.BITWISE_AND;

        case '|':
                if (next == '|'){
                        doread = true;
                        return Token.OP_OR;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_OR_ASSIGN;
                }
                return Token.BITWISE_OR;

        case '*':
                if (next == '='){
                        doread = true;
                        return Token.OP_MULT_ASSIGN;
                }
                return Token.STAR;

        case '/':
                if (next == '='){
                        doread = true;
                        return Token.OP_DIV_ASSIGN;
                }
                return Token.DIV;

        case '%':
                if (next == '='){
                        doread = true;
                        return Token.OP_MOD_ASSIGN;
                }
                return Token.PERCENT;

        case '^':
                if (next == '='){
                        doread = true;
                        return Token.OP_XOR_ASSIGN;
                }
                return Token.CARRET;

        case '<':
                if (next == '<'){
                        // Consume the second `<' and look one further.
                        getChar ();
                        if (peekChar () == '='){
                                doread = true;
                                return Token.OP_SHIFT_LEFT_ASSIGN;
                        }
                        return Token.OP_SHIFT_LEFT;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_LE;
                }
                return Token.OP_LT;

        case '>':
                if (next == '>'){
                        // Consume the second `>' and look one further.
                        getChar ();
                        if (peekChar () == '='){
                                doread = true;
                                return Token.OP_SHIFT_RIGHT_ASSIGN;
                        }
                        return Token.OP_SHIFT_RIGHT;
                }
                if (next == '='){
                        doread = true;
                        return Token.OP_GE;
                }
                return Token.OP_GT;
        }

        return Token.ERROR;
}
464 \r
//
// Appends `c' to `number' (unless it is -1) and then consumes the run
// of decimal digits that follows in the input, appending each one.
//
// Returns true when at least one digit was consumed from the input;
// the seed character `c' does not count.
//
// Only the ASCII digits 0-9 are accepted.  Char.IsDigit would also let
// through other Unicode decimal digits, which the numeric parsers
// applied to `number' afterwards reject.
//
bool decimal_digits (int c)
{
        bool seen_digits = false;

        if (c != -1)
                number.Append ((char) c);

        // peekChar () returns -1 at end of input, which fails the range test.
        for (int d = peekChar (); d >= '0' && d <= '9'; d = peekChar ()){
                number.Append ((char) d);
                getChar ();
                seen_digits = true;
        }

        return seen_digits;
}
484 \r
//
// Appends `c' to `number' (unless it is -1) and then consumes the run
// of hexadecimal digits that follows in the input.  Letters are
// appended in upper case.
//
// Only 0-9, a-f and A-F are accepted, and the case folding is done
// arithmetically.  Char.IsDigit would also accept other Unicode
// decimal digits, and Char.ToUpper depends on the current culture.
//
void hex_digits (int c)
{
        if (c != -1)
                number.Append ((char) c);

        for (;;){
                // peekChar () returns -1 at end of input, which matches no range.
                int d = peekChar ();

                if (d >= 'a' && d <= 'f')
                        d = d - 'a' + 'A';
                else if (!((d >= '0' && d <= '9') || (d >= 'A' && d <= 'F')))
                        break;

                number.Append ((char) d);
                getChar ();
        }
}
501                 \r
//
// Maps a real-literal suffix character to its literal token:
// F/f to LITERAL_FLOAT, D/d to LITERAL_DOUBLE, M/m to LITERAL_DECIMAL.
// Any other value yields Token.NONE.
//
int real_type_suffix (int c)
{
        switch (c){
        case 'F':
        case 'f':
                return Token.LITERAL_FLOAT;

        case 'D':
        case 'd':
                return Token.LITERAL_DOUBLE;

        case 'M':
        case 'm':
                return Token.LITERAL_DECIMAL;
        }

        return Token.NONE;
}
521 \r
//
// Scans the optional U/u and L/l suffix characters of an integer
// literal, starting with `c' (-1 means there is nothing to scan), and
// stores `ul' in `val' boxed as the type selected by the suffixes and
// the magnitude of the value.  Always returns Token.LITERAL_INTEGER.
//
int integer_type_suffix (ulong ul, int c)
{
        bool is_unsigned = false;
        bool is_long = false;

        bool more = (c != -1);
        while (more){
                switch (c){
                case 'U': case 'u':
                        // A repeated suffix is still consumed, but ends the scan.
                        more = !is_unsigned;
                        is_unsigned = true;
                        getChar ();
                        break;

                case 'l':
                        if (!is_unsigned){
                                //
                                // if we have not seen anything in between
                                // report this error
                                //
                                Report.Warning (
                                        78, Location,
                                        "the 'l' suffix is easily confused with digit `1'," +
                                        " use 'L' for clarity");
                        }
                        goto case 'L';

                case 'L':
                        // A repeated suffix is still consumed, but ends the scan.
                        more = !is_long;
                        is_long = true;
                        getChar ();
                        break;

                default:
                        more = false;
                        break;
                }

                // Look at the next candidate (also done after the last one).
                c = peekChar ();
        }

        bool fits_32_bits = ul <= (ulong) UInt32.MaxValue;
        bool needs_ulong = ul > (ulong) Int64.MaxValue;

        if (is_unsigned && is_long){
                val = ul;
                return Token.LITERAL_INTEGER;
        }

        if (is_unsigned){
                // uint if possible, or ulong else.
                if (fits_32_bits)
                        val = (uint) ul;
                else
                        val = ul;
        } else if (is_long || !fits_32_bits){
                // long if possible, ulong otherwise
                if (needs_ulong)
                        val = ul;
                else
                        val = (long) ul;
        } else {
                // no suffix and at most 32 bits: int if possible, uint otherwise
                uint ui = (uint) ul;

                if (ui > (uint) Int32.MaxValue)
                        val = ui;
                else
                        val = (int) ui;
        }

        return Token.LITERAL_INTEGER;
}
600                                 \r
601                 //\r
602                 // given `c' as the next char in the input decide whether\r
603                 // we need to convert to a special type, and then choose\r
604                 // the best representation for the integer\r
605                 //\r
int adjust_int (int c)
{
        // `number' holds the text accumulated for the literal.
        string digits = number.ToString ();
        ulong parsed = UInt64.Parse (digits);

        return integer_type_suffix (parsed, c);
}
611 \r
//
// Parses the text accumulated in `number' as the real type selected by
// `t' and stores the result in `val':
//
//   Token.LITERAL_DECIMAL -> decimal
//   Token.LITERAL_DOUBLE  -> double
//   Token.LITERAL_FLOAT   -> float (parsed as double, then narrowed)
//   Token.NONE            -> double; Token.LITERAL_DOUBLE is returned
//
// Returns the resulting token type.  Any other `t' is returned
// unchanged and `val' is left untouched.
//
int adjust_real (int t)
{
        string s = number.ToString ();

        switch (t){
        case Token.LITERAL_DECIMAL:
                val = System.Decimal.Parse (s, styles, csharp_format_info);
                break;

        case Token.LITERAL_FLOAT:
                val = (float) System.Double.Parse (s, styles, csharp_format_info);
                break;

        case Token.NONE:
                // No suffix: the literal is a double.
                t = Token.LITERAL_DOUBLE;
                goto case Token.LITERAL_DOUBLE;

        case Token.LITERAL_DOUBLE:
                val = System.Double.Parse (s, styles, csharp_format_info);
                break;
        }

        return t;
}
642 \r
643                 //\r
644                 // Invoked if we know we have .digits or digits\r
645                 //\r
646                 int is_number (int c)\r
647                 {\r
648                         bool is_real = false;\r
649                         number = new System.Text.StringBuilder ();\r
650                         int type;\r
651 \r
652                         number.Length = 0;\r
653 \r
654                         if (Char.IsDigit ((char)c)){\r
655                                 if (c == '0' && peekChar () == 'x' || peekChar () == 'X'){\r
656                                         ulong ul;\r
657                                         getChar ();\r
658                                         hex_digits (-1);\r
659 \r
660                                         string s = number.ToString ();\r
661 \r
662                                         ul = System.UInt64.Parse (s, NumberStyles.HexNumber);\r
663                                         return integer_type_suffix (ul, peekChar ());\r
664                                 }\r
665                                 decimal_digits (c);\r
666                                 c = getChar ();\r
667                         }\r
668 \r
669                         //\r
670                         // We need to handle the case of\r
671                         // "1.1" vs "1.string" (LITERAL_FLOAT vs NUMBER DOT IDENTIFIER)\r
672                         //\r
673                         if (c == '.'){\r
674                                 if (decimal_digits ('.')){\r
675                                         is_real = true;\r
676                                         c = getChar ();\r
677                                 } else {\r
678                                         putback ('.');\r
679                                         number.Length -= 1;\r
680                                         return adjust_int (-1);\r
681                                 }\r
682                         }\r
683                         \r
684                         if (c == 'e' || c == 'E'){\r
685                                 is_real = true;\r
686                                 number.Append ("e");\r
687                                 c = getChar ();\r
688                                 \r
689                                 if (c == '+'){\r
690                                         number.Append ((char) c);\r
691                                         c = getChar ();\r
692                                 } else if (c == '-'){\r
693                                         number.Append ((char) c);\r
694                                         c = getChar ();\r
695                                 }\r
696                                 decimal_digits (-1);\r
697                                 c = getChar ();\r
698                         }\r
699 \r
700                         type = real_type_suffix (c);\r
701                         if (type == Token.NONE && !is_real){\r
702                                 putback (c);\r
703                                 return adjust_int (c);\r
704                         } else \r
705                                 is_real = true;\r
706 \r
707                         if (type == Token.NONE){\r
708                                 putback (c);\r
709                         }\r
710                         \r
711                         if (is_real)\r
712                                 return adjust_real (type);\r
713 \r
714                         Console.WriteLine ("This should not be reached");\r
715                         throw new Exception ("Is Number should never reach this point");\r
716                 }\r
717                         \r
718                 int escape (int c)\r
719                 {\r
720                         int d;\r
721                         int v;\r
722 \r
723                         d = peekChar ();\r
724                         if (c != '\\')\r
725                                 return c;\r
726                         \r
727                         switch (d){\r
728                         case 'a':\r
729                                 v = '\a'; break;\r
730                         case 'b':\r
731                                 v = '\b'; break;\r
732                         case 'n':\r
733                                 v = '\n'; break;\r
734                         case 't':\r
735                                 v = '\t'; break;\r
736                         case 'v':\r
737                                 v = '\v'; break;\r
738                         case 'r':\r
739                                 v = '\r'; break;\r
740                         case '\\':\r
741                                 v = '\\'; break;\r
742                         case 'f':\r
743                                 v = '\f'; break;\r
744                         case '0':\r
745                                 v = 0; break;\r
746                         case '"':\r
747                                 v = '"'; break;\r
748                         case '\'':\r
749                                 v = '\''; break;\r
750                         default:\r
751                                 error_details = "cs1009: Unrecognized escape sequence " + (char)d;\r
752                                 return -1;\r
753                         }\r
754                         getChar ();\r
755                         return v;\r
756                 }\r
757 \r
758                 int getChar ()\r
759                 {\r
760                         if (putback_char != -1){\r
761                                 int x = putback_char;\r
762                                 putback_char = -1;\r
763 \r
764                                 return x;\r
765                         }\r
766                         return reader.Read ();\r
767                 }\r
768 \r
769                 int peekChar ()\r
770                 {\r
771                         if (putback_char != -1)\r
772                                 return putback_char;\r
773                         return reader.Peek ();\r
774                 }\r
775 \r
776                 void putback (int c)\r
777                 {\r
778                         if (putback_char != -1)\r
779                                 throw new Exception ("This should not happen putback on putback");\r
780                         putback_char = c;\r
781                 }\r
782 \r
783                 public bool advance ()\r
784                 {\r
785                         return peekChar () != -1;\r
786                 }\r
787 \r
788                 public Object Value {\r
789                         get {\r
790                                 return val;\r
791                         }\r
792                 }\r
793 \r
794                 public Object value ()\r
795                 {\r
796                         return val;\r
797                 }\r
798                 \r
799                 public int token ()\r
800                 {\r
801                         current_token = xtoken ();\r
802                         return current_token;\r
803                 }\r
804 \r
805                 static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();\r
806                 \r
807                 void get_cmd_arg (out string cmd, out string arg)\r
808                 {\r
809                         int c;\r
810                         \r
811                         tokens_seen = false;\r
812                         arg = "";\r
813                         static_cmd_arg.Length = 0;\r
814                                 \r
815                         while ((c = getChar ()) != -1 && (c != '\n') && ((c != ' ') || c == '\t')){\r
816                                 if (c == '\r')\r
817                                         continue;\r
818                                 static_cmd_arg.Append ((char) c);\r
819                         }\r
820 \r
821                         cmd = static_cmd_arg.ToString ();\r
822 \r
823                         if (c == '\n'){\r
824                                 line++;\r
825                                 ref_line++;\r
826                                 return;\r
827                         }\r
828 \r
829                         // skip over white space\r
830                         while ((c = getChar ()) != -1 && (c != '\n') && ((c == ' ') || (c == '\t')))\r
831                                 ;\r
832 \r
833                         if (c == '\n'){\r
834                                 line++;\r
835                                 ref_line++;\r
836                                 return;\r
837                         }\r
838                         \r
839                         static_cmd_arg.Length = 0;\r
840                         static_cmd_arg.Append ((char) c);\r
841                         \r
842                         while ((c = getChar ()) != -1 && (c != '\n')){\r
843                                 if (c == '\r')\r
844                                         continue;\r
845                                 static_cmd_arg.Append ((char) c);\r
846                         }\r
847 \r
848                         if (c == '\n'){\r
849                                 line++;\r
850                                 ref_line++;\r
851                         }\r
852                         arg = static_cmd_arg.ToString ().Trim ();\r
853                 }\r
854 \r
855                 //\r
856                 // Handles the #line directive\r
857                 //\r
858                 bool PreProcessLine (string arg)\r
859                 {\r
860                         if (arg == "")\r
861                                 return false;\r
862 \r
863                         if (arg == "default"){\r
864                                 line = ref_line = line;\r
865                                 return false;\r
866                         }\r
867                         \r
868                         try {\r
869                                 int pos;\r
870 \r
871                                 if ((pos = arg.IndexOf (' ')) != -1 && pos != 0){\r
872                                         ref_line = System.Int32.Parse (arg.Substring (0, pos));\r
873                                         pos++;\r
874                                         \r
875                                         char [] quotes = { '\"' };\r
876                                         \r
877                                         ref_name = arg.Substring (pos);\r
878                                         ref_name.TrimStart (quotes);\r
879                                         ref_name.TrimEnd (quotes);\r
880                                 } else {\r
881                                         ref_line = System.Int32.Parse (arg);\r
882                                 }\r
883                         } catch {\r
884                                 return false;\r
885                         }\r
886                         \r
887                         return true;\r
888                 }\r
889 \r
890                 //\r
891                 // Handles #define and #undef\r
892                 //\r
893                 void PreProcessDefinition (bool is_define, string arg)\r
894                 {\r
895                         if (arg == "" || arg == "true" || arg == "false"){\r
896                                 Report.Error(1001, Location, "Missing identifer to pre-processor directive");\r
897                                 return;\r
898                         }\r
899 \r
900                         if (is_define){\r
901                                 if (defines == null)\r
902                                         defines = new Hashtable ();\r
903                                 defines [arg] = 1;\r
904                         } else {\r
905                                 if (defines == null)\r
906                                         return;\r
907                                 if (defines.Contains (arg))\r
908                                         defines.Remove (arg);\r
909                         }\r
910                 }\r
911 \r
912                 bool eval_val (string s)\r
913                 {\r
914                         if (s == "true")\r
915                                 return true;\r
916                         if (s == "false")\r
917                                 return false;\r
918                         \r
919                         if (defines == null)\r
920                                 return false;\r
921                         if (defines.Contains (s))\r
922                                 return true;\r
923 \r
924                         return false;\r
925                 }\r
926 \r
927                 bool pp_primary (ref string s)\r
928                 {\r
929                         s.Trim ();\r
930                         int len = s.Length;\r
931 \r
932                         if (len > 0){\r
933                                 char c = s [0];\r
934                                 \r
935                                 if (c == '('){\r
936                                         s = s.Substring (1);\r
937                                         bool val = pp_expr (ref s);\r
938                                         if (s.Length > 0 && s [0] == ')')\r
939                                                 return val;\r
940                                         report1517 ();\r
941                                         return false;\r
942                                 }\r
943                                 \r
944                                 if (Char.IsLetter (c) || c == '_'){\r
945                                         int j = 1;\r
946 \r
947                                         while (j < len){\r
948                                                 c = s [j];\r
949                                                 \r
950                                                 if (Char.IsLetter (c) || Char.IsDigit (c) || c == '_'){\r
951                                                         j++;\r
952                                                         continue;\r
953                                                 }\r
954                                                 bool v = eval_val (s.Substring (0, j));\r
955                                                 s = s.Substring (j);\r
956                                                 return v;\r
957                                         }\r
958                                         bool vv = eval_val (s);\r
959                                         s = "";\r
960                                         return vv;\r
961                                 }\r
962                         }\r
963                         report1517 ();\r
964                         return false;\r
965                 }\r
966                 \r
967                 bool pp_unary (ref string s)\r
968                 {\r
969                         s = s.Trim ();\r
970                         int len = s.Length;\r
971 \r
972                         if (len > 0){\r
973                                 if (s [0] == '!'){\r
974                                         if (len > 1 && s [1] == '='){\r
975                                                 report1517 ();\r
976                                                 return false;\r
977                                         }\r
978                                         s = s.Substring (1);\r
979                                         return ! pp_primary (ref s);\r
980                                 } else\r
981                                         return pp_primary (ref s);\r
982                         } else {\r
983                                 report1517 ();\r
984                                 return false;\r
985                         }\r
986                 }\r
987                 \r
988                 bool pp_eq (ref string s)\r
989                 {\r
990                         bool va = pp_unary (ref s);\r
991 \r
992                         s = s.Trim ();\r
993                         int len = s.Length;\r
994                         if (len > 0){\r
995                                 if (s [0] == '='){\r
996                                         if (len > 2 && s [1] == '='){\r
997                                                 s = s.Substring (2);\r
998                                                 return va == pp_unary (ref s);\r
999                                         } else {\r
1000                                                 report1517 ();\r
1001                                                 return false;\r
1002                                         }\r
1003                                 } else if (s [0] == '!' && len > 1 && s [1] == '='){\r
1004                                         s = s.Substring (2);\r
1005 \r
1006                                         return va != pp_unary (ref s);\r
1007 \r
1008                                 }\r
1009                         }\r
1010 \r
1011                         return va;\r
1012                                 \r
1013                 }\r
1014                 \r
1015                 bool pp_and (ref string s)\r
1016                 {\r
1017                         bool va = pp_eq (ref s);\r
1018 \r
1019                         s = s.Trim ();\r
1020                         int len = s.Length;\r
1021                         if (len > 0){\r
1022                                 if (s [0] == '&'){\r
1023                                         if (len > 2 && s [1] == '&'){\r
1024                                                 s = s.Substring (2);\r
1025                                                 return va && pp_eq (ref s);\r
1026                                         } else {\r
1027                                                 report1517 ();\r
1028                                                 return false;\r
1029                                         }\r
1030                                 } \r
1031                         }\r
1032                         return va;\r
1033                 }\r
1034                 \r
1035                 //\r
1036                 // Evaluates an expression for `#if' or `#elif'\r
1037                 //\r
1038                 bool pp_expr (ref string s)\r
1039                 {\r
1040                         bool va = pp_and (ref s);\r
1041 \r
1042                         s = s.Trim ();\r
1043                         int len = s.Length;\r
1044                         if (len > 0){\r
1045                                 if (s [0] == '|'){\r
1046                                         if (len > 2 && s [1] == '|'){\r
1047                                                 s = s.Substring (2);\r
1048                                                 return va || pp_and (ref s);\r
1049                                         } else {\r
1050                                                 report1517 ();\r
1051                                                 return false;\r
1052                                         }\r
1053                                 } else {\r
1054                                         report1517 ();\r
1055                                         return false;\r
1056                                 }\r
1057                         }\r
1058 \r
1059                         return va;\r
1060                 }\r
1061 \r
1062                 bool eval (string s)\r
1063                 {\r
1064                         bool v = pp_expr (ref s);\r
1065 \r
1066                         return v;\r
1067                 }\r
1068                 \r
1069                 void report1517 ()\r
1070                 {\r
1071                         Report.Error (1517, Location, "Invalid pre-processor directive");\r
1072                 }\r
1073 \r
1074                 void report1028 (string extra)\r
1075                 {\r
1076                         Report.Error (\r
1077                                 1028, Location,\r
1078                                 "Unexpected processor directive (" + extra + ")");\r
1079                 }\r
1080                 \r
1081                 //\r
1082                 // if true, then the code continues processing the code\r
1083                 // if false, the code stays in a loop until another directive is\r
1084                 // reached.\r
1085                 //\r
1086                 bool handle_preprocessing_directive ()\r
1087                 {\r
1088                         char [] blank = { ' ', '\t' };\r
1089                         string cmd, arg;\r
1090                         \r
1091                         get_cmd_arg (out cmd, out arg);\r
1092                         \r
1093                         switch (cmd){\r
1094                         case "line":\r
1095                                 if (!PreProcessLine (arg))\r
1096                                         Report.Error (\r
1097                                                 1576, Location,\r
1098                                                 "Argument to #line directive is missing or invalid");\r
1099                                 return true;\r
1100 \r
1101                         case "define":\r
1102                                 PreProcessDefinition (true, arg);\r
1103                                 return true;\r
1104 \r
1105                         case "undef":\r
1106                                 PreProcessDefinition (false, arg);\r
1107                                 return true;\r
1108 \r
1109                         case "error":\r
1110                                 Report.Error (1029, Location, "#error: '" + arg + "'");\r
1111                                 return true;\r
1112 \r
1113                         case "warning":\r
1114                                 Report.Warning (1030, Location, "#warning: '" + arg + "'");\r
1115                                 return true;\r
1116 \r
1117                         case "region":\r
1118                                 arg = "true";\r
1119                                 goto case "if";\r
1120 \r
1121                         case "endregion":\r
1122                                 goto case "endif";\r
1123                                 \r
1124                         case "if":\r
1125                                 if (arg == ""){\r
1126                                         report1517 ();\r
1127                                         return true;\r
1128                                 }\r
1129                                 bool taking = false;\r
1130                                 if (ifstack == null)\r
1131                                         ifstack = new Stack ();\r
1132 \r
1133                                 if (ifstack.Count == 0){\r
1134                                         taking = true;\r
1135                                 } else {\r
1136                                         int state = (int) ifstack.Peek ();\r
1137                                         if ((state & TAKING) != 0)\r
1138                                                 taking = true;\r
1139                                 }\r
1140                                         \r
1141                                 if (eval (arg) && taking){\r
1142                                         ifstack.Push (TAKING | TAKEN_BEFORE | PARENT_TAKING);\r
1143                                         return true;\r
1144                                 } else {\r
1145                                         ifstack.Push (taking ? PARENT_TAKING : 0);\r
1146                                         return false;\r
1147                                 }\r
1148                                 \r
1149                         case "endif":\r
1150                                 if (ifstack == null || ifstack.Count == 0){\r
1151                                         report1028 ("no #if for this #endif");\r
1152                                         return true;\r
1153                                 } else {\r
1154                                         ifstack.Pop ();\r
1155                                         if (ifstack.Count == 0)\r
1156                                                 return true;\r
1157                                         else {\r
1158                                                 int state = (int) ifstack.Peek ();\r
1159 \r
1160                                                 if ((state & TAKING) != 0)\r
1161                                                         return true;\r
1162                                                 else\r
1163                                                         return false;\r
1164                                         }\r
1165                                 }\r
1166 \r
1167                         case "elif":\r
1168                                 if (ifstack == null || ifstack.Count == 0){\r
1169                                         report1028 ("no #if for this #elif");\r
1170                                         return true;\r
1171                                 } else {\r
1172                                         int state = (int) ifstack.Peek ();\r
1173 \r
1174                                         if ((state & ELSE_SEEN) != 0){\r
1175                                                 report1028 ("#elif not valid after #else");\r
1176                                                 return true;\r
1177                                         }\r
1178 \r
1179                                         if ((state & (TAKEN_BEFORE | TAKING)) != 0)\r
1180                                                 return false;\r
1181 \r
1182                                         if (eval (arg) && ((state & PARENT_TAKING) != 0)){\r
1183                                                 state = (int) ifstack.Pop ();\r
1184                                                 ifstack.Push (state | TAKING | TAKEN_BEFORE);\r
1185                                                 return true;\r
1186                                         } else \r
1187                                                 return false;\r
1188                                 }\r
1189 \r
1190                         case "else":\r
1191                                 if (ifstack == null || ifstack.Count == 0){\r
1192                                         Report.Error (\r
1193                                                 1028, Location,\r
1194                                                 "Unexpected processor directive (no #if for this #else)");\r
1195                                         return true;\r
1196                                 } else {\r
1197                                         int state = (int) ifstack.Peek ();\r
1198 \r
1199                                         if ((state & ELSE_SEEN) != 0){\r
1200                                                 report1028 ("#else within #else");\r
1201                                                 return true;\r
1202                                         }\r
1203 \r
1204                                         ifstack.Pop ();\r
1205                                         ifstack.Push (state | ELSE_SEEN);\r
1206 \r
1207                                         if ((state & TAKEN_BEFORE) == 0){\r
1208                                                 if ((state & PARENT_TAKING) != 0)\r
1209                                                         return true;\r
1210                                                 else\r
1211                                                         return false;\r
1212                                         }\r
1213                                         return false;\r
1214                                 }\r
1215                         }\r
1216                         \r
1217                         Report.Error (1024, "Preprocessor directive expected (got: " + cmd + ")");\r
1218                         return true;\r
1219                 }\r
1220                 \r
1221                 public int xtoken ()\r
1222                 {\r
1223                         int t;\r
1224                         bool allow_keyword_as_ident = false;\r
1225                         bool doread = false;\r
1226                         int c;\r
1227 \r
1228                         val = null;\r
1229                         // optimization: eliminate col and implement #directive semantic correctly.\r
1230                         for (;(c = getChar ()) != -1; col++) {\r
1231                                 if (is_identifier_start_character ((char) c)){\r
1232                                         System.Text.StringBuilder id = new System.Text.StringBuilder ();\r
1233                                         string ids;\r
1234 \r
1235                                         tokens_seen = true;\r
1236                                         id.Append ((char) c);\r
1237                                         \r
1238                                         while ((c = peekChar ()) != -1) {\r
1239                                                 if (is_identifier_part_character ((char) c)){\r
1240                                                         id.Append ((char)getChar ());\r
1241                                                         col++;\r
1242                                                 } else \r
1243                                                         break;\r
1244                                         }\r
1245                                         \r
1246                                         ids = id.ToString ();\r
1247 \r
1248                                         if (!is_keyword (ids) || allow_keyword_as_ident) {\r
1249                                                 val = ids;\r
1250                                                 if (ids.Length > 512){\r
1251                                                         Report.Error (\r
1252                                                                 645, Location,\r
1253                                                                 "Identifier too long (limit is 512 chars)");\r
1254                                                 }\r
1255                                                 allow_keyword_as_ident = false;\r
1256                                                 return Token.IDENTIFIER;\r
1257                                         }\r
1258 \r
1259                                         // true, false and null are in the hash anyway.\r
1260                                         return GetKeyword (ids);\r
1261 \r
1262                                 }\r
1263 \r
1264                                 if (c == '.'){\r
1265                                         tokens_seen = true;\r
1266                                         if (Char.IsDigit ((char) peekChar ()))\r
1267                                                 return is_number (c);\r
1268                                         return Token.DOT;\r
1269                                 }\r
1270                                 \r
1271                                 if (Char.IsDigit ((char) c)){\r
1272                                         tokens_seen = true;\r
1273                                         return is_number (c);\r
1274                                 }\r
1275 \r
1276                                 // Handle double-slash comments.\r
1277                                 if (c == '/'){\r
1278                                         int d = peekChar ();\r
1279                                 \r
1280                                         if (d == '/'){\r
1281                                                 getChar ();\r
1282                                                 while ((d = getChar ()) != -1 && (d != '\n'))\r
1283                                                         col++;\r
1284                                                 line++;\r
1285                                                 ref_line++;\r
1286                                                 col = 0;\r
1287                                                 continue;\r
1288                                         } else if (d == '*'){\r
1289                                                 getChar ();\r
1290 \r
1291                                                 while ((d = getChar ()) != -1){\r
1292                                                         if (d == '*' && peekChar () == '/'){\r
1293                                                                 getChar ();\r
1294                                                                 col++;\r
1295                                                                 break;\r
1296                                                         }\r
1297                                                         if (d == '\n'){\r
1298                                                                 line++;\r
1299                                                                 ref_line++;\r
1300                                                                 col = 0;\r
1301                                                         }\r
1302                                                 }\r
1303                                                 continue;\r
1304                                         }\r
1305                                 }\r
1306 \r
1307                                 /* Process pre-processor directives; when the handler returns false, skip input up to the next line that starts with '#' */\r
1308                                 // FIXME: In C# the '#' is not limited to appear\r
1309                                 // on the first column.\r
1310                                 if (c == '#' && !tokens_seen){\r
1311                                 start_again:\r
1312                                         \r
1313                                         bool cont = handle_preprocessing_directive ();\r
1314 \r
1315                                         if (cont){\r
1316                                                 col = 0;\r
1317                                                 continue;\r
1318                                         }\r
1319                                         col = 1;\r
1320 \r
1321                                         bool skipping = false;\r
1322                                         for (;(c = getChar ()) != -1; col++){\r
1323                                                 if (c == '\n'){\r
1324                                                         col = 0;\r
1325                                                         line++;\r
1326                                                         ref_line++;\r
1327                                                         skipping = false;\r
1328                                                 } else if (c == ' ' || c == '\t' || c == '\v' || c == '\r')\r
1329                                                         continue;\r
1330                                                 else if (c != '#')\r
1331                                                         skipping = true;\r
1332                                                 if (c == '#' && !skipping)\r
1333                                                         goto start_again;\r
1334                                         }\r
1335                                         tokens_seen = false;\r
1336                                         if (c == -1)\r
1337                                                 Report.Error (1027, Location, "#endif expected");\r
1338                                         continue;\r
1339                                 }\r
1340                                 \r
1341                                 if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){\r
1342                                         tokens_seen = true;\r
1343                                         if (doread){\r
1344                                                 getChar ();\r
1345                                                 col++;\r
1346                                         }\r
1347                                         return t;\r
1348                                 }\r
1349                                 \r
1350                                 if (c == '"'){\r
1351                                         System.Text.StringBuilder s = new System.Text.StringBuilder ();\r
1352                                         tokens_seen = true;\r
1353                                         \r
1354                                         while ((c = getChar ()) != -1){\r
1355                                                 if (c == '"'){\r
1356                                                         allow_keyword_as_ident = false;\r
1357                                                         val = s.ToString ();\r
1358                                                         return Token.LITERAL_STRING;\r
1359                                                 }\r
1360 \r
1361                                                 if (!allow_keyword_as_ident){\r
1362                                                         c = escape (c);\r
1363                                                         if (c == -1)\r
1364                                                                 return Token.ERROR;\r
1365                                                 }\r
1366                                                 s.Append ((char) c);\r
1367                                         }\r
1368                                 }\r
1369 \r
1370                                 if (c == '\''){\r
1371                                         c = getChar ();\r
1372                                         tokens_seen = true;\r
1373                                         if (c == '\''){\r
1374                                                 error_details = "Empty character literal";\r
1375                                                 Report.Error (1011, Location, error_details);\r
1376                                                 return Token.ERROR;\r
1377                                         }\r
1378                                         c = escape (c);\r
1379                                         if (c == -1)\r
1380                                                 return Token.ERROR;\r
1381                                         val = new System.Char ();\r
1382                                         val = (char) c;\r
1383                                         c = getChar ();\r
1384 \r
1385                                         if (c != '\''){\r
1386                                                 error_details = "Too many characters in character literal";\r
1387                                                 Report.Error (1012, Location, error_details);\r
1388 \r
1389                                                 // Try to recover, read until newline or next "'"\r
1390                                                 while ((c = getChar ()) != -1){\r
1391                                                         if (c == '\n' || c == '\'')\r
1392                                                                 break;\r
1393                                                         \r
1394                                                 }\r
1395                                                 return Token.ERROR;\r
1396                                         }\r
1397                                         return Token.LITERAL_CHARACTER;\r
1398                                 }\r
1399                                 \r
1400                                 // white space\r
1401                                 if (c == '\n'){\r
1402                                         line++;\r
1403                                         ref_line++;\r
1404                                         col = 0;\r
1405                                         tokens_seen = false;\r
1406                                         continue;\r
1407                                 }\r
1408 \r
1409                                 if (c == ' ' || c == '\t' || c == '\f' || c == '\v' || c == '\r'){\r
1410                                         if (c == '\t')\r
1411                                                 col = (((col + 8) / 8) * 8) - 1;\r
1412                                         continue;\r
1413                                 }\r
1414 \r
1415                                 if (c == '@'){\r
1416                                         tokens_seen = true;\r
1417                                         allow_keyword_as_ident = true;\r
1418                                         continue;\r
1419                                 }\r
1420 \r
1421                                 error_details = ((char)c).ToString ();\r
1422                                 \r
1423                                 return Token.ERROR;\r
1424                         }\r
1425 \r
1426                         if (ifstack != null && ifstack.Count > 1)\r
1427                                 Report.Error (1027, Location, "#endif expected");\r
1428                         return Token.EOF;\r
1429                 }\r
1430         }\r
1431 }\r
1432 \r