**** Merged from MCS ****
[mono.git] / mcs / gmcs / cs-tokenizer.cs
1 //\r
2 // cs-tokenizer.cs: The Tokenizer for the C# compiler\r
3 //                  This also implements the preprocessor\r
4 //\r
5 // Author: Miguel de Icaza (miguel@gnu.org)\r
6 //\r
7 // Licensed under the terms of the GNU GPL\r
8 //\r
9 // (C) 2001, 2002 Ximian, Inc (http://www.ximian.com)\r
10 //\r
11 \r
12 /*\r
13  * TODO:\r
14  *   Make sure we accept the proper Unicode ranges, per the spec.\r
15  *   Report error 1032\r
16 */\r
17 \r
18 using System;\r
19 using System.Text;\r
20 using System.Collections;\r
21 using System.IO;\r
22 using System.Globalization;\r
23 using System.Reflection;\r
24 \r
25 namespace Mono.CSharp\r
26 {\r
27         /// <summary>\r
28         ///    Tokenizer for C# source code. \r
29         /// </summary>\r
30 \r
31         public class Tokenizer : yyParser.yyInput\r
32         {\r
33                 SeekableStreamReader reader;\r
34                 public SourceFile ref_name;\r
35                 public SourceFile file_name;\r
36                 public int ref_line = 1;\r
37                 public int line = 1;\r
38                 public int col = 1;\r
39                 public int current_token;\r
40                 bool handle_get_set = false;\r
41                 bool handle_remove_add = false;\r
42                 bool handle_assembly = false;\r
43                 bool handle_constraints = false;\r
44 \r
45                 //\r
46                 // Whether tokens have been seen on this line\r
47                 //\r
48                 bool tokens_seen = false;\r
49 \r
50                 //\r
51                 // Whether a token has been seen on the file\r
52                 // This is needed because `define' is not allowed to be used\r
53                 // after a token has been seen.\r
54                 //\r
55                 bool any_token_seen = false;\r
56                 static Hashtable tokenValues;\r
57                 \r
//
// Map from Token constant values to their field names, built on
// first access and cached in `tokenValues'.
//
private static Hashtable TokenValueName {
        get {
                if (tokenValues != null)
                        return tokenValues;

                tokenValues = GetTokenValueNameHash ();
                return tokenValues;
        }
}
67 \r
//
// Reflects over the public fields of `Token' and returns a table
// keyed by the value of every static literal `int' field, with the
// field name as the entry.
//
private static Hashtable GetTokenValueNameHash ()
{
        Hashtable names_by_value = new Hashtable ();

        foreach (FieldInfo fi in typeof (Token).GetFields ()) {
                bool is_int_constant = fi.IsLiteral && fi.IsStatic && fi.FieldType == typeof (int);
                if (!is_int_constant)
                        continue;

                names_by_value.Add (fi.GetValue (null), fi.Name);
        }

        return names_by_value;
}
79                 \r
//
// Verbose description of the current position:
//   "<ref file name> (<ref_line>,<col>), Token: <name> <detail>"
// The token is shown by its `Token' constant name when one is known,
// otherwise by its numeric value.  The detail part is only filled in
// when the current token is Token.ERROR.
//
public string location {
        get {
                string detail = "";
                if (current_token == Token.ERROR)
                        detail = "detail: " + error_details;

                string token_name = TokenValueName [current_token] as string;
                if (token_name == null)
                        token_name = current_token.ToString ();

                return String.Format ("{0} ({1},{2}), Token: {3} {4}",
                                      ref_name.Name, ref_line, col, token_name, detail);
        }
}
106 \r
//
// While true, GetKeyword reports `get' and `set' as keyword tokens.
//
public bool PropertyParsing {
        get { return handle_get_set; }
        set { handle_get_set = value; }
}
116 \r
//
// While true, GetKeyword reports `assembly' as a keyword token.
//
public bool AssemblyTargetParsing {
        get { return handle_assembly; }
        set { handle_assembly = value; }
}
126 \r
//
// While true, GetKeyword reports `add' and `remove' as keyword tokens.
//
public bool EventParsing {
        get { return handle_remove_add; }
        set { handle_remove_add = value; }
}
136 \r
//
// While true, GetKeyword reports `where' as a keyword token.
//
public bool ConstraintsParsing {
        get { return handle_constraints; }
        set { handle_constraints = value; }
}
146                 \r
147                 //\r
148                 // Class variables\r
149                 // \r
150                 static CharArrayHashtable[] keywords;\r
151                 static NumberStyles styles;\r
152                 static NumberFormatInfo csharp_format_info;\r
153                 \r
154                 //\r
155                 // Values for the associated token returned\r
156                 //\r
157                 int putback_char;\r
158                 Object val;\r
159 \r
160                 //\r
161                 // Pre-processor\r
162                 //\r
163                 Hashtable defines;\r
164 \r
165                 const int TAKING        = 1;\r
166                 const int TAKEN_BEFORE  = 2;\r
167                 const int ELSE_SEEN     = 4;\r
168                 const int PARENT_TAKING = 8;\r
169                 const int REGION        = 16;           \r
170 \r
171                 //\r
172                 // pre-processor if stack state:\r
173                 //\r
174                 Stack ifstack;\r
175 \r
176                 static System.Text.StringBuilder string_builder;\r
177 \r
178                 const int max_id_size = 512;\r
179                 static char [] id_builder = new char [max_id_size];\r
180 \r
181                 static CharArrayHashtable [] identifiers = new CharArrayHashtable [max_id_size + 1];\r
182 \r
183                 const int max_number_size = 128;\r
184                 static char [] number_builder = new char [max_number_size];\r
185                 static int number_pos;\r
186                 \r
187                 //\r
188                 // Details about the error encountered by the tokenizer\r
189                 //\r
190                 string error_details;\r
191                 \r
//
// Read-only view of `error_details'.
//
public string error {
        get { return error_details; }
}
197                 \r
//
// Current line as tracked in `ref_line' (not the `line' field).
//
public int Line {
        get { return ref_line; }
}
203 \r
//
// Current column, as tracked in `col'.
//
public int Col {
        get { return col; }
}
209 \r
//
// Registers `kw' -> `token' in the keyword table for words of the
// same length, creating that table the first time it is needed.
//
static void AddKeyword (string kw, int token)
{
        int len = kw.Length;

        CharArrayHashtable same_length = keywords [len];
        if (same_length == null) {
                same_length = new CharArrayHashtable (len);
                keywords [len] = same_length;
        }

        same_length [kw.ToCharArray ()] = token;
}
216 \r
//
// Allocates the per-length keyword tables (room for lengths 0..63)
// and registers every keyword the tokenizer knows about.  The words
// are grouped by role purely for readability; each one lands in the
// table selected by its length, so registration order is irrelevant.
//
static void InitTokens ()
{
        keywords = new CharArrayHashtable [64];

        // Built-in type names
        AddKeyword ("bool", Token.BOOL);
        AddKeyword ("byte", Token.BYTE);
        AddKeyword ("char", Token.CHAR);
        AddKeyword ("decimal", Token.DECIMAL);
        AddKeyword ("double", Token.DOUBLE);
        AddKeyword ("float", Token.FLOAT);
        AddKeyword ("int", Token.INT);
        AddKeyword ("long", Token.LONG);
        AddKeyword ("object", Token.OBJECT);
        AddKeyword ("sbyte", Token.SBYTE);
        AddKeyword ("short", Token.SHORT);
        AddKeyword ("string", Token.STRING);
        AddKeyword ("uint", Token.UINT);
        AddKeyword ("ulong", Token.ULONG);
        AddKeyword ("ushort", Token.USHORT);
        AddKeyword ("void", Token.VOID);

        // Literals
        AddKeyword ("false", Token.FALSE);
        AddKeyword ("null", Token.NULL);
        AddKeyword ("true", Token.TRUE);

        // Declarations
        AddKeyword ("class", Token.CLASS);
        AddKeyword ("delegate", Token.DELEGATE);
        AddKeyword ("enum", Token.ENUM);
        AddKeyword ("event", Token.EVENT);
        AddKeyword ("interface", Token.INTERFACE);
        AddKeyword ("namespace", Token.NAMESPACE);
        AddKeyword ("struct", Token.STRUCT);
        AddKeyword ("using", Token.USING);

        // Member and type modifiers
        AddKeyword ("abstract", Token.ABSTRACT);
        AddKeyword ("const", Token.CONST);
        AddKeyword ("explicit", Token.EXPLICIT);
        AddKeyword ("extern", Token.EXTERN);
        AddKeyword ("implicit", Token.IMPLICIT);
        AddKeyword ("internal", Token.INTERNAL);
        AddKeyword ("override", Token.OVERRIDE);
        AddKeyword ("private", Token.PRIVATE);
        AddKeyword ("protected", Token.PROTECTED);
        AddKeyword ("public", Token.PUBLIC);
        AddKeyword ("readonly", Token.READONLY);
        AddKeyword ("sealed", Token.SEALED);
        AddKeyword ("static", Token.STATIC);
        AddKeyword ("unsafe", Token.UNSAFE);
        AddKeyword ("virtual", Token.VIRTUAL);
        AddKeyword ("volatile", Token.VOLATILE);

        // Parameter modifiers
        AddKeyword ("out", Token.OUT);
        AddKeyword ("params", Token.PARAMS);
        AddKeyword ("ref", Token.REF);

        // Statements
        AddKeyword ("break", Token.BREAK);
        AddKeyword ("case", Token.CASE);
        AddKeyword ("catch", Token.CATCH);
        AddKeyword ("continue", Token.CONTINUE);
        AddKeyword ("default", Token.DEFAULT);
        AddKeyword ("do", Token.DO);
        AddKeyword ("else", Token.ELSE);
        AddKeyword ("finally", Token.FINALLY);
        AddKeyword ("fixed", Token.FIXED);
        AddKeyword ("for", Token.FOR);
        AddKeyword ("foreach", Token.FOREACH);
        AddKeyword ("goto", Token.GOTO);
        AddKeyword ("if", Token.IF);
        AddKeyword ("in", Token.IN);
        AddKeyword ("lock", Token.LOCK);
        AddKeyword ("return", Token.RETURN);
        AddKeyword ("switch", Token.SWITCH);
        AddKeyword ("throw", Token.THROW);
        AddKeyword ("try", Token.TRY);
        AddKeyword ("while", Token.WHILE);

        // Expressions and operators
        AddKeyword ("as", Token.AS);
        AddKeyword ("base", Token.BASE);
        AddKeyword ("checked", Token.CHECKED);
        AddKeyword ("is", Token.IS);
        AddKeyword ("new", Token.NEW);
        AddKeyword ("operator", Token.OPERATOR);
        AddKeyword ("sizeof", Token.SIZEOF);
        AddKeyword ("stackalloc", Token.STACKALLOC);
        AddKeyword ("this", Token.THIS);
        AddKeyword ("typeof", Token.TYPEOF);
        AddKeyword ("unchecked", Token.UNCHECKED);

        // Words GetKeyword only reports while the matching handle_* flag is set
        AddKeyword ("add", Token.ADD);
        AddKeyword ("assembly", Token.ASSEMBLY);
        AddKeyword ("get", Token.GET);
        AddKeyword ("remove", Token.REMOVE);
        AddKeyword ("set", Token.SET);
        AddKeyword ("where", Token.WHERE);
}
305 \r
//
// Class initializer: sets up the shared string builder, the number
// parsing settings and the keyword tables.
//
static Tokenizer ()
{
        string_builder = new System.Text.StringBuilder ();

        styles = NumberStyles.Float;
        csharp_format_info = NumberFormatInfo.InvariantInfo;

        InitTokens ();
}
317 \r
//
// Looks `id' up in the keyword table for words of length `id_len'.
//
// Returns the keyword's token, or -1 when the word is not a keyword.
// `get'/`set', `add'/`remove', `assembly' and `where' are only
// reported while their handle_* flag is set; otherwise they also
// yield -1.
//
int GetKeyword (char[] id, int id_len)
{
        if (id_len >= keywords.Length)
                return -1;

        CharArrayHashtable same_length = keywords [id_len];
        if (same_length == null)
                return -1;

        object hit = same_length [id];
        if (hit == null)
                return -1;

        int res = (int) hit;

        switch (res) {
        case Token.GET:
        case Token.SET:
                return handle_get_set ? res : -1;

        case Token.REMOVE:
        case Token.ADD:
                return handle_remove_add ? res : -1;

        case Token.ASSEMBLY:
                return handle_assembly ? res : -1;

        case Token.WHERE:
                return handle_constraints ? res : -1;

        default:
                return res;
        }
}
345 \r
//
// A new Location built from the current `ref_line'.
//
public Location Location {
        get { return new Location (ref_line); }
}
351 \r
//
// Marks the preprocessor symbol `def' as defined, both in the global
// RootContext.AllDefines table and in this tokenizer's own `defines'.
// Defining an already-known symbol is a no-op.
//
void define (string def)
{
        // The constructor only allocates `defines' when it is handed a
        // non-null list of initial symbols, so create the table on first
        // use instead of failing with a NullReferenceException.
        if (defines == null)
                defines = new Hashtable ();

        if (!RootContext.AllDefines.Contains (def))
                RootContext.AllDefines [def] = true;

        if (!defines.Contains (def))
                defines [def] = true;
}
361                 \r
//
// Creates a tokenizer reading from `input'.  `file' becomes both the
// physical and the reference source file, and every entry of `defs'
// (when a list is supplied) is registered as a defined symbol.
//
public Tokenizer (SeekableStreamReader input, SourceFile file, ArrayList defs)
{
        reader = input;
        putback_char = -1;

        ref_name = file;
        file_name = file;

        if (defs != null) {
                defines = new Hashtable ();
                for (int i = 0; i < defs.Count; i++)
                        define ((string) defs [i]);
        }

        //
        // FIXME: ideally this would be spelled `Location.Push'; we still
        // have to find out why the MS compiler accepts that form.
        //
        Mono.CSharp.Location.Push (file);
}
382 \r
//
// Drops the reference to the shared `identifiers' tables.
//
public static void Cleanup ()
{
        identifiers = null;
}
386 \r
//
// True when `c' may begin an identifier: an underscore or a
// letter-character as defined by the C# specification (Unicode
// classes Lu, Ll, Lt, Lm, Lo and Nl).
//
static bool is_identifier_start_character (char c)
{
        // Fast path for the ASCII range.
        if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_')
                return true;
        if (c < 0x80)
                return false;

        // Char.IsLetter covers Lu/Ll/Lt/Lm/Lo but not letter numbers (Nl),
        // which the specification also allows at the start of an identifier.
        return Char.IsLetter (c) ||
                Char.GetUnicodeCategory (c) == UnicodeCategory.LetterNumber;
}
391 \r
//
// True when `c' may appear after the first character of an
// identifier: letters, underscore, decimal digits, connector
// punctuation and combining marks, following the identifier grammar
// of the C# specification.
//
// Formatting characters (class Cf) are deliberately not accepted
// here: the specification requires them to be dropped from the
// identifier, and this predicate cannot do that.
//
static bool is_identifier_part_character (char c)
{
        // Fast path for the ASCII range.
        if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || (c >= '0' && c <= '9'))
                return true;
        if (c < 0x80)
                return false;

        if (Char.IsLetter (c))
                return true;

        switch (Char.GetUnicodeCategory (c)) {
        case UnicodeCategory.LetterNumber:
        case UnicodeCategory.DecimalDigitNumber:
        case UnicodeCategory.ConnectorPunctuation:
        case UnicodeCategory.NonSpacingMark:
        case UnicodeCategory.SpacingCombiningMark:
                return true;
        default:
                return false;
        }
}
396                 
//
// True when `s' is non-empty, starts with an identifier-start
// character and continues with identifier-part characters only.
// Null and the empty string are rejected.
//
public static bool IsValidIdentifier (string s)
{
        if (s == null)
                return false;

        int len = s.Length;
        if (len == 0 || !is_identifier_start_character (s [0]))
                return false;

        int pos = 1;
        while (pos < len) {
                if (!is_identifier_part_character (s [pos]))
                        return false;
                pos++;
        }

        return true;
}
411 \r
//
// Reads tokens following a `<' to decide whether it opens a generic
// argument list.  The accepted shape is a sequence of identifiers or
// built-in type keywords separated by `,' or `.', each optionally
// followed by a nested `<...>' list, and closed by OP_GENERICS_GT.
//
// Returns true once the closing token is reached and false on the
// first token that does not fit.  Tokens are consumed through
// token (); the method itself does not rewind the reader.
//
bool parse_less_than ()
{
        while (true) {
                // A component must start with a name or a built-in type.
                switch (token ()) {
                case Token.IDENTIFIER:
                case Token.OBJECT:
                case Token.STRING:
                case Token.BOOL:
                case Token.DECIMAL:
                case Token.FLOAT:
                case Token.DOUBLE:
                case Token.SBYTE:
                case Token.BYTE:
                case Token.SHORT:
                case Token.USHORT:
                case Token.INT:
                case Token.UINT:
                case Token.LONG:
                case Token.ULONG:
                case Token.CHAR:
                case Token.VOID:
                        break;

                default:
                        return false;
                }

                // Then: close the list, move on to the next component, or
                // descend into any number of nested argument lists.
                bool next_component = false;
                while (!next_component) {
                        int follower = token ();

                        if (follower == Token.OP_GENERICS_GT)
                                return true;

                        if (follower == Token.COMMA || follower == Token.DOT) {
                                next_component = true;
                        } else if (follower == Token.OP_GENERICS_LT) {
                                if (!parse_less_than ())
                                        return false;
                        } else {
                                return false;
                        }
                }
        }
}
454 \r
455                 bool parsing_less_than = false;\r
456                 int parsing_generic_less_than = 0;\r
457 \r
//
// Maps the punctuation character `c' (already read) to its token.
//
// `doread' is cleared on entry and set to true when the token also
// includes the character currently returned by peekChar (), which
// this method has not consumed.  Token.ERROR is returned when `c'
// does not start any known punctuator.
//
// `)' and `<' may look ahead with token () / parse_less_than ();
// in both cases the reader position is restored and the putback
// character cleared afterwards.
//
int is_punct (char c, ref bool doread)
{
        doread = false;

        switch (c) {
        case '{':
                return Token.OPEN_BRACE;
        case '}':
                return Token.CLOSE_BRACE;
        case '[':
                return Token.OPEN_BRACKET;
        case ']':
                return Token.CLOSE_BRACKET;
        case '(':
                return Token.OPEN_PARENS;
        case ',':
                return Token.COMMA;
        case ':':
                return Token.COLON;
        case ';':
                return Token.SEMICOLON;
        case '~':
                return Token.TILDE;
        case '?':
                return Token.INTERR;

        case ')': {
                if (deambiguate_close_parens == 0)
                        return Token.CLOSE_PARENS;

                deambiguate_close_parens--;

                // Peek at the token after the `)' and rewind.
                int paren_pos = reader.Position;
                int following = token ();
                reader.Position = paren_pos;
                putback_char = -1;

                if (following == Token.OPEN_PARENS)
                        return Token.CLOSE_PARENS_OPEN_PARENS;
                if (following == Token.MINUS)
                        return Token.CLOSE_PARENS_MINUS;

                return IsCastToken (following) ? Token.CLOSE_PARENS_CAST : Token.CLOSE_PARENS_NO_CAST;
        }

        case '<': {
                // Already inside a generic argument list: every `<' nests.
                int depth_before = parsing_generic_less_than;
                parsing_generic_less_than = depth_before + 1;
                if (depth_before > 0)
                        return Token.OP_GENERICS_LT;

                // Try the generic reading on the upcoming tokens, then rewind.
                int angle_pos = reader.Position;
                bool opens_generic = parse_less_than ();
                reader.Position = angle_pos;
                putback_char = -1;

                if (opens_generic) {
                        parsing_generic_less_than++;
                        return Token.OP_GENERICS_LT;
                }
                parsing_generic_less_than = 0;

                int after_lt = peekChar ();
                if (after_lt == '=') {
                        doread = true;
                        return Token.OP_LE;
                }
                if (after_lt != '<')
                        return Token.OP_LT;

                getChar ();
                if (peekChar () != '=')
                        return Token.OP_SHIFT_LEFT;

                doread = true;
                return Token.OP_SHIFT_LEFT_ASSIGN;
        }

        case '>': {
                if (parsing_generic_less_than > 0) {
                        parsing_generic_less_than--;
                        return Token.OP_GENERICS_GT;
                }

                int after_gt = peekChar ();
                if (after_gt == '=') {
                        doread = true;
                        return Token.OP_GE;
                }
                if (after_gt != '>')
                        return Token.OP_GT;

                getChar ();
                if (peekChar () != '=')
                        return Token.OP_SHIFT_RIGHT;

                doread = true;
                return Token.OP_SHIFT_RIGHT_ASSIGN;
        }
        }

        // Everything below is decided by one character of look-ahead.
        int next = peekChar ();

        switch (c) {
        case '+':
                if (next == '+') {
                        doread = true;
                        return Token.OP_INC;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_ADD_ASSIGN;
                }
                return Token.PLUS;

        case '-':
                if (next == '-') {
                        doread = true;
                        return Token.OP_DEC;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_SUB_ASSIGN;
                }
                if (next == '>') {
                        doread = true;
                        return Token.OP_PTR;
                }
                return Token.MINUS;

        case '!':
                if (next != '=')
                        return Token.BANG;
                doread = true;
                return Token.OP_NE;

        case '=':
                if (next != '=')
                        return Token.ASSIGN;
                doread = true;
                return Token.OP_EQ;

        case '&':
                if (next == '&') {
                        doread = true;
                        return Token.OP_AND;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_AND_ASSIGN;
                }
                return Token.BITWISE_AND;

        case '|':
                if (next == '|') {
                        doread = true;
                        return Token.OP_OR;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_OR_ASSIGN;
                }
                return Token.BITWISE_OR;

        case '*':
                if (next != '=')
                        return Token.STAR;
                doread = true;
                return Token.OP_MULT_ASSIGN;

        case '/':
                if (next != '=')
                        return Token.DIV;
                doread = true;
                return Token.OP_DIV_ASSIGN;

        case '%':
                if (next != '=')
                        return Token.PERCENT;
                doread = true;
                return Token.OP_MOD_ASSIGN;

        case '^':
                if (next != '=')
                        return Token.CARRET;
                doread = true;
                return Token.OP_XOR_ASSIGN;
        }

        return Token.ERROR;
}
661 \r
662                 int deambiguate_close_parens = 0;\r
663 \r
//
// Pushes a `)' back onto the input and records one more pending
// request for is_punct to classify a close parenthesis by the token
// that follows it.
//
public void Deambiguate_CloseParens ()
{
        putback (')');
        deambiguate_close_parens += 1;
}
669 \r
//
// Reports error 1021 at the current location.
//
void Error_NumericConstantTooLong ()
{
        const int error_code = 1021;

        Report.Error (error_code, Location, "Numeric constant too long");
}
674                 \r
675                 bool decimal_digits (int c)\r
676                 {\r
                            //
                            // Appends `c' to number_builder (unless it is -1), then appends and
                            // consumes every decimal digit that follows in the input.
                            //
                            // Returns true only if the loop consumed at least one digit; `c'
                            // itself is not counted, so decimal_digits ('.') tells the caller
                            // whether any digit follows the dot.
                            //
677                         int d;\r
678                         bool seen_digits = false;\r
679                         \r
680                         if (c != -1){\r
681                                 if (number_pos == max_number_size)\r
682                                         Error_NumericConstantTooLong ();\r
683                                 number_builder [number_pos++] = (char) c;\r
684                         }\r
685                         \r
686                         //\r
687                         // We use peekChar2, because decimal_digits needs to do a \r
688                         // 2-character look-ahead (5.ToString for example).\r
689                         //\r
690                         while ((d = peekChar2 ()) != -1){\r
691                                 if (d >= '0' && d <= '9'){\r
692                                         if (number_pos == max_number_size)\r
693                                                 Error_NumericConstantTooLong ();\r
694                                         number_builder [number_pos++] = (char) d;\r
                                            // peekChar2 only looked at the digit; consume it now.
695                                         getChar ();\r
696                                         seen_digits = true;\r
697                                 } else\r
698                                         break;\r
699                         }\r
700                         \r
701                         return seen_digits;\r
702                 }\r
703 \r
//
// Returns true when `e' is an ASCII hexadecimal digit:
// 0-9, a-f or A-F.
//
bool is_hex (int e)
{
        if (e >= '0' && e <= '9')
                return true;

        if (e >= 'a' && e <= 'f')
                return true;

        return e >= 'A' && e <= 'F';
}
708                 \r
709                 void hex_digits (int c)\r
710                 {\r
                            //
                            // Appends `c' to number_builder unless it is -1.  Unlike
                            // decimal_digits this reads nothing further from the input and
                            // does not check number_pos against max_number_size.
                            //
                            // NOTE(review): handle_hex does its own digit scanning and does
                            // not call this; check whether anything still uses it.
                            //
711                         if (c != -1)\r
712                                 number_builder [number_pos++] = (char) c;\r
713                         \r
714                 }\r
715                 \r
//
// Maps a real-literal suffix character to its literal token:
// F/f -> LITERAL_FLOAT, D/d -> LITERAL_DOUBLE, M/m -> LITERAL_DECIMAL.
// Any other character yields Token.NONE.
//
int real_type_suffix (int c)
{
        if (c == 'F' || c == 'f')
                return Token.LITERAL_FLOAT;

        if (c == 'D' || c == 'd')
                return Token.LITERAL_DOUBLE;

        if (c == 'M' || c == 'm')
                return Token.LITERAL_DECIMAL;

        return Token.NONE;
}
735 \r
736                 int integer_type_suffix (ulong ul, int c)\r
737                 {\r
                            //
                            // Consumes an optional U/u and L/l suffix and stores `ul' in `val',
                            // boxed as the first type that can hold it:
                            //
                            //   U and L : ulong
                            //   U only  : uint, ulong
                            //   L only  : long, ulong
                            //   none    : int, uint, long, ulong
                            //
                            // `c' is the next input character (-1 skips the suffix scan).
                            // The callers in this section pass a character that is still
                            // pending in the input, which is why each accepted suffix letter
                            // is consumed here with getChar ().
                            //
                            // Always returns Token.LITERAL_INTEGER.
                            //
738                         bool is_unsigned = false;\r
739                         bool is_long = false;\r
740 \r
741                         if (c != -1){\r
742                                 bool scanning = true;\r
743                                 do {\r
744                                         switch (c){\r
745                                         case 'U': case 'u':\r
                                                    // A second U ends the scan, but is still consumed below.
746                                                 if (is_unsigned)\r
747                                                         scanning = false;\r
748                                                 is_unsigned = true;\r
749                                                 getChar ();\r
750                                                 break;\r
751 \r
752                                         case 'l':\r
753                                                 if (!is_unsigned){\r
754                                                         //\r
755                                                         // if we have not seen anything in between\r
756                                                         // report this error\r
757                                                         //\r
758                                                         Report.Warning (\r
759                                                                 78, Location,\r
760                                                         "the 'l' suffix is easily confused with digit `1'," +\r
761                                                         " use 'L' for clarity");\r
762                                                 }\r
763                                                 goto case 'L';\r
764                                                 \r
765                                         case 'L': \r
                                                    // A second L ends the scan, but is still consumed below.
766                                                 if (is_long)\r
767                                                         scanning = false;\r
768                                                 is_long = true;\r
769                                                 getChar ();\r
770                                                 break;\r
771                                                 \r
772                                         default:\r
773                                                 scanning = false;\r
774                                                 break;\r
775                                         }\r
                                            // Look at the next character without consuming it.
776                                         c = peekChar ();\r
777                                 } while (scanning);\r
778                         }\r
779 \r
780                         if (is_long && is_unsigned){\r
781                                 val = ul;\r
782                                 return Token.LITERAL_INTEGER;\r
783                         } else if (is_unsigned){\r
784                                 // uint if possible, or ulong else.\r
785 \r
786                                 if ((ul & 0xffffffff00000000) == 0)\r
787                                         val = (uint) ul;\r
788                                 else\r
789                                         val = ul;\r
790                         } else if (is_long){\r
791                                 // long if possible, ulong otherwise\r
792                                 if ((ul & 0x8000000000000000) != 0)\r
793                                         val = ul;\r
794                                 else\r
795                                         val = (long) ul;\r
796                         } else {\r
797                                 // int, uint, long or ulong in that order\r
798                                 if ((ul & 0xffffffff00000000) == 0){\r
799                                         uint ui = (uint) ul;\r
800                                         \r
801                                         if ((ui & 0x80000000) != 0)\r
802                                                 val = ui;\r
803                                         else\r
804                                                 val = (int) ui;\r
805                                 } else {\r
806                                         if ((ul & 0x8000000000000000) != 0)\r
807                                                 val = ul;\r
808                                         else\r
809                                                 val = (long) ul;\r
810                                 }\r
811                         }\r
812                         return Token.LITERAL_INTEGER;\r
813                 }\r
814                                 \r
815                 //\r
816                 // Converts the decimal digits collected in number_builder to an\r
817                 // integer and, given `c' as the next char in the input, lets\r
818                 // integer_type_suffix pick the best representation for it.\r
                    //
                    // Literals longer than 9 digits are accumulated as ulong, shorter
                    // ones as uint; both use checked arithmetic.  On overflow error
                    // 1021 is reported, `val' is set to 0 and LITERAL_INTEGER is
                    // still returned.
                    //
                    // NOTE(review): number_builder [0] is read without checking that
                    // number_pos is greater than zero.
819                 //\r
820                 int adjust_int (int c)\r
821                 {\r
822                         try {\r
823                                 if (number_pos > 9){\r
824                                         ulong ul = (uint) (number_builder [0] - '0');\r
825 \r
826                                         for (int i = 1; i < number_pos; i++){\r
827                                                 ul = checked ((ul * 10) + ((uint)(number_builder [i] - '0')));\r
828                                         }\r
829                                         return integer_type_suffix (ul, c);\r
830                                 } else {\r
831                                         uint ui = (uint) (number_builder [0] - '0');\r
832 \r
833                                         for (int i = 1; i < number_pos; i++){\r
834                                                 ui = checked ((ui * 10) + ((uint)(number_builder [i] - '0')));\r
835                                         }\r
836                                         return integer_type_suffix (ui, c);\r
837                                 }\r
838                         } catch (OverflowException) {\r
839                                 error_details = "Integral constant is too large";\r
840                                 Report.Error (1021, Location, error_details);\r
841                                 val = 0ul;\r
842                                 return Token.LITERAL_INTEGER;\r
843                         }\r
844                 }\r
845                 \r
//
// Converts the text collected in number_builder to the real type selected
// by `t' and stores the boxed result in `val'.
//
// `t' is Token.LITERAL_DECIMAL, LITERAL_FLOAT, LITERAL_DOUBLE or NONE; NONE
// means "no suffix" and is treated as double.  Returns the literal token
// to hand to the parser (LITERAL_DOUBLE when NONE was passed in, otherwise
// `t' unchanged).
//
// A constant outside the range of its type reports error 594 and stores
// zero.  For float and double, a parse result of infinity is treated the
// same as an OverflowException: narrowing a double to float with a cast
// never throws, and some runtimes return infinity from Double.Parse rather
// than throwing, so checking for the exception alone misses both cases.
//
int adjust_real (int t)
{
        string s = new String (number_builder, 0, number_pos);

        switch (t){
        case Token.LITERAL_DECIMAL:
                try {
                        val = System.Decimal.Parse (s, styles, csharp_format_info);
                } catch (OverflowException) {
                        val = 0m;
                        error_details = "Floating-point constant is outside the range of the type 'decimal'";
                        Report.Error (594, Location, error_details);
                }
                break;

        case Token.LITERAL_FLOAT:
                float f;
                bool float_ok;

                try {
                        f = (float) System.Double.Parse (s, styles, csharp_format_info);
                        // A literal made of digits can only become infinite by overflowing.
                        float_ok = !System.Single.IsInfinity (f);
                } catch (OverflowException) {
                        f = 0.0f;
                        float_ok = false;
                }

                if (float_ok)
                        val = f;
                else {
                        val = 0.0f;
                        error_details = "Floating-point constant is outside the range of the type 'float'";
                        Report.Error (594, Location, error_details);
                }
                break;

        case Token.LITERAL_DOUBLE:
        case Token.NONE:
                t = Token.LITERAL_DOUBLE;

                double d;
                bool double_ok;

                try {
                        d = System.Double.Parse (s, styles, csharp_format_info);
                        double_ok = !System.Double.IsInfinity (d);
                } catch (OverflowException) {
                        d = 0.0;
                        double_ok = false;
                }

                if (double_ok)
                        val = d;
                else {
                        val = 0.0;
                        error_details = "Floating-point constant is outside the range of the type 'double'";
                        Report.Error (594, Location, error_details);
                }
                break;
        }
        return t;
}
884 \r
//
// Scans a hexadecimal integer literal.  is_number calls this after seeing
// '0' and peeking an 'x' or 'X', so the first getChar () consumes that
// letter.
//
// The hex digits are collected in number_builder and converted; then
// integer_type_suffix consumes any U/L suffix and stores the typed value in
// `val'.  Always returns Token.LITERAL_INTEGER.  For a malformed literal
// an error is reported and `val' is set to 0:
//
//   1021  more digits than number_builder is checked to hold, or a value
//         that does not fit in 64 bits
//   1013  "0x" with no hex digit after it
//
int handle_hex ()
{
        int d;
        ulong ul;
        bool too_long = false;

        getChar ();
        while ((d = peekChar ()) != -1 && is_hex (d)){
                //
                // Same limit decimal_digits checks before storing.  Past it
                // the digits are still consumed, so the whole literal is
                // skipped, but they are no longer stored.
                //
                if (number_pos == max_number_size)
                        too_long = true;
                else
                        number_builder [number_pos++] = (char) d;
                getChar ();
        }

        if (too_long){
                Error_NumericConstantTooLong ();
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }

        //
        // Parsing an empty string throws FormatException, which nothing
        // here catches; report the bad literal instead.
        //
        if (number_pos == 0){
                error_details = "Invalid number";
                Report.Error (1013, Location, error_details);
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }

        string s = new String (number_builder, 0, number_pos);
        try {
                // Up to 8 hex digits always fit in 32 bits.
                if (number_pos <= 8)
                        ul = System.UInt32.Parse (s, NumberStyles.HexNumber);
                else
                        ul = System.UInt64.Parse (s, NumberStyles.HexNumber);
        } catch (OverflowException){
                error_details = "Integral constant is too large";
                Report.Error (1021, Location, error_details);
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }

        return integer_type_suffix (ul, peekChar ());
}
914 \r
915                 //\r
916                 // Invoked if we know we have .digits or digits\r
                    //
                    // `c' is the first character of the literal (a digit or '.'); it has
                    // already been read by the caller.  The text of the number is built
                    // in number_builder, the value ends up in `val', and the return value
                    // is the literal token (LITERAL_INTEGER, LITERAL_FLOAT, LITERAL_DOUBLE
                    // or LITERAL_DECIMAL).
917                 //\r
918                 int is_number (int c)\r
919                 {\r
920                         bool is_real = false;\r
921                         int type;\r
922 \r
923                         number_pos = 0;\r
924 \r
925                         if (c >= '0' && c <= '9'){\r
926                                 if (c == '0'){\r
927                                         int peek = peekChar ();\r
928 \r
929                                         if (peek == 'x' || peek == 'X')\r
930                                                 return handle_hex ();\r
931                                 }\r
932                                 decimal_digits (c);\r
                                    // First character after the integer part.
933                                 c = getChar ();\r
934                         }\r
935 \r
936                         //\r
937                         // We need to handle the case of\r
938                         // "1.1" vs "1.string" (LITERAL_FLOAT vs NUMBER DOT IDENTIFIER)\r
939                         //\r
940                         if (c == '.'){\r
941                                 if (decimal_digits ('.')){\r
942                                         is_real = true;\r
943                                         c = getChar ();\r
944                                 } else {\r
                                            // No digit after the dot: give the '.' back to the input,
                                            // drop it from number_builder and finish as an integer.
945                                         putback ('.');\r
946                                         number_pos--;\r
947                                         return adjust_int (-1);\r
948                                 }\r
949                         }\r
950                         \r
951                         if (c == 'e' || c == 'E'){\r
952                                 is_real = true;\r
953                                 if (number_pos == max_number_size)\r
954                                         Error_NumericConstantTooLong ();\r
955                                 number_builder [number_pos++] = 'e';\r
956                                 c = getChar ();\r
957                                 \r
                                    // With an explicit sign, store it and pass -1 so that
                                    // decimal_digits stores nothing extra.  Without one, store
                                    // '+' and let decimal_digits store `c' itself.
                                    // NOTE(review): in the unsigned case `c' is stored without
                                    // checking that it is a digit.
958                                 if (c == '+'){\r
959                                         if (number_pos == max_number_size)\r
960                                                 Error_NumericConstantTooLong ();\r
961                                         number_builder [number_pos++] = '+';\r
962                                         c = -1;\r
963                                 } else if (c == '-') {\r
964                                         if (number_pos == max_number_size)\r
965                                                 Error_NumericConstantTooLong ();\r
966                                         number_builder [number_pos++] = '-';\r
967                                         c = -1;\r
968                                 } else {\r
969                                         if (number_pos == max_number_size)\r
970                                                 Error_NumericConstantTooLong ();\r
971                                         number_builder [number_pos++] = '+';\r
972                                 }\r
973                                         \r
974                                 decimal_digits (c);\r
975                                 c = getChar ();\r
976                         }\r
977 \r
978                         type = real_type_suffix (c);\r
979                         if (type == Token.NONE && !is_real){\r
                                    // Plain integer: `c' goes back to the input so that
                                    // integer_type_suffix can consume it if it is a U/L suffix.
980                                 putback (c);\r
981                                 return adjust_int (c);\r
982                         } else \r
983                                 is_real = true;\r
984 \r
                            // No real suffix: `c' is not part of the literal.
985                         if (type == Token.NONE){\r
986                                 putback (c);\r
987                         }\r
988                         \r
989                         if (is_real)\r
990                                 return adjust_real (type);\r
991 \r
                            // Not reached: is_real is always true by this point.
992                         Console.WriteLine ("This should not be reached");\r
993                         throw new Exception ("Is Number should never reach this point");\r
994                 }\r
995 \r
996                 //\r
997                 // Reads the hex digits of an escape sequence: exactly `count' digits,\r
                    // or one to four digits when count is -1.
                    //
                    // The first getChar () discards one character before any digit is
                    // read; escape () calls this having only peeked at the x/u/U letter.
                    // If a non-hex character is read where a digit is required, `error'
                    // is set and 0 is returned (that character has been consumed).
998                 //\r
999                 int getHex (int count, out bool error)\r
1000                 {\r
1001                         int i;\r
1002                         int total = 0;\r
1003                         int c;\r
1004                         int top = count != -1 ? count : 4;\r
1005                         \r
1006                         getChar ();\r
1007                         error = false;\r
1008                         for (i = 0; i < top; i++){\r
1009                                 c = getChar ();\r
1010                                 \r
1011                                 if (c >= '0' && c <= '9')\r
1012                                         c = (int) c - (int) '0';\r
1013                                 else if (c >= 'A' && c <= 'F')\r
1014                                         c = (int) c - (int) 'A' + 10;\r
1015                                 else if (c >= 'a' && c <= 'f')\r
1016                                         c = (int) c - (int) 'a' + 10;\r
1017                                 else {\r
1018                                         error = true;\r
1019                                         return 0;\r
1020                                 }\r
1021                                 \r
1022                                 total = (total * 16) + c;\r
                                     // Variable-length form: stop as soon as the next
                                     // character is not a hex digit.
1023                                 if (count == -1){\r
1024                                         int p = peekChar ();\r
1025                                         if (p == -1)\r
1026                                                 break;\r
1027                                         if (!is_hex ((char)p))\r
1028                                                 break;\r
1029                                 }\r
1030                         }\r
1031                         return total;\r
1032                 }\r
1033 \r
1034                 int escape (int c)\r
1035                 {\r
                             //
                             // Translates an escape sequence.  `c' is the character just read;
                             // if it is not a backslash it is returned unchanged.  Otherwise the
                             // character after the backslash selects the result:
                             //
                             //   simple escapes (\n, \t, \\, ...)  the mapped character; the
                             //                                     selector is consumed by the
                             //                                     final getChar ()
                             //   \x, \u, \U                        the value read by getHex
                             //   anything else                     error 1009; the selector is
                             //                                     returned and, when it was
                             //                                     only peeked, not consumed
                             //
                             // Note that the next character is peeked even when `c' is not a
                             // backslash.
                             //
1036                         bool error;\r
1037                         int d;\r
1038                         int v;\r
1039 \r
1040                         d = peekChar ();\r
1041                         if (c != '\\')\r
1042                                 return c;\r
1043                         \r
1044                         switch (d){\r
1045                         case 'a':\r
1046                                 v = '\a'; break;\r
1047                         case 'b':\r
1048                                 v = '\b'; break;\r
1049                         case 'n':\r
1050                                 v = '\n'; break;\r
1051                         case 't':\r
1052                                 v = '\t'; break;\r
1053                         case 'v':\r
1054                                 v = '\v'; break;\r
1055                         case 'r':\r
1056                                 v = '\r'; break;\r
1057                         case '\\':\r
1058                                 v = '\\'; break;\r
1059                         case 'f':\r
1060                                 v = '\f'; break;\r
1061                         case '0':\r
1062                                 v = 0; break;\r
1063                         case '"':\r
1064                                 v = '"'; break;\r
1065                         case '\'':\r
1066                                 v = '\''; break;\r
1067                         case 'x':\r
                                     // -1 selects getHex's one-to-four digit mode.
1068                                 v = getHex (-1, out error);\r
1069                                 if (error)\r
1070                                         goto default;\r
1071                                 return v;\r
1072                         case 'u':\r
1073                                 v = getHex (4, out error);\r
1074                                 if (error)\r
1075                                         goto default;\r
1076                                 return v;\r
1077                         case 'U':\r
1078                                 v = getHex (8, out error);\r
1079                                 if (error)\r
1080                                         goto default;\r
1081                                 return v;\r
1082                         default:\r
1083                                 Report.Error (1009, Location, "Unrecognized escape sequence in " + (char)d);\r
1084                                 return d;\r
1085                         }\r
                             // Consume the selector character that was only peeked above.
1086                         getChar ();\r
1087                         return v;\r
1088                 }\r
1089 \r
//
// Returns the next input character and consumes it.  A character held in
// the putback buffer is handed out first (and the buffer emptied);
// otherwise the character comes from reader.Read ().
//
int getChar ()
{
        int pending = putback_char;

        if (pending == -1)
                return reader.Read ();

        putback_char = -1;
        return pending;
}
1100 \r
//
// Returns the next input character without consuming it.  If the putback
// buffer is empty, one character is read from the reader and parked in the
// buffer so that the next getChar () returns it.
//
int peekChar ()
{
        if (putback_char == -1)
                putback_char = reader.Read ();

        return putback_char;
}
1108 \r
//
// Like peekChar, but leaves the putback buffer untouched: when the buffer
// is empty the character comes from reader.Peek () instead of being read
// and parked.
//
int peekChar2 ()
{
        return putback_char != -1 ? putback_char : reader.Peek ();
}
1115                 \r
//
// Stores `c' in the one-character putback buffer so that the next
// getChar () / peekChar () returns it.
//
// The buffer holds a single character: if one is already pending, the
// position and both characters are written to the console and an
// Exception is thrown.
//
void putback (int c)
{
        if (putback_char == -1){
                putback_char = c;
                return;
        }

        Console.WriteLine ("Col: " + col);
        Console.WriteLine ("Row: " + line);
        Console.WriteLine ("Name: " + ref_name.Name);
        Console.WriteLine ("Current [{0}] putting back [{1}]  ", putback_char, c);
        throw new Exception ("This should not happen putback on putback");
}
1127 \r
//
// Returns true while there is more input, i.e. while peeking at the next
// character does not yield -1.  The peeked character stays available for
// the next getChar ().
//
public bool advance ()
{
        int next = peekChar ();

        return next != -1;
}
1132 \r
1133                 public Object Value {\r
                             // Returns `val', the field in which the literal scanners of this
                             // class (integer_type_suffix, adjust_real, ...) store their result.
1134                         get {\r
1135                                 return val;\r
1136                         }\r
1137                 }\r
1138 \r
1139                 public Object value ()\r
1140                 {\r
                             // Method form of the Value property: returns `val'.
                             // Presumably required by the yyParser.yyInput interface this
                             // class implements -- confirm against the interface declaration.
1141                         return val;\r
1142                 }\r
1143 \r
1144                 bool IsCastToken (int token)\r
1145                 {\r
                             //
                             // Returns true when `token' is one of the tokens listed below and
                             // false for every other token.
                             //
                             // NOTE(review): judging by the name, these are presumably the
                             // tokens that may follow the closing parenthesis of a cast; the
                             // caller is outside this section -- confirm.
                             //
1146                         switch (token) {\r
1147                         case Token.BANG:\r
1148                         case Token.TILDE:\r
1149                         case Token.IDENTIFIER:\r
1150                         case Token.LITERAL_INTEGER:\r
1151                         case Token.LITERAL_FLOAT:\r
1152                         case Token.LITERAL_DOUBLE:\r
1153                         case Token.LITERAL_DECIMAL:\r
1154                         case Token.LITERAL_CHARACTER:\r
1155                         case Token.LITERAL_STRING:\r
1156                         case Token.BASE:\r
1157                         case Token.CHECKED:\r
1158                         case Token.FALSE:\r
1159                         case Token.FIXED:\r
1160                         case Token.NEW:\r
1161                         case Token.NULL:\r
1162                         case Token.SIZEOF:\r
1163                         case Token.THIS:\r
1164                         case Token.THROW:\r
1165                         case Token.TRUE:\r
1166                         case Token.TYPEOF:\r
1167                         case Token.UNCHECKED:\r
1168                         case Token.UNSAFE:\r
1169 \r
1170                                 //\r
1171                                 // These can be part of a member access\r
1172                                 //\r
1173                         case Token.INT:\r
1174                         case Token.UINT:\r
1175                         case Token.SHORT:\r
1176                         case Token.USHORT:\r
1177                         case Token.LONG:\r
1178                         case Token.ULONG:\r
1179                         case Token.DOUBLE:\r
1180                         case Token.FLOAT:\r
1181                         case Token.CHAR:\r
1182                                 return true;\r
1183 \r
1184                         default:\r
1185                                 return false;\r
1186                         }\r
1187                 }\r
1188 \r
1189                 public int token ()\r
1190                 {\r
                             //
                             // Returns the next token and records it in current_token.
                             //
                             // Every token except Token.DEFAULT is returned exactly as xtoken ()
                             // produced it.  After DEFAULT the character returned by
                             // consume_whitespace () decides:
                             //
                             //   -1          Token.ERROR
                             //   '('         Token.DEFAULT_OPEN_PARENS (the '(' stays consumed)
                             //   otherwise   the character is put back and DEFAULT is returned
                             //
1191                         current_token = xtoken ();\r
1192 \r
1193                         if (current_token != Token.DEFAULT)\r
1194                                 return current_token;\r
1195 \r
1196                         int c = consume_whitespace ();\r
1197                         if (c == -1)\r
1198                                 current_token = Token.ERROR;\r
1199                         else if (c == '(')\r
1200                                 current_token = Token.DEFAULT_OPEN_PARENS;\r
1201                         else\r
1202                                 putback (c);\r
1203 \r
1204                         return current_token;\r
1205                 }\r
1206 \r
// Scratch buffer shared by every call to get_cmd_arg.
static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();

//
// Splits the rest of the current line into a directive name and its
// argument.
//
//   cmd  the run of identifier characters that follows any leading blanks
//   arg  the remainder of the line with surrounding white space trimmed,
//        or "" when nothing follows the name
//
// Reading stops at the end of the line or of the input.  A consumed '\n'
// increments line and ref_line, a '\r' that ends a scan resets col to 0,
// and tokens_seen is cleared on entry.
//
void get_cmd_arg (out string cmd, out string arg)
{
        int c;

        tokens_seen = false;
        arg = "";
        static_cmd_arg.Length = 0;

        // skip over white space
        while ((c = getChar ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))
                ;

        while ((c != -1) && (c != '\n') && (c != ' ') && (c != '\t') && (c != '\r')){
                if (is_identifier_part_character ((char) c)){
                        static_cmd_arg.Append ((char) c);
                        c = getChar ();
                } else {
                        // Not part of the name: it is re-read below as the
                        // first character of the argument.
                        putback (c);
                        break;
                }
        }

        cmd = static_cmd_arg.ToString ();

        if (c == '\n'){
                line++;
                ref_line++;
                return;
        } else if (c == '\r')
                col = 0;

        // skip over white space
        while ((c = getChar ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))
                ;

        //
        // End of input right after the name (or after trailing blanks):
        // there is no argument.  Without this check (char) -1 would be
        // appended and arg would come back as "\uffff".
        //
        if (c == -1)
                return;

        if (c == '\n'){
                line++;
                ref_line++;
                return;
        } else if (c == '\r'){
                col = 0;
                return;
        }

        static_cmd_arg.Length = 0;
        static_cmd_arg.Append ((char) c);

        while ((c = getChar ()) != -1 && (c != '\n') && (c != '\r')){
                static_cmd_arg.Append ((char) c);
        }

        if (c == '\n'){
                line++;
                ref_line++;
        } else if (c == '\r')
                col = 0;
        arg = static_cmd_arg.ToString ().Trim ();
}
1267 \r
//
// Handles the #line directive.
//
// `arg' is the directive argument as produced by get_cmd_arg:
//
//   default        go back to the real file name and line number
//   hidden         accepted and ignored
//   N              set the reported line number to N
//   N "file"       set the reported line number and the reported file
//
// The number and the file name may be separated by any run of blanks or
// tabs.  Returns false when the argument is empty or cannot be parsed, and
// true otherwise.
//
bool PreProcessLine (string arg)
{
        if (arg == "")
                return false;

        if (arg == "default"){
                ref_line = line;
                ref_name = file_name;
                Location.Push (ref_name);
                return true;
        } else if (arg == "hidden"){
                //
                // We ignore #line hidden
                //
                return true;
        }

        try {
                int pos;
                char [] separators = { ' ', '\t' };

                if ((pos = arg.IndexOfAny (separators)) != -1 && pos != 0){
                        ref_line = System.Int32.Parse (arg.Substring (0, pos));
                        pos++;

                        char [] quotes = { '\"' };

                        //
                        // Drop the remaining separators before stripping the
                        // quotes; otherwise the opening quote is not at the
                        // start of the string and stays in the name.
                        //
                        string name = arg.Substring (pos).Trim ().Trim (quotes);
                        ref_name = Location.LookupFile (name);
                        file_name.HasLineDirective = true;
                        ref_name.HasLineDirective = true;
                        Location.Push (ref_name);
                } else {
                        ref_line = System.Int32.Parse (arg);
                }
        } catch {
                // Any failure means the directive is malformed; the return
                // value is the only signal the caller gets.
                return false;
        }

        return true;
}
1311 \r
1312                 //\r
1313                 // Handles #define and #undef\r
1314                 //\r
1315                 void PreProcessDefinition (bool is_define, string arg)\r
1316                 {\r
1317                         if (arg == "" || arg == "true" || arg == "false"){\r
1318                                 Report.Error (1001, Location, "Missing identifer to pre-processor directive");\r
1319                                 return;\r
1320                         }\r
1321 \r
1322                         char[] whitespace = { ' ', '\t' };\r
1323                         if (arg.IndexOfAny (whitespace) != -1){\r
1324                                 Report.Error (1025, Location, "Single-line comment or end-of-line expected");\r
1325                                 return;\r
1326                         }\r
1327 \r
1328                         if (!is_identifier_start_character (arg [0]))\r
1329                                 Report.Error (1001, Location, "Identifier expected: " + arg);\r
1330                         \r
1331                         foreach (char c in arg.Substring (1)){\r
1332                                 if (!is_identifier_part_character (c)){\r
1333                                         Report.Error (1001, Location, "Identifier expected: " + arg);\r
1334                                         return;\r
1335                                 }\r
1336                         }\r
1337 \r
1338                         if (is_define){\r
1339                                 if (defines == null)\r
1340                                         defines = new Hashtable ();\r
1341                                 define (arg);\r
1342                         } else {\r
1343                                 if (defines == null)\r
1344                                         return;\r
1345                                 if (defines.Contains (arg))\r
1346                                         defines.Remove (arg);\r
1347                         }\r
1348                 }\r
1349 \r
1350                 bool eval_val (string s)\r
1351                 {\r
1352                         if (s == "true")\r
1353                                 return true;\r
1354                         if (s == "false")\r
1355                                 return false;\r
1356                         \r
1357                         if (defines == null)\r
1358                                 return false;\r
1359                         if (defines.Contains (s))\r
1360                                 return true;\r
1361 \r
1362                         return false;\r
1363                 }\r
1364 \r
1365                 bool pp_primary (ref string s)\r
1366                 {\r
1367                         s = s.Trim ();\r
1368                         int len = s.Length;\r
1369 \r
1370                         if (len > 0){\r
1371                                 char c = s [0];\r
1372                                 \r
1373                                 if (c == '('){\r
1374                                         s = s.Substring (1);\r
1375                                         bool val = pp_expr (ref s);\r
1376                                         if (s.Length > 0 && s [0] == ')'){\r
1377                                                 s = s.Substring (1);\r
1378                                                 return val;\r
1379                                         }\r
1380                                         Error_InvalidDirective ();\r
1381                                         return false;\r
1382                                 }\r
1383                                 \r
1384                                 if (is_identifier_start_character (c)){\r
1385                                         int j = 1;\r
1386 \r
1387                                         while (j < len){\r
1388                                                 c = s [j];\r
1389                                                 \r
1390                                                 if (is_identifier_part_character (c)){\r
1391                                                         j++;\r
1392                                                         continue;\r
1393                                                 }\r
1394                                                 bool v = eval_val (s.Substring (0, j));\r
1395                                                 s = s.Substring (j);\r
1396                                                 return v;\r
1397                                         }\r
1398                                         bool vv = eval_val (s);\r
1399                                         s = "";\r
1400                                         return vv;\r
1401                                 }\r
1402                         }\r
1403                         Error_InvalidDirective ();\r
1404                         return false;\r
1405                 }\r
1406                 \r
1407                 bool pp_unary (ref string s)\r
1408                 {\r
1409                         s = s.Trim ();\r
1410                         int len = s.Length;\r
1411 \r
1412                         if (len > 0){\r
1413                                 if (s [0] == '!'){\r
1414                                         if (len > 1 && s [1] == '='){\r
1415                                                 Error_InvalidDirective ();\r
1416                                                 return false;\r
1417                                         }\r
1418                                         s = s.Substring (1);\r
1419                                         return ! pp_primary (ref s);\r
1420                                 } else\r
1421                                         return pp_primary (ref s);\r
1422                         } else {\r
1423                                 Error_InvalidDirective ();\r
1424                                 return false;\r
1425                         }\r
1426                 }\r
1427                 \r
1428                 bool pp_eq (ref string s)\r
1429                 {\r
1430                         bool va = pp_unary (ref s);\r
1431 \r
1432                         s = s.Trim ();\r
1433                         int len = s.Length;\r
1434                         if (len > 0){\r
1435                                 if (s [0] == '='){\r
1436                                         if (len > 2 && s [1] == '='){\r
1437                                                 s = s.Substring (2);\r
1438                                                 return va == pp_unary (ref s);\r
1439                                         } else {\r
1440                                                 Error_InvalidDirective ();\r
1441                                                 return false;\r
1442                                         }\r
1443                                 } else if (s [0] == '!' && len > 1 && s [1] == '='){\r
1444                                         s = s.Substring (2);\r
1445 \r
1446                                         return va != pp_unary (ref s);\r
1447 \r
1448                                 } \r
1449                         }\r
1450 \r
1451                         return va;\r
1452                                 \r
1453                 }\r
1454                 \r
1455                 bool pp_and (ref string s)\r
1456                 {\r
1457                         bool va = pp_eq (ref s);\r
1458 \r
1459                         s = s.Trim ();\r
1460                         int len = s.Length;\r
1461                         if (len > 0){\r
1462                                 if (s [0] == '&'){\r
1463                                         if (len > 2 && s [1] == '&'){\r
1464                                                 s = s.Substring (2);\r
1465                                                 return (va & pp_eq (ref s));\r
1466                                         } else {\r
1467                                                 Error_InvalidDirective ();\r
1468                                                 return false;\r
1469                                         }\r
1470                                 } \r
1471                         }\r
1472                         return va;\r
1473                 }\r
1474                 \r
1475                 //\r
1476                 // Evaluates an expression for `#if' or `#elif'\r
1477                 //\r
1478                 bool pp_expr (ref string s)\r
1479                 {\r
1480                         bool va = pp_and (ref s);\r
1481                         s = s.Trim ();\r
1482                         int len = s.Length;\r
1483                         if (len > 0){\r
1484                                 char c = s [0];\r
1485                                 \r
1486                                 if (c == '|'){\r
1487                                         if (len > 2 && s [1] == '|'){\r
1488                                                 s = s.Substring (2);\r
1489                                                 return va | pp_expr (ref s);\r
1490                                         } else {\r
1491                                                 Error_InvalidDirective ();\r
1492                                                 return false;\r
1493                                         }\r
1494                                 } \r
1495                         }\r
1496                         \r
1497                         return va;\r
1498                 }\r
1499 \r
1500                 bool eval (string s)\r
1501                 {\r
1502                         bool v = pp_expr (ref s);\r
1503                         s = s.Trim ();\r
1504                         if (s.Length != 0){\r
1505                                 Error_InvalidDirective ();\r
1506                                 return false;\r
1507                         }\r
1508 \r
1509                         return v;\r
1510                 }\r
1511                 \r
1512                 void Error_InvalidDirective ()\r
1513                 {\r
1514                         Report.Error (1517, Location, "Invalid pre-processor directive");\r
1515                 }\r
1516 \r
1517                 void Error_UnexpectedDirective (string extra)\r
1518                 {\r
1519                         Report.Error (\r
1520                                 1028, Location,\r
1521                                 "Unexpected processor directive (" + extra + ")");\r
1522                 }\r
1523 \r
1524                 void Error_TokensSeen ()\r
1525                 {\r
1526                         Report.Error (\r
1527                                 1032, Location,\r
1528                                 "Cannot define or undefine pre-processor symbols after a token in the file");\r
1529                 }\r
1530                 \r
1531                 //\r
1532                 // if true, then the code continues processing the code\r
1533                 // if false, the code stays in a loop until another directive is\r
1534                 // reached.\r
1535                 //\r
1536                 bool handle_preprocessing_directive (bool caller_is_taking)\r
1537                 {\r
1538                         string cmd, arg;\r
1539                         bool region_directive = false;\r
1540 \r
1541                         get_cmd_arg (out cmd, out arg);\r
1542 \r
1543                         // Eat any trailing whitespaces and single-line comments\r
1544                         if (arg.IndexOf ("//") != -1)\r
1545                                 arg = arg.Substring (0, arg.IndexOf ("//"));\r
1546                         arg = arg.TrimEnd (' ', '\t');\r
1547 \r
1548                         //\r
1549                         // The first group of pre-processing instructions is always processed\r
1550                         //\r
1551                         switch (cmd){\r
1552                         case "pragma":\r
1553                                 if (RootContext.V2)\r
1554                                         return true;\r
1555                                 break;\r
1556                                 \r
1557                         case "line":\r
1558                                 if (!PreProcessLine (arg))\r
1559                                         Report.Error (\r
1560                                                 1576, Location,\r
1561                                                 "Argument to #line directive is missing or invalid");\r
1562                                 return true;\r
1563 \r
1564                         case "region":\r
1565                                 region_directive = true;\r
1566                                 arg = "true";\r
1567                                 goto case "if";\r
1568 \r
1569                         case "endregion":\r
1570                                 region_directive = true;\r
1571                                 goto case "endif";\r
1572                                 \r
1573                         case "if":\r
1574                                 if (arg == ""){\r
1575                                         Error_InvalidDirective ();\r
1576                                         return true;\r
1577                                 }\r
1578                                 bool taking = false;\r
1579                                 if (ifstack == null)\r
1580                                         ifstack = new Stack ();\r
1581 \r
1582                                 if (ifstack.Count == 0){\r
1583                                         taking = true;\r
1584                                 } else {\r
1585                                         int state = (int) ifstack.Peek ();\r
1586                                         if ((state & TAKING) != 0)\r
1587                                                 taking = true;\r
1588                                 }\r
1589 \r
1590                                 if (eval (arg) && taking){\r
1591                                         int push = TAKING | TAKEN_BEFORE | PARENT_TAKING;\r
1592                                         if (region_directive)\r
1593                                                 push |= REGION;\r
1594                                         ifstack.Push (push);\r
1595                                         return true;\r
1596                                 } else {\r
1597                                         int push = (taking ? PARENT_TAKING : 0);\r
1598                                         if (region_directive)\r
1599                                                 push |= REGION;\r
1600                                         ifstack.Push (push);\r
1601                                         return false;\r
1602                                 }\r
1603                                 \r
1604                         case "endif":\r
1605                                 if (ifstack == null || ifstack.Count == 0){\r
1606                                         Error_UnexpectedDirective ("no #if for this #endif");\r
1607                                         return true;\r
1608                                 } else {\r
1609                                         int pop = (int) ifstack.Pop ();\r
1610                                         \r
1611                                         if (region_directive && ((pop & REGION) == 0))\r
1612                                                 Report.Error (1027, Location, "#endif directive expected");\r
1613                                         else if (!region_directive && ((pop & REGION) != 0))\r
1614                                                 Report.Error (1038, Location, "#endregion directive expected");\r
1615                                         \r
1616                                         if (ifstack.Count == 0)\r
1617                                                 return true;\r
1618                                         else {\r
1619                                                 int state = (int) ifstack.Peek ();\r
1620 \r
1621                                                 if ((state & TAKING) != 0)\r
1622                                                         return true;\r
1623                                                 else\r
1624                                                         return false;\r
1625                                         }\r
1626                                 }\r
1627 \r
1628                         case "elif":\r
1629                                 if (ifstack == null || ifstack.Count == 0){\r
1630                                         Error_UnexpectedDirective ("no #if for this #elif");\r
1631                                         return true;\r
1632                                 } else {\r
1633                                         int state = (int) ifstack.Peek ();\r
1634 \r
1635                                         if ((state & REGION) != 0) {\r
1636                                                 Report.Error (1038, Location, "#endregion directive expected");\r
1637                                                 return true;\r
1638                                         }\r
1639 \r
1640                                         if ((state & ELSE_SEEN) != 0){\r
1641                                                 Error_UnexpectedDirective ("#elif not valid after #else");\r
1642                                                 return true;\r
1643                                         }\r
1644 \r
1645                                         if ((state & (TAKEN_BEFORE | TAKING)) != 0)\r
1646                                                 return false;\r
1647 \r
1648                                         if (eval (arg) && ((state & PARENT_TAKING) != 0)){\r
1649                                                 state = (int) ifstack.Pop ();\r
1650                                                 ifstack.Push (state | TAKING | TAKEN_BEFORE);\r
1651                                                 return true;\r
1652                                         } else \r
1653                                                 return false;\r
1654                                 }\r
1655 \r
1656                         case "else":\r
1657                                 if (ifstack == null || ifstack.Count == 0){\r
1658                                         Report.Error (\r
1659                                                 1028, Location,\r
1660                                                 "Unexpected processor directive (no #if for this #else)");\r
1661                                         return true;\r
1662                                 } else {\r
1663                                         int state = (int) ifstack.Peek ();\r
1664 \r
1665                                         if ((state & REGION) != 0) {\r
1666                                                 Report.Error (1038, Location, "#endregion directive expected");\r
1667                                                 return true;\r
1668                                         }\r
1669 \r
1670                                         if ((state & ELSE_SEEN) != 0){\r
1671                                                 Error_UnexpectedDirective ("#else within #else");\r
1672                                                 return true;\r
1673                                         }\r
1674 \r
1675                                         ifstack.Pop ();\r
1676 \r
1677                                         bool ret;\r
1678                                         if ((state & TAKEN_BEFORE) == 0){\r
1679                                                 ret = ((state & PARENT_TAKING) != 0);\r
1680                                         } else\r
1681                                                 ret = false;\r
1682                                         \r
1683                                         if (ret)\r
1684                                                 state |= TAKING;\r
1685                                         else\r
1686                                                 state &= ~TAKING;\r
1687                                         \r
1688                                         ifstack.Push (state | ELSE_SEEN);\r
1689                                         \r
1690                                         return ret;\r
1691                                 }\r
1692                         }\r
1693 \r
1694                         //\r
1695                         // These are only processed if we are in a `taking' block\r
1696                         //\r
1697                         if (!caller_is_taking)\r
1698                                 return false;\r
1699                                         \r
1700                         switch (cmd){\r
1701                         case "define":\r
1702                                 if (any_token_seen){\r
1703                                         Error_TokensSeen ();\r
1704                                         return true;\r
1705                                 }\r
1706                                 PreProcessDefinition (true, arg);\r
1707                                 return true;\r
1708 \r
1709                         case "undef":\r
1710                                 if (any_token_seen){\r
1711                                         Error_TokensSeen ();\r
1712                                         return true;\r
1713                                 }\r
1714                                 PreProcessDefinition (false, arg);\r
1715                                 return true;\r
1716 \r
1717                         case "error":\r
1718                                 Report.Error (1029, Location, "#error: '" + arg + "'");\r
1719                                 return true;\r
1720 \r
1721                         case "warning":\r
1722                                 Report.Warning (1030, Location, "#warning: '" + arg + "'");\r
1723                                 return true;\r
1724                         }\r
1725 \r
1726                         Report.Error (1024, Location, "Preprocessor directive expected (got: " + cmd + ")");\r
1727                         return true;\r
1728 \r
1729                 }\r
1730 \r
1731                 private int consume_string (bool quoted) \r
1732                 {\r
1733                         int c;\r
1734                         string_builder.Length = 0;\r
1735                                                                 \r
1736                         while ((c = getChar ()) != -1){\r
1737                                 if (c == '"'){\r
1738                                         if (quoted && peekChar () == '"'){\r
1739                                                 string_builder.Append ((char) c);\r
1740                                                 getChar ();\r
1741                                                 continue;\r
1742                                         } else {\r
1743                                                 val = string_builder.ToString ();\r
1744                                                 return Token.LITERAL_STRING;\r
1745                                         }\r
1746                                 }\r
1747 \r
1748                                 if (c == '\n'){\r
1749                                         if (!quoted)\r
1750                                                 Report.Error (1010, Location, "Newline in constant");\r
1751                                         line++;\r
1752                                         ref_line++;\r
1753                                         col = 0;\r
1754                                 } else\r
1755                                         col++;\r
1756 \r
1757                                 if (!quoted){\r
1758                                         c = escape (c);\r
1759                                         if (c == -1)\r
1760                                                 return Token.ERROR;\r
1761                                 }\r
1762                                 string_builder.Append ((char) c);\r
1763                         }\r
1764 \r
1765                         Report.Error (1039, Location, "Unterminated string literal");\r
1766                         return Token.EOF;\r
1767                 }\r
1768 \r
1769                 private int consume_identifier (int s, bool quoted) \r
1770                 {\r
1771                         int pos = 1;\r
1772                         int c;\r
1773                         \r
1774                         id_builder [0] = (char) s;\r
1775                                         \r
1776                         while ((c = reader.Read ()) != -1) {\r
1777                                 if (is_identifier_part_character ((char) c)){\r
1778                                         if (pos == max_id_size){\r
1779                                                 Report.Error (645, Location, "Identifier too long (limit is 512 chars)");\r
1780                                                 return Token.ERROR;\r
1781                                         }\r
1782                                         \r
1783                                         id_builder [pos++] = (char) c;\r
1784                                         putback_char = -1;\r
1785                                         col++;\r
1786                                 } else {\r
1787                                         putback_char = c;\r
1788                                         break;\r
1789                                 }\r
1790                         }\r
1791 \r
1792                         //\r
1793                         // Optimization: avoids doing the keyword lookup\r
1794                         // on uppercase letters and _\r
1795                         //\r
1796                         if (s >= 'a'){\r
1797                                 int keyword = GetKeyword (id_builder, pos);\r
1798                                 if (keyword != -1 && !quoted)\r
1799                                 return keyword;\r
1800                         }\r
1801 \r
1802                         //\r
1803                         // Keep identifiers in an array of hashtables to avoid needless\r
1804                         // allocations\r
1805                         //\r
1806 \r
1807                         if (identifiers [pos] != null) {\r
1808                                 val = identifiers [pos][id_builder];\r
1809                                 if (val != null) {\r
1810                                         return Token.IDENTIFIER;\r
1811                                 }\r
1812                         }\r
1813                         else\r
1814                                 identifiers [pos] = new CharArrayHashtable (pos);\r
1815 \r
1816                         val = new String (id_builder, 0, pos);\r
1817 \r
1818                         char [] chars = new char [pos];\r
1819                         Array.Copy (id_builder, chars, pos);\r
1820 \r
1821                         identifiers [pos] [chars] = val;\r
1822 \r
1823                         return Token.IDENTIFIER;\r
1824                 }\r
1825 \r
1826                 int consume_whitespace ()\r
1827                 {\r
1828                         int t;\r
1829                         bool doread = false;\r
1830                         int c;\r
1831 \r
1832                         val = null;\r
1833                         // optimization: eliminate col and implement #directive semantic correctly.\r
1834                         for (;(c = getChar ()) != -1; col++) {\r
1835                                 if (c == ' ')\r
1836                                         continue;\r
1837                                 \r
1838                                 if (c == '\t') {\r
1839                                         col = (((col + 8) / 8) * 8) - 1;\r
1840                                         continue;\r
1841                                 }\r
1842                                 \r
1843                                 if (c == ' ' || c == '\f' || c == '\v' || c == 0xa0)\r
1844                                         continue;\r
1845 \r
1846                                 if (c == '\r') {\r
1847                                         if (peekChar () == '\n')\r
1848                                                 getChar ();\r
1849 \r
1850                                         line++;\r
1851                                         ref_line++;\r
1852                                         col = 0;\r
1853                                         any_token_seen |= tokens_seen;\r
1854                                         tokens_seen = false;\r
1855                                         continue;\r
1856                                 }\r
1857 \r
1858                                 // Handle double-slash comments.\r
1859                                 if (c == '/'){\r
1860                                         int d = peekChar ();\r
1861                                 \r
1862                                         if (d == '/'){\r
1863                                                 getChar ();\r
1864                                                 while ((d = getChar ()) != -1 && (d != '\n') && d != '\r')\r
1865                                                         col++;\r
1866                                                 if (d == '\n'){\r
1867                                                         line++;\r
1868                                                         ref_line++;\r
1869                                                         col = 0;\r
1870                                                 }\r
1871                                                 any_token_seen |= tokens_seen;\r
1872                                                 tokens_seen = false;\r
1873                                                 continue;\r
1874                                         } else if (d == '*'){\r
1875                                                 getChar ();\r
1876 \r
1877                                                 while ((d = getChar ()) != -1){\r
1878                                                         if (d == '*' && peekChar () == '/'){\r
1879                                                                 getChar ();\r
1880                                                                 col++;\r
1881                                                                 break;\r
1882                                                         }\r
1883                                                         if (d == '\n'){\r
1884                                                                 line++;\r
1885                                                                 ref_line++;\r
1886                                                                 col = 0;\r
1887                                                                 any_token_seen |= tokens_seen;\r
1888                                                                 tokens_seen = false;\r
1889                                                         }\r
1890                                                 }\r
1891                                                 continue;\r
1892                                         }\r
1893                                         goto is_punct_label;\r
1894                                 }\r
1895 \r
1896                         is_punct_label:\r
1897                                 // white space\r
1898                                 if (c == '\n'){\r
1899                                         line++;\r
1900                                         ref_line++;\r
1901                                         col = 0;\r
1902                                         any_token_seen |= tokens_seen;\r
1903                                         tokens_seen = false;\r
1904                                         continue;\r
1905                                 }\r
1906 \r
1907                                 /* For now, ignore pre-processor commands */\r
1908                                 // FIXME: In C# the '#' is not limited to appear\r
1909                                 // on the first column.\r
1910                                 if (c == '#' && !tokens_seen){\r
1911                                         bool cont = true;\r
1912                                         \r
1913                                 start_again:\r
1914                                         \r
1915                                         cont = handle_preprocessing_directive (cont);\r
1916 \r
1917                                         if (cont){\r
1918                                                 col = 0;\r
1919                                                 continue;\r
1920                                         }\r
1921                                         col = 1;\r
1922 \r
1923                                         bool skipping = false;\r
1924                                         for (;(c = getChar ()) != -1; col++){\r
1925                                                 if (c == '\n'){\r
1926                                                         col = 0;\r
1927                                                         line++;\r
1928                                                         ref_line++;\r
1929                                                         skipping = false;\r
1930                                                 } else if (c == ' ' || c == '\t' || c == '\v' || c == '\r' || c == 0xa0)\r
1931                                                         continue;\r
1932                                                 else if (c != '#')\r
1933                                                         skipping = true;\r
1934                                                 if (c == '#' && !skipping)\r
1935                                                         goto start_again;\r
1936                                         }\r
1937                                         any_token_seen |= tokens_seen;\r
1938                                         tokens_seen = false;\r
1939                                         if (c == -1)\r
1940                                                 Report.Error (1027, Location, "#endif/#endregion expected");\r
1941                                         continue;\r
1942                                 }\r
1943 \r
1944                                 return c;\r
1945                         }\r
1946 \r
1947                         return -1;\r
1948                 }\r
1949                 \r
/// <summary>
///   Scans the input and returns the next token.
/// </summary>
/// <remarks>
///   The first significant character is obtained from
///   consume_whitespace (); a result of -1 means end of input.
///   `val' is cleared on entry and is assigned directly by this
///   method only for character literals.  `tokens_seen' is raised
///   for every token recognized here.  A `#' that reaches this
///   method is reported as error 1040.
/// </remarks>
/// <returns>
///   Token.EOF at end of input, Token.ERROR for malformed or
///   unrecognized input (with `error_details' describing it),
///   otherwise the token code of the construct that was read.
/// </returns>
public int xtoken ()
{
        int t;
        bool doread = false;
        int c;

        val = null;
        // optimization: eliminate col and implement #directive semantic correctly.

        c = consume_whitespace ();
        if (c == -1)
                return Token.EOF;

        if (is_identifier_start_character ((char)c)){
                tokens_seen = true;
                return consume_identifier (c, false);
        }

        if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){
                tokens_seen = true;
                // is_punct asks for one more character to be consumed
                // when it sets doread.
                if (doread){
                        getChar ();
                        col++;
                }
                return t;
        }

        if (c >= '0' && c <= '9'){
                tokens_seen = true;
                return is_number (c);
        }

        if (c == '.'){
                tokens_seen = true;
                // A dot followed by a digit starts a number (".5");
                // otherwise it is the member access operator.
                int peek = peekChar ();
                if (peek >= '0' && peek <= '9')
                        return is_number (c);
                return Token.DOT;
        }

        if (c == '"'){
                // A string literal is a token like any other; flag it
                // the same way the verbatim (@") path below does.
                tokens_seen = true;
                return consume_string (false);
        }

        if (c == '\''){
                c = getChar ();
                tokens_seen = true;
                if (c == '\''){
                        error_details = "Empty character literal";
                        Report.Error (1011, Location, error_details);
                        return Token.ERROR;
                }
                c = escape (c);
                if (c == -1)
                        return Token.ERROR;
                val = (char) c;
                c = getChar ();

                if (c != '\''){
                        error_details = "Too many characters in character literal";
                        Report.Error (1012, Location, error_details);

                        // Try to recover, read until newline or next "'"
                        while ((c = getChar ()) != -1){
                                if (c == '\n'){
                                        // Only a real line break may advance
                                        // the line counters.
                                        line++;
                                        ref_line++;
                                        col = 0;
                                        break;
                                }
                                col++;
                                if (c == '\'')
                                        break;
                        }
                        return Token.ERROR;
                }
                return Token.LITERAL_CHARACTER;
        }

        if (c == '@') {
                c = getChar ();
                if (c == '"') {
                        tokens_seen = true;
                        return consume_string (true);
                } else if (is_identifier_start_character ((char) c)){
                        tokens_seen = true;
                        return consume_identifier (c, true);
                } else {
                        Report.Error (1033, Location, "'@' must be followed by string constant or identifier");
                }
                // After error 1033 control falls through with `c' holding
                // the character that followed the '@'.
        }

        if (c == '#') {
                error_details = "Preprocessor directives must appear as the first non-whitespace " +
                        "character on a line.";

                Report.Error (1040, Location, error_details);

                return Token.ERROR;
        }

        // Anything else is not a valid token start; hand the offending
        // character back through error_details.
        error_details = ((char)c).ToString ();

        return Token.ERROR;
}

2053 \r
/// <summary>
///   Reports a directive that is still open on the conditional stack.
/// </summary>
/// <remarks>
///   Does nothing when `ifstack' is null or empty.  Otherwise the top
///   entry is popped: error 1038 is reported if its REGION bit is set,
///   error 1027 if it is not.  Only that single entry is examined.
/// </remarks>
public void cleanup ()
{
        if (ifstack == null || ifstack.Count < 1)
                return;

        int pending = (int) ifstack.Pop ();
        bool open_region = (pending & REGION) != 0;

        if (open_region){
                Report.Error (1038, "#endregion directive expected");
                return;
        }

        Report.Error (1027, "#endif directive expected");
}
2065         }\r
2066 }\r
2067 \r