2004-02-14 Francisco Figueiredo Jr. <fxjrlists@yahoo.com.br>
[mono.git] / mcs / gmcs / cs-tokenizer.cs
1 //\r
2 // cs-tokenizer.cs: The Tokenizer for the C# compiler\r
3 //                  This also implements the preprocessor\r
4 //\r
5 // Author: Miguel de Icaza (miguel@gnu.org)\r
6 //\r
7 // Licensed under the terms of the GNU GPL\r
8 //\r
9 // (C) 2001, 2002 Ximian, Inc (http://www.ximian.com)\r
10 //\r
11 \r
12 /*\r
13  * TODO:\r
14  *   Make sure we accept the proper Unicode ranges, per the spec.\r
15  *   Report error 1032\r
16 */\r
17 \r
18 using System;\r
19 using System.Text;\r
20 using System.Collections;\r
21 using System.IO;\r
22 using System.Globalization;\r
23 using System.Reflection;\r
24 \r
25 namespace Mono.CSharp\r
26 {\r
27         /// <summary>\r
28         ///    Tokenizer for C# source code. \r
29         /// </summary>\r
30 \r
31         public class Tokenizer : yyParser.yyInput\r
32         {\r
//
// Character source.  is_punct saves and restores reader.Position
// to rewind the input after a look-ahead.
//
SeekableStreamReader reader;

//
// Both file references are initialised from the constructor's
// `file' argument.
//
public SourceFile ref_name;
public SourceFile file_name;

//
// Position counters; ref_line is what Line and Location report.
//
public int ref_line = 1;
public int line = 1;
public int col = 1;

public int current_token;

//
// Contextual keyword switches.  While a switch is false, GetKeyword
// answers -1 for the corresponding keyword(s):
//   handle_get_set      -> get, set
//   handle_remove_add   -> add, remove
//   handle_assembly     -> assembly
//   handle_constraints  -> where
//
bool handle_get_set;
bool handle_remove_add;
bool handle_assembly;
bool handle_constraints;

//
// Whether tokens have been seen on this line
//
bool tokens_seen;

//
// Whether a token has been seen on the file
// This is needed because `define' is not allowed to be used
// after a token has been seen.
//
bool any_token_seen;

//
// Backing store for TokenValueName; stays null until first use.
//
static Hashtable tokenValues;
57                 \r
//
// Map from token value to token name, built by
// GetTokenValueNameHash the first time it is requested and
// cached in tokenValues afterwards.
//
private static Hashtable TokenValueName {
        get {
                if (tokenValues != null)
                        return tokenValues;

                tokenValues = GetTokenValueNameHash ();
                return tokenValues;
        }
}
67 \r
//
// Reflects over the fields returned by typeof (Token).GetFields ()
// and records every static literal field of type int as
// value -> field name.
//
private static Hashtable GetTokenValueNameHash ()
{
        Hashtable names = new Hashtable ();

        foreach (FieldInfo candidate in typeof (Token).GetFields ()) {
                if (!candidate.IsLiteral || !candidate.IsStatic)
                        continue;
                if (candidate.FieldType != typeof (int))
                        continue;

                names.Add (candidate.GetValue (null), candidate.Name);
        }

        return names;
}
79                 \r
80                 //\r
81                 // Returns a verbose representation of the current location\r
82                 //\r
//
// Formats "<file> (<ref_line>,<col>), Token: <name> <detail>".
// The token name comes from TokenValueName, falling back to the
// numeric value when no name is registered; the detail part is
// only filled in when the current token is Token.ERROR.
//
public string location {
        get {
                string det = "";
                if (current_token == Token.ERROR)
                        det = "detail: " + error_details;

                string token_name = TokenValueName [current_token] as string;
                if (token_name == null)
                        token_name = current_token.ToString ();

                return String.Format ("{0} ({1},{2}), Token: {3} {4}",
                                      ref_name.Name, ref_line, col, token_name, det);
        }
}
106 \r
//
// Reads or writes handle_get_set, the switch GetKeyword checks
// before reporting `get' and `set' as keywords.
//
public bool PropertyParsing {
        get { return handle_get_set; }
        set { handle_get_set = value; }
}
116 \r
//
// Reads or writes handle_assembly, the switch GetKeyword checks
// before reporting `assembly' as a keyword.
//
public bool AssemblyTargetParsing {
        get { return handle_assembly; }
        set { handle_assembly = value; }
}
126 \r
//
// Reads or writes handle_remove_add, the switch GetKeyword checks
// before reporting `add' and `remove' as keywords.
//
public bool EventParsing {
        get { return handle_remove_add; }
        set { handle_remove_add = value; }
}
136 \r
//
// Reads or writes handle_constraints, the switch GetKeyword checks
// before reporting `where' as a keyword.
//
public bool ConstraintsParsing {
        get { return handle_constraints; }
        set { handle_constraints = value; }
}
146                 \r
147                 //\r
148                 // Class variables\r
149                 // \r
//
// Keyword tables, one per keyword length (see AddKeyword and
// GetKeyword); allocated by InitTokens.
//
static CharArrayHashtable [] keywords;

//
// Number parsing settings; the static constructor stores
// NumberStyles.Float and NumberFormatInfo.InvariantInfo here.
//
static NumberStyles styles;
static NumberFormatInfo csharp_format_info;

//
// Values for the associated token returned
//
int putback_char;
object val;

//
// Pre-processor: symbols registered through define ()
//
Hashtable defines;

//
// Bit flags for the pre-processor if stack entries
//
const int TAKING        = 1 << 0;
const int TAKEN_BEFORE  = 1 << 1;
const int ELSE_SEEN     = 1 << 2;
const int PARENT_TAKING = 1 << 3;
const int REGION        = 1 << 4;

//
// pre-processor if stack state:
//
Stack ifstack;

static StringBuilder string_builder;

//
// Identifier scratch buffer and per-length identifier tables.
// Cleanup () drops the tables.
//
const int max_id_size = 512;
static char [] id_builder = new char [max_id_size];
static CharArrayHashtable [] identifiers = new CharArrayHashtable [max_id_size + 1];

//
// Numeric literal scratch buffer; decimal_digits and hex_digits
// append at number_pos.
//
const int max_number_size = 128;
static char [] number_builder = new char [max_number_size];
static int number_pos;
186                 \r
187                 //\r
188                 // Details about the error encountered by the tokenizer\r
189                 //\r
//
// Text appended to `location' when the current token is Token.ERROR.
//
string error_details;

//
// Read-only view of error_details.
//
public string error {
        get { return error_details; }
}
197                 \r
//
// Current value of ref_line (not of `line').
//
public int Line {
        get { return ref_line; }
}
203 \r
//
// Current value of col.
//
public int Col {
        get { return col; }
}
209 \r
//
// Registers keyword `kw' with token value `token'.  Keywords are
// bucketed by length: the table for a given length is created the
// first time a keyword of that length is added.
//
static void AddKeyword (string kw, int token) {
        int length = kw.Length;
        CharArrayHashtable bucket = keywords [length];

        if (bucket == null) {
                bucket = new CharArrayHashtable (length);
                keywords [length] = bucket;
        }

        bucket [kw.ToCharArray ()] = token;
}
216 \r
//
// Allocates the per-length keyword tables (64 slots) and registers
// every keyword.  `yield' and `__yield' are only registered when
// RootContext.V2 is set.
//
static void InitTokens ()
{
        keywords = new CharArrayHashtable [64];

        // Keywords that GetKeyword only reports when the matching
        // handle_* switch is on
        AddKeyword ("add", Token.ADD);
        AddKeyword ("remove", Token.REMOVE);
        AddKeyword ("get", Token.GET);
        AddKeyword ("set", Token.SET);
        AddKeyword ("assembly", Token.ASSEMBLY);
        AddKeyword ("where", Token.WHERE);

        // Built-in types
        AddKeyword ("bool", Token.BOOL);
        AddKeyword ("byte", Token.BYTE);
        AddKeyword ("char", Token.CHAR);
        AddKeyword ("decimal", Token.DECIMAL);
        AddKeyword ("double", Token.DOUBLE);
        AddKeyword ("float", Token.FLOAT);
        AddKeyword ("int", Token.INT);
        AddKeyword ("long", Token.LONG);
        AddKeyword ("object", Token.OBJECT);
        AddKeyword ("sbyte", Token.SBYTE);
        AddKeyword ("short", Token.SHORT);
        AddKeyword ("string", Token.STRING);
        AddKeyword ("uint", Token.UINT);
        AddKeyword ("ulong", Token.ULONG);
        AddKeyword ("ushort", Token.USHORT);
        AddKeyword ("void", Token.VOID);

        // Literals
        AddKeyword ("false", Token.FALSE);
        AddKeyword ("null", Token.NULL);
        AddKeyword ("true", Token.TRUE);

        // Declarations
        AddKeyword ("class", Token.CLASS);
        AddKeyword ("delegate", Token.DELEGATE);
        AddKeyword ("enum", Token.ENUM);
        AddKeyword ("event", Token.EVENT);
        AddKeyword ("explicit", Token.EXPLICIT);
        AddKeyword ("implicit", Token.IMPLICIT);
        AddKeyword ("interface", Token.INTERFACE);
        AddKeyword ("namespace", Token.NAMESPACE);
        AddKeyword ("operator", Token.OPERATOR);
        AddKeyword ("struct", Token.STRUCT);
        AddKeyword ("using", Token.USING);

        // Modifiers
        AddKeyword ("abstract", Token.ABSTRACT);
        AddKeyword ("const", Token.CONST);
        AddKeyword ("extern", Token.EXTERN);
        AddKeyword ("internal", Token.INTERNAL);
        AddKeyword ("out", Token.OUT);
        AddKeyword ("override", Token.OVERRIDE);
        AddKeyword ("params", Token.PARAMS);
        AddKeyword ("private", Token.PRIVATE);
        AddKeyword ("protected", Token.PROTECTED);
        AddKeyword ("public", Token.PUBLIC);
        AddKeyword ("readonly", Token.READONLY);
        AddKeyword ("ref", Token.REF);
        AddKeyword ("sealed", Token.SEALED);
        AddKeyword ("static", Token.STATIC);
        AddKeyword ("unsafe", Token.UNSAFE);
        AddKeyword ("virtual", Token.VIRTUAL);
        AddKeyword ("volatile", Token.VOLATILE);

        // Statements
        AddKeyword ("break", Token.BREAK);
        AddKeyword ("case", Token.CASE);
        AddKeyword ("catch", Token.CATCH);
        AddKeyword ("checked", Token.CHECKED);
        AddKeyword ("continue", Token.CONTINUE);
        AddKeyword ("default", Token.DEFAULT);
        AddKeyword ("do", Token.DO);
        AddKeyword ("else", Token.ELSE);
        AddKeyword ("finally", Token.FINALLY);
        AddKeyword ("fixed", Token.FIXED);
        AddKeyword ("for", Token.FOR);
        AddKeyword ("foreach", Token.FOREACH);
        AddKeyword ("goto", Token.GOTO);
        AddKeyword ("if", Token.IF);
        AddKeyword ("in", Token.IN);
        AddKeyword ("lock", Token.LOCK);
        AddKeyword ("return", Token.RETURN);
        AddKeyword ("switch", Token.SWITCH);
        AddKeyword ("throw", Token.THROW);
        AddKeyword ("try", Token.TRY);
        AddKeyword ("unchecked", Token.UNCHECKED);
        AddKeyword ("while", Token.WHILE);

        // Expressions
        AddKeyword ("as", Token.AS);
        AddKeyword ("base", Token.BASE);
        AddKeyword ("is", Token.IS);
        AddKeyword ("new", Token.NEW);
        AddKeyword ("sizeof", Token.SIZEOF);
        AddKeyword ("stackalloc", Token.STACKALLOC);
        AddKeyword ("this", Token.THIS);
        AddKeyword ("typeof", Token.TYPEOF);

        if (RootContext.V2) {
                AddKeyword ("__yield", Token.YIELD);
                AddKeyword ("yield", Token.YIELD);
        }
}
310 \r
311                 //\r
312                 // Class initializer\r
313                 // \r
//
// Type initializer: fills the keyword tables, selects the number
// parsing settings (NumberStyles.Float with the invariant number
// format) and allocates the shared string builder.
//
static Tokenizer ()
{
        InitTokens ();

        styles = NumberStyles.Float;
        csharp_format_info = NumberFormatInfo.InvariantInfo;

        string_builder = new StringBuilder ();
}
322 \r
//
// Looks `id' up in the keyword table for length `id_len'.
//
// Returns the token value, or -1 when `id' is not a keyword.  The
// keywords get/set, add/remove, assembly and where also yield -1
// while their handle_* switch is off.
//
int GetKeyword (char[] id, int id_len)
{
        if (id_len >= keywords.Length)
                return -1;

        CharArrayHashtable bucket = keywords [id_len];
        if (bucket == null)
                return -1;

        object hit = bucket [id];
        if (hit == null)
                return -1;

        int res = (int) hit;

        switch (res) {
        case Token.GET:
        case Token.SET:
                return handle_get_set ? res : -1;

        case Token.REMOVE:
        case Token.ADD:
                return handle_remove_add ? res : -1;

        case Token.ASSEMBLY:
                return handle_assembly ? res : -1;

        case Token.WHERE:
                return handle_constraints ? res : -1;

        default:
                return res;
        }
}
350 \r
//
// A fresh Location built from ref_line on every read.
//
public Location Location {
        get { return new Location (ref_line); }
}
356 \r
//
// Registers the pre-processor symbol `def' in RootContext.AllDefines
// and in this tokenizer's own `defines' table.  Symbols already
// present are left untouched.
//
// The constructor only allocates `defines' when it is handed a
// non-null list of symbols, so the table is created here on demand
// instead of dereferencing null.
//
void define (string def)
{
        if (!RootContext.AllDefines.Contains (def)){
                RootContext.AllDefines [def] = true;
        }

        if (defines == null)
                defines = new Hashtable ();

        if (defines.Contains (def))
                return;
        defines [def] = true;
}
366                 \r
//
// Creates a tokenizer reading from `input'.
//
//   input: character source
//   file:  stored as both ref_name and file_name, and pushed on
//          Mono.CSharp.Location
//   defs:  initial pre-processor symbols (strings); may be null, in
//          which case no symbol table is allocated here
//
public Tokenizer (SeekableStreamReader input, SourceFile file, ArrayList defs)
{
        reader = input;
        ref_name = file;
        file_name = file;

        putback_char = -1;

        if (defs != null) {
                defines = new Hashtable ();

                foreach (string symbol in defs) {
                        define (symbol);
                }
        }

        //
        // FIXME: This could be `Location.Push' but we have to
        // find out why the MS compiler allows this
        //
        Mono.CSharp.Location.Push (file);
}
387 \r
//
// Drops the reference to the static per-length identifier tables.
//
public static void Cleanup ()
{
        identifiers = null;
}
391 \r
//
// True when `c' may begin an identifier: an underscore, an ASCII
// letter, or any character Char.IsLetter accepts.
//
bool is_identifier_start_character (char c)
{
        if (c == '_')
                return true;
        if (c >= 'a' && c <= 'z')
                return true;
        if (c >= 'A' && c <= 'Z')
                return true;

        return Char.IsLetter (c);
}
396 \r
//
// True when `c' may appear after the first character of an
// identifier.
//
// Besides ASCII letters, digits and `_', this accepts the Unicode
// classes the C# identifier grammar lists for identifier parts:
// letters (including letter numbers), decimal digits, connector
// punctuation and combining marks.
//
// Formatting characters (class Cf) are deliberately still rejected:
// the grammar wants them removed from the identifier, and nothing
// here strips them.
//
bool is_identifier_part_character (char c)
{
        if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || (c >= '0' && c <= '9'))
                return true;

        // No other ASCII character belongs to the accepted classes,
        // so skip the category lookup for them.
        if (c < 0x80)
                return false;

        if (Char.IsLetter (c))
                return true;

        switch (Char.GetUnicodeCategory (c)) {
        case UnicodeCategory.LetterNumber:
        case UnicodeCategory.DecimalDigitNumber:
        case UnicodeCategory.ConnectorPunctuation:
        case UnicodeCategory.NonSpacingMark:
        case UnicodeCategory.SpacingCombiningMark:
                return true;
        }

        return false;
}
401 \r
//
// Look-ahead used after a `<': reads tokens and reports whether they
// have the shape
//
//      name { `<' ... `>' } { `,' name { `<' ... `>' } } `>'
//
// where `name' is an identifier or one of the built-in type
// keywords.  Nested `<' are checked recursively.  Returns false on
// the first token that does not fit.  Tokens are consumed; is_punct
// rewinds the reader afterwards.
//
bool parse_less_than ()
{
        while (true) {
                switch (token ()) {
                case Token.IDENTIFIER:
                case Token.OBJECT:
                case Token.STRING:
                case Token.BOOL:
                case Token.DECIMAL:
                case Token.FLOAT:
                case Token.DOUBLE:
                case Token.SBYTE:
                case Token.BYTE:
                case Token.SHORT:
                case Token.USHORT:
                case Token.INT:
                case Token.UINT:
                case Token.LONG:
                case Token.ULONG:
                case Token.CHAR:
                case Token.VOID:
                        break;

                default:
                        return false;
                }

                // Skip over any nested argument lists that follow the name.
                int next;
                do {
                        next = token ();
                        if (next == Token.OP_GENERICS_LT && !parse_less_than ())
                                return false;
                } while (next == Token.OP_GENERICS_LT);

                if (next == Token.OP_GENERICS_GT)
                        return true;
                if (next != Token.COMMA)
                        return false;

                // A comma: another name must follow.
        }
}
444 \r
bool parsing_less_than = false;

//
// Counter maintained by is_punct: incremented on `<', decremented
// when a `>' is returned as OP_GENERICS_GT, reset to zero when a `<'
// turns out not to be generic.
//
int parsing_generic_less_than = 0;

//
// Maps the punctuation character `c' to its token, peeking at the
// following input to recognise multi-character operators.
//
//   c:      character already read
//   doread: set to true when the caller still has to consume one
//           more character belonging to the token, false otherwise
//
// Returns the token, or Token.ERROR when `c' starts no known token.
//
// `)' and `<' are disambiguated by scanning ahead with token () or
// parse_less_than () and then restoring reader.Position and
// clearing putback_char.
//
int is_punct (char c, ref bool doread)
{
        int next;

        doread = false;

        switch (c) {
        case '{':
                return Token.OPEN_BRACE;
        case '}':
                return Token.CLOSE_BRACE;
        case '[':
                return Token.OPEN_BRACKET;
        case ']':
                return Token.CLOSE_BRACKET;
        case '(':
                return Token.OPEN_PARENS;
        case ',':
                return Token.COMMA;
        case ':':
                return Token.COLON;
        case ';':
                return Token.SEMICOLON;
        case '~':
                return Token.TILDE;
        case '?':
                return Token.INTERR;

        case ')': {
                if (deambiguate_close_parens == 0)
                        return Token.CLOSE_PARENS;

                --deambiguate_close_parens;

                // Scan one token ahead, then rewind.
                int saved_position = reader.Position;
                int following = token ();
                reader.Position = saved_position;
                putback_char = -1;

                if (following == Token.OPEN_PARENS)
                        return Token.CLOSE_PARENS_OPEN_PARENS;
                if (following == Token.MINUS)
                        return Token.CLOSE_PARENS_MINUS;
                if (IsCastToken (following))
                        return Token.CLOSE_PARENS_CAST;
                return Token.CLOSE_PARENS_NO_CAST;
        }

        case '<': {
                // Already inside an argument list: no look-ahead needed.
                if (parsing_generic_less_than++ > 0)
                        return Token.OP_GENERICS_LT;

                // Scan ahead for a complete argument list, then rewind.
                int saved_position = reader.Position;
                bool is_generic_lt = parse_less_than ();
                reader.Position = saved_position;
                putback_char = -1;

                if (is_generic_lt) {
                        parsing_generic_less_than++;
                        return Token.OP_GENERICS_LT;
                }
                parsing_generic_less_than = 0;

                next = peekChar ();
                if (next == '=') {
                        doread = true;
                        return Token.OP_LE;
                }
                if (next != '<')
                        return Token.OP_LT;

                getChar ();
                if (peekChar () == '=') {
                        doread = true;
                        return Token.OP_SHIFT_LEFT_ASSIGN;
                }
                return Token.OP_SHIFT_LEFT;
        }

        case '>': {
                if (parsing_generic_less_than > 0) {
                        parsing_generic_less_than--;
                        return Token.OP_GENERICS_GT;
                }

                next = peekChar ();
                if (next == '=') {
                        doread = true;
                        return Token.OP_GE;
                }
                if (next != '>')
                        return Token.OP_GT;

                getChar ();
                if (peekChar () == '=') {
                        doread = true;
                        return Token.OP_SHIFT_RIGHT_ASSIGN;
                }
                return Token.OP_SHIFT_RIGHT;
        }
        }

        // Every remaining candidate is decided by the next character,
        // so it is peeked once up front (also for unknown characters).
        next = peekChar ();

        switch (c) {
        case '+':
                if (next == '+') {
                        doread = true;
                        return Token.OP_INC;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_ADD_ASSIGN;
                }
                return Token.PLUS;

        case '-':
                if (next == '-') {
                        doread = true;
                        return Token.OP_DEC;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_SUB_ASSIGN;
                }
                if (next == '>') {
                        doread = true;
                        return Token.OP_PTR;
                }
                return Token.MINUS;

        case '!':
                if (next == '=') {
                        doread = true;
                        return Token.OP_NE;
                }
                return Token.BANG;

        case '=':
                if (next == '=') {
                        doread = true;
                        return Token.OP_EQ;
                }
                return Token.ASSIGN;

        case '&':
                if (next == '&') {
                        doread = true;
                        return Token.OP_AND;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_AND_ASSIGN;
                }
                return Token.BITWISE_AND;

        case '|':
                if (next == '|') {
                        doread = true;
                        return Token.OP_OR;
                }
                if (next == '=') {
                        doread = true;
                        return Token.OP_OR_ASSIGN;
                }
                return Token.BITWISE_OR;

        case '*':
                if (next == '=') {
                        doread = true;
                        return Token.OP_MULT_ASSIGN;
                }
                return Token.STAR;

        case '/':
                if (next == '=') {
                        doread = true;
                        return Token.OP_DIV_ASSIGN;
                }
                return Token.DIV;

        case '%':
                if (next == '=') {
                        doread = true;
                        return Token.OP_MOD_ASSIGN;
                }
                return Token.PERCENT;

        case '^':
                if (next == '=') {
                        doread = true;
                        return Token.OP_XOR_ASSIGN;
                }
                return Token.CARRET;
        }

        return Token.ERROR;
}
651 \r
//
// Number of pending `)' characters that is_punct must classify by
// looking at the token that follows them.
//
int deambiguate_close_parens = 0;

//
// Pushes a `)' back onto the input and asks is_punct to classify
// it (plain, followed by `(' or `-', cast, no cast) the next time
// it is read.
//
public void Deambiguate_CloseParens ()
{
        putback (')');
        deambiguate_close_parens += 1;
}
659 \r
//
// Reports error 1021 at the current Location.
//
void Error_NumericConstantTooLong ()
{
        const int error_code = 1021;

        Report.Error (error_code, Location, "Numeric constant too long");
}
664                 \r
//
// Appends `c' (unless it is -1) and every decimal digit that follows
// in the input to number_builder, consuming the digits.
//
// Returns true when at least one digit was read from the input
// (`c' itself does not count).
//
// When the literal does not fit in number_builder, error 1021 is
// reported once per call and the excess characters are consumed but
// not stored, so the buffer is never written past its end.
//
bool decimal_digits (int c)
{
        int d;
        bool seen_digits = false;
        bool overflow_reported = false;

        if (c != -1){
                if (number_pos < max_number_size)
                        number_builder [number_pos++] = (char) c;
                else {
                        Error_NumericConstantTooLong ();
                        overflow_reported = true;
                }
        }

        //
        // We use peekChar2, because decimal_digits needs to do a
        // 2-character look-ahead (5.ToString for example).
        //
        while ((d = peekChar2 ()) != -1){
                if (d < '0' || d > '9')
                        break;

                if (number_pos < max_number_size)
                        number_builder [number_pos++] = (char) d;
                else if (!overflow_reported){
                        Error_NumericConstantTooLong ();
                        overflow_reported = true;
                }

                getChar ();
                seen_digits = true;
        }

        return seen_digits;
}
693 \r
694                 bool is_hex (int e)\r
695                 {\r
696                         return (e >= '0' && e <= '9') || (e >= 'A' && e <= 'F') || (e >= 'a' && e <= 'f');\r
697                 }\r
698                 \r
699                 void hex_digits (int c)\r
700                 {\r
701                         if (c != -1)\r
702                                 number_builder [number_pos++] = (char) c;\r
703                         \r
704                 }\r
705                 \r
706                 int real_type_suffix (int c)\r
707                 {\r
708                         int t;\r
709 \r
710                         switch (c){\r
711                         case 'F': case 'f':\r
712                                 t =  Token.LITERAL_FLOAT;\r
713                                 break;\r
714                         case 'D': case 'd':\r
715                                 t = Token.LITERAL_DOUBLE;\r
716                                 break;\r
717                         case 'M': case 'm':\r
718                                  t= Token.LITERAL_DECIMAL;\r
719                                 break;\r
720                         default:\r
721                                 return Token.NONE;\r
722                         }\r
723                         return t;\r
724                 }\r
725 \r
726                 int integer_type_suffix (ulong ul, int c)\r
727                 {\r
728                         bool is_unsigned = false;\r
729                         bool is_long = false;\r
730 \r
731                         if (c != -1){\r
732                                 bool scanning = true;\r
733                                 do {\r
734                                         switch (c){\r
735                                         case 'U': case 'u':\r
736                                                 if (is_unsigned)\r
737                                                         scanning = false;\r
738                                                 is_unsigned = true;\r
739                                                 getChar ();\r
740                                                 break;\r
741 \r
742                                         case 'l':\r
743                                                 if (!is_unsigned){\r
744                                                         //\r
745                                                         // if we have not seen anything in between\r
746                                                         // report this error\r
747                                                         //\r
748                                                         Report.Warning (\r
749                                                                 78, Location,\r
750                                                         "the 'l' suffix is easily confused with digit `1'," +\r
751                                                         " use 'L' for clarity");\r
752                                                 }\r
753                                                 goto case 'L';\r
754                                                 \r
755                                         case 'L': \r
756                                                 if (is_long)\r
757                                                         scanning = false;\r
758                                                 is_long = true;\r
759                                                 getChar ();\r
760                                                 break;\r
761                                                 \r
762                                         default:\r
763                                                 scanning = false;\r
764                                                 break;\r
765                                         }\r
766                                         c = peekChar ();\r
767                                 } while (scanning);\r
768                         }\r
769 \r
770                         if (is_long && is_unsigned){\r
771                                 val = ul;\r
772                                 return Token.LITERAL_INTEGER;\r
773                         } else if (is_unsigned){\r
774                                 // uint if possible, or ulong else.\r
775 \r
776                                 if ((ul & 0xffffffff00000000) == 0)\r
777                                         val = (uint) ul;\r
778                                 else\r
779                                         val = ul;\r
780                         } else if (is_long){\r
781                                 // long if possible, ulong otherwise\r
782                                 if ((ul & 0x8000000000000000) != 0)\r
783                                         val = ul;\r
784                                 else\r
785                                         val = (long) ul;\r
786                         } else {\r
787                                 // int, uint, long or ulong in that order\r
788                                 if ((ul & 0xffffffff00000000) == 0){\r
789                                         uint ui = (uint) ul;\r
790                                         \r
791                                         if ((ui & 0x80000000) != 0)\r
792                                                 val = ui;\r
793                                         else\r
794                                                 val = (int) ui;\r
795                                 } else {\r
796                                         if ((ul & 0x8000000000000000) != 0)\r
797                                                 val = ul;\r
798                                         else\r
799                                                 val = (long) ul;\r
800                                 }\r
801                         }\r
802                         return Token.LITERAL_INTEGER;\r
803                 }\r
804                                 \r
805                 //\r
806                 // given `c' as the next char in the input decide whether\r
807                 // we need to convert to a special type, and then choose\r
808                 // the best representation for the integer\r
809                 //\r
810                 int adjust_int (int c)\r
811                 {\r
812                         try {\r
813                                 if (number_pos > 9){\r
814                                         ulong ul = (uint) (number_builder [0] - '0');\r
815 \r
816                                         for (int i = 1; i < number_pos; i++){\r
817                                                 ul = checked ((ul * 10) + ((uint)(number_builder [i] - '0')));\r
818                                         }\r
819                                         return integer_type_suffix (ul, c);\r
820                                 } else {\r
821                                         uint ui = (uint) (number_builder [0] - '0');\r
822 \r
823                                         for (int i = 1; i < number_pos; i++){\r
824                                                 ui = checked ((ui * 10) + ((uint)(number_builder [i] - '0')));\r
825                                         }\r
826                                         return integer_type_suffix (ui, c);\r
827                                 }\r
828                         } catch (OverflowException) {\r
829                                 error_details = "Integral constant is too large";\r
830                                 Report.Error (1021, Location, error_details);\r
831                                 val = 0ul;\r
832                                 return Token.LITERAL_INTEGER;\r
833                         }\r
834                 }\r
835                 \r
836                 int adjust_real (int t)\r
837                 {\r
838                         string s = new String (number_builder, 0, number_pos);\r
839 \r
840                         switch (t){\r
841                         case Token.LITERAL_DECIMAL:\r
842                                 try {\r
843                                         val = System.Decimal.Parse (s, styles, csharp_format_info);\r
844                                 } catch (OverflowException) {\r
845                                         val = 0m;     \r
846                                         error_details = "Floating-point constant is outside the range of the type 'decimal'";\r
847                                         Report.Error (594, Location, error_details);\r
848                                 }\r
849                                 break;\r
850                         case Token.LITERAL_FLOAT:\r
851                                 try {\r
852                                         val = (float) System.Double.Parse (s, styles, csharp_format_info);\r
853                                 } catch (OverflowException) {\r
854                                         val = 0.0f;     \r
855                                         error_details = "Floating-point constant is outside the range of the type 'float'";\r
856                                         Report.Error (594, Location, error_details);\r
857                                 }\r
858                                 break;\r
859                                 \r
860                         case Token.LITERAL_DOUBLE:\r
861                         case Token.NONE:\r
862                                 t = Token.LITERAL_DOUBLE;\r
863                                 try {\r
864                                         val = System.Double.Parse (s, styles, csharp_format_info);\r
865                                 } catch (OverflowException) {\r
866                                         val = 0.0;     \r
867                                         error_details = "Floating-point constant is outside the range of the type 'double'";\r
868                                         Report.Error (594, Location, error_details);\r
869                                 }\r
870                                 break;\r
871                         }\r
872                         return t;\r
873                 }\r
874 \r
875                 int handle_hex ()\r
876                 {\r
877                         int d;\r
878                         ulong ul;\r
879                         \r
880                         getChar ();\r
881                         while ((d = peekChar ()) != -1){\r
882                                 if (is_hex (d)){\r
883                                         number_builder [number_pos++] = (char) d;\r
884                                         getChar ();\r
885                                 } else\r
886                                         break;\r
887                         }\r
888                         \r
889                         string s = new String (number_builder, 0, number_pos);\r
890                         try {\r
891                                 if (number_pos <= 8)\r
892                                         ul = System.UInt32.Parse (s, NumberStyles.HexNumber);\r
893                                 else\r
894                                         ul = System.UInt64.Parse (s, NumberStyles.HexNumber);\r
895                         } catch (OverflowException){\r
896                                 error_details = "Integral constant is too large";\r
897                                 Report.Error (1021, Location, error_details);\r
898                                 val = 0ul;\r
899                                 return Token.LITERAL_INTEGER;\r
900                         }\r
901                         \r
902                         return integer_type_suffix (ul, peekChar ());\r
903                 }\r
904 \r
905                 //\r
906                 // Invoked if we know we have .digits or digits\r
907                 //\r
908                 int is_number (int c)\r
909                 {\r
910                         bool is_real = false;\r
911                         int type;\r
912 \r
913                         number_pos = 0;\r
914 \r
915                         if (c >= '0' && c <= '9'){\r
916                                 if (c == '0'){\r
917                                         int peek = peekChar ();\r
918 \r
919                                         if (peek == 'x' || peek == 'X')\r
920                                                 return handle_hex ();\r
921                                 }\r
922                                 decimal_digits (c);\r
923                                 c = getChar ();\r
924                         }\r
925 \r
926                         //\r
927                         // We need to handle the case of\r
928                         // "1.1" vs "1.string" (LITERAL_FLOAT vs NUMBER DOT IDENTIFIER)\r
929                         //\r
930                         if (c == '.'){\r
931                                 if (decimal_digits ('.')){\r
932                                         is_real = true;\r
933                                         c = getChar ();\r
934                                 } else {\r
935                                         putback ('.');\r
936                                         number_pos--;\r
937                                         return adjust_int (-1);\r
938                                 }\r
939                         }\r
940                         \r
941                         if (c == 'e' || c == 'E'){\r
942                                 is_real = true;\r
943                                 if (number_pos == max_number_size)\r
944                                         Error_NumericConstantTooLong ();\r
945                                 number_builder [number_pos++] = 'e';\r
946                                 c = getChar ();\r
947                                 \r
948                                 if (c == '+'){\r
949                                         if (number_pos == max_number_size)\r
950                                                 Error_NumericConstantTooLong ();\r
951                                         number_builder [number_pos++] = '+';\r
952                                         c = -1;\r
953                                 } else if (c == '-') {\r
954                                         if (number_pos == max_number_size)\r
955                                                 Error_NumericConstantTooLong ();\r
956                                         number_builder [number_pos++] = '-';\r
957                                         c = -1;\r
958                                 } else {\r
959                                         if (number_pos == max_number_size)\r
960                                                 Error_NumericConstantTooLong ();\r
961                                         number_builder [number_pos++] = '+';\r
962                                 }\r
963                                         \r
964                                 decimal_digits (c);\r
965                                 c = getChar ();\r
966                         }\r
967 \r
968                         type = real_type_suffix (c);\r
969                         if (type == Token.NONE && !is_real){\r
970                                 putback (c);\r
971                                 return adjust_int (c);\r
972                         } else \r
973                                 is_real = true;\r
974 \r
975                         if (type == Token.NONE){\r
976                                 putback (c);\r
977                         }\r
978                         \r
979                         if (is_real)\r
980                                 return adjust_real (type);\r
981 \r
982                         Console.WriteLine ("This should not be reached");\r
983                         throw new Exception ("Is Number should never reach this point");\r
984                 }\r
985 \r
986                 //\r
987                 // Accepts exactly count (4 or 8) hex, no more no less\r
988                 //\r
989                 int getHex (int count, out bool error)\r
990                 {\r
991                         int i;\r
992                         int total = 0;\r
993                         int c;\r
994                         int top = count != -1 ? count : 4;\r
995                         \r
996                         getChar ();\r
997                         error = false;\r
998                         for (i = 0; i < top; i++){\r
999                                 c = getChar ();\r
1000                                 \r
1001                                 if (c >= '0' && c <= '9')\r
1002                                         c = (int) c - (int) '0';\r
1003                                 else if (c >= 'A' && c <= 'F')\r
1004                                         c = (int) c - (int) 'A' + 10;\r
1005                                 else if (c >= 'a' && c <= 'f')\r
1006                                         c = (int) c - (int) 'a' + 10;\r
1007                                 else {\r
1008                                         error = true;\r
1009                                         return 0;\r
1010                                 }\r
1011                                 \r
1012                                 total = (total * 16) + c;\r
1013                                 if (count == -1){\r
1014                                         int p = peekChar ();\r
1015                                         if (p == -1)\r
1016                                                 break;\r
1017                                         if (!is_hex ((char)p))\r
1018                                                 break;\r
1019                                 }\r
1020                         }\r
1021                         return total;\r
1022                 }\r
1023 \r
1024                 int escape (int c)\r
1025                 {\r
1026                         bool error;\r
1027                         int d;\r
1028                         int v;\r
1029 \r
1030                         d = peekChar ();\r
1031                         if (c != '\\')\r
1032                                 return c;\r
1033                         \r
1034                         switch (d){\r
1035                         case 'a':\r
1036                                 v = '\a'; break;\r
1037                         case 'b':\r
1038                                 v = '\b'; break;\r
1039                         case 'n':\r
1040                                 v = '\n'; break;\r
1041                         case 't':\r
1042                                 v = '\t'; break;\r
1043                         case 'v':\r
1044                                 v = '\v'; break;\r
1045                         case 'r':\r
1046                                 v = '\r'; break;\r
1047                         case '\\':\r
1048                                 v = '\\'; break;\r
1049                         case 'f':\r
1050                                 v = '\f'; break;\r
1051                         case '0':\r
1052                                 v = 0; break;\r
1053                         case '"':\r
1054                                 v = '"'; break;\r
1055                         case '\'':\r
1056                                 v = '\''; break;\r
1057                         case 'x':\r
1058                                 v = getHex (-1, out error);\r
1059                                 if (error)\r
1060                                         goto default;\r
1061                                 return v;\r
1062                         case 'u':\r
1063                                 v = getHex (4, out error);\r
1064                                 if (error)\r
1065                                         goto default;\r
1066                                 return v;\r
1067                         case 'U':\r
1068                                 v = getHex (8, out error);\r
1069                                 if (error)\r
1070                                         goto default;\r
1071                                 return v;\r
1072                         default:\r
1073                                 Report.Error (1009, Location, "Unrecognized escape sequence in " + (char)d);\r
1074                                 return d;\r
1075                         }\r
1076                         getChar ();\r
1077                         return v;\r
1078                 }\r
1079 \r
1080                 int getChar ()\r
1081                 {\r
1082                         if (putback_char != -1){\r
1083                                 int x = putback_char;\r
1084                                 putback_char = -1;\r
1085 \r
1086                                 return x;\r
1087                         }\r
1088                         return reader.Read ();\r
1089                 }\r
1090 \r
1091                 int peekChar ()\r
1092                 {\r
1093                         if (putback_char != -1)\r
1094                                 return putback_char;\r
1095                         putback_char = reader.Read ();\r
1096                         return putback_char;\r
1097                 }\r
1098 \r
1099                 int peekChar2 ()\r
1100                 {\r
1101                         if (putback_char != -1)\r
1102                                 return putback_char;\r
1103                         return reader.Peek ();\r
1104                 }\r
1105                 \r
1106                 void putback (int c)\r
1107                 {\r
1108                         if (putback_char != -1){\r
1109                                 Console.WriteLine ("Col: " + col);\r
1110                                 Console.WriteLine ("Row: " + line);\r
1111                                 Console.WriteLine ("Name: " + ref_name.Name);\r
1112                                 Console.WriteLine ("Current [{0}] putting back [{1}]  ", putback_char, c);\r
1113                                 throw new Exception ("This should not happen putback on putback");\r
1114                         }\r
1115                         putback_char = c;\r
1116                 }\r
1117 \r
1118                 public bool advance ()\r
1119                 {\r
1120                         return peekChar () != -1;\r
1121                 }\r
1122 \r
1123                 public Object Value {\r
1124                         get {\r
1125                                 return val;\r
1126                         }\r
1127                 }\r
1128 \r
1129                 public Object value ()\r
1130                 {\r
1131                         return val;\r
1132                 }\r
1133 \r
1134                 bool IsCastToken (int token)\r
1135                 {\r
1136                         switch (token) {\r
1137                         case Token.BANG:\r
1138                         case Token.TILDE:\r
1139                         case Token.IDENTIFIER:\r
1140                         case Token.LITERAL_INTEGER:\r
1141                         case Token.LITERAL_FLOAT:\r
1142                         case Token.LITERAL_DOUBLE:\r
1143                         case Token.LITERAL_DECIMAL:\r
1144                         case Token.LITERAL_CHARACTER:\r
1145                         case Token.LITERAL_STRING:\r
1146                         case Token.BASE:\r
1147                         case Token.CHECKED:\r
1148                         case Token.FALSE:\r
1149                         case Token.FIXED:\r
1150                         case Token.NEW:\r
1151                         case Token.NULL:\r
1152                         case Token.SIZEOF:\r
1153                         case Token.THIS:\r
1154                         case Token.THROW:\r
1155                         case Token.TRUE:\r
1156                         case Token.TYPEOF:\r
1157                         case Token.UNCHECKED:\r
1158                         case Token.UNSAFE:\r
1159 \r
1160                                 //\r
1161                                 // These can be part of a member access\r
1162                                 //\r
1163                         case Token.INT:\r
1164                         case Token.UINT:\r
1165                         case Token.SHORT:\r
1166                         case Token.USHORT:\r
1167                         case Token.LONG:\r
1168                         case Token.ULONG:\r
1169                         case Token.DOUBLE:\r
1170                         case Token.FLOAT:\r
1171                         case Token.CHAR:\r
1172                                 return true;\r
1173 \r
1174                         default:\r
1175                                 return false;\r
1176                         }\r
1177                 }\r
1178 \r
1179                 public int token ()\r
1180                 {\r
1181                         current_token = xtoken ();\r
1182                         return current_token;\r
1183                 }\r
1184 \r
1185                 static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();\r
1186                 \r
1187                 void get_cmd_arg (out string cmd, out string arg)\r
1188                 {\r
1189                         int c;\r
1190                         \r
1191                         tokens_seen = false;\r
1192                         arg = "";\r
1193                         static_cmd_arg.Length = 0;\r
1194                                 \r
1195                         while ((c = getChar ()) != -1 && (c != '\n') && (c != ' ') && (c != '\t') && (c != '\r')){\r
1196                                 static_cmd_arg.Append ((char) c);\r
1197                         }\r
1198 \r
1199                         cmd = static_cmd_arg.ToString ();\r
1200 \r
1201                         if (c == '\n'){\r
1202                                 line++;\r
1203                                 ref_line++;\r
1204                                 return;\r
1205                         } else if (c == '\r')\r
1206                                 col = 0;\r
1207 \r
1208                         // skip over white space\r
1209                         while ((c = getChar ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))\r
1210                                 ;\r
1211 \r
1212                         if (c == '\n'){\r
1213                                 line++;\r
1214                                 ref_line++;\r
1215                                 return;\r
1216                         } else if (c == '\r'){\r
1217                                 col = 0;\r
1218                                 return;\r
1219                         }\r
1220                         \r
1221                         static_cmd_arg.Length = 0;\r
1222                         static_cmd_arg.Append ((char) c);\r
1223                         \r
1224                         while ((c = getChar ()) != -1 && (c != '\n') && (c != '\r')){\r
1225                                 static_cmd_arg.Append ((char) c);\r
1226                         }\r
1227 \r
1228                         if (c == '\n'){\r
1229                                 line++;\r
1230                                 ref_line++;\r
1231                         } else if (c == '\r')\r
1232                                 col = 0;\r
1233                         arg = static_cmd_arg.ToString ().Trim ();\r
1234                 }\r
1235 \r
1236                 //\r
1237                 // Handles the #line directive\r
1238                 //\r
1239                 bool PreProcessLine (string arg)\r
1240                 {\r
1241                         if (arg == "")\r
1242                                 return false;\r
1243 \r
1244                         if (arg == "default"){\r
1245                                 ref_line = line;\r
1246                                 ref_name = file_name;\r
1247                                 Location.Push (ref_name);\r
1248                                 return true;\r
1249                         }\r
1250                         \r
1251                         try {\r
1252                                 int pos;\r
1253 \r
1254                                 if ((pos = arg.IndexOf (' ')) != -1 && pos != 0){\r
1255                                         ref_line = System.Int32.Parse (arg.Substring (0, pos));\r
1256                                         pos++;\r
1257                                         \r
1258                                         char [] quotes = { '\"' };\r
1259                                         \r
1260                                         string name = arg.Substring (pos). Trim (quotes);\r
1261                                         ref_name = Location.LookupFile (name);\r
1262                                         Location.Push (ref_name);\r
1263                                 } else {\r
1264                                         ref_line = System.Int32.Parse (arg);\r
1265                                 }\r
1266                         } catch {\r
1267                                 return false;\r
1268                         }\r
1269                         \r
1270                         return true;\r
1271                 }\r
1272 \r
1273                 //\r
1274                 // Handles #define and #undef\r
1275                 //\r
//
// Validates the symbol named by a `#define' or `#undef' directive and
// updates the `defines' table.
//
//   is_define: true for `#define' (the symbol is added through define ()),
//              false for `#undef' (the symbol is removed when present).
//   arg:       the text that followed the directive name.
//
// Reports CS1001 when the symbol is missing, is `true'/`false', or is not
// a well-formed identifier, and CS1025 when it contains blanks.  Once an
// error has been reported nothing is defined or undefined.
//
void PreProcessDefinition (bool is_define, string arg)
{
        if (arg == "" || arg == "true" || arg == "false"){
                Report.Error (1001, Location, "Missing identifier to pre-processor directive");
                return;
        }

        char[] whitespace = { ' ', '\t' };
        if (arg.IndexOfAny (whitespace) != -1){
                Report.Error (1025, Location, "Single-line comment or end-of-line expected");
                return;
        }

        // arg is known to be non-empty here, so arg [0] is safe.
        bool well_formed = is_identifier_start_character (arg [0]);
        for (int i = 1; well_formed && i < arg.Length; i++)
                well_formed = is_identifier_part_character (arg [i]);

        if (!well_formed){
                // Report once and stop: an invalid name must never reach
                // the `defines' table.
                Report.Error (1001, Location, "Identifier expected: " + arg);
                return;
        }

        if (is_define){
                if (defines == null)
                        defines = new Hashtable ();
                define (arg);
        } else if (defines != null){
                // Hashtable.Remove is a no-op when the key is absent.
                defines.Remove (arg);
        }
}
1310 \r
//
// Evaluates a single operand of a pre-processor expression: the literals
// `true' and `false' evaluate to themselves, any other text is true only
// when it is a key of the `defines' table.
//
bool eval_val (string s)
{
        switch (s){
        case "true":
                return true;
        case "false":
                return false;
        }

        // No table means nothing has been defined.
        return defines != null && defines.Contains (s);
}
1325 \r
//
// Parses a primary pre-processor expression from the front of `s':
// either a parenthesized expression or a symbol / `true' / `false'.
//
// On return `s' holds the text that was not consumed.  Anything else at
// the front of `s' (including an empty string or a missing `)') reports
// an invalid directive and yields false.
//
bool pp_primary (ref string s)
{
        s = s.Trim ();

        if (s.Length == 0){
                Error_InvalidDirective ();
                return false;
        }

        char first = s [0];

        if (first == '('){
                s = s.Substring (1);
                bool inner = pp_expr (ref s);

                if (s.Length == 0 || s [0] != ')'){
                        Error_InvalidDirective ();
                        return false;
                }

                // Drop the closing parenthesis.
                s = s.Substring (1);
                return inner;
        }

        if (!is_identifier_start_character (first)){
                Error_InvalidDirective ();
                return false;
        }

        // Find the end of the identifier that starts at s [0].
        int end = 1;
        while (end < s.Length && is_identifier_part_character (s [end]))
                end++;

        bool defined = eval_val (s.Substring (0, end));
        s = s.Substring (end);
        return defined;
}
1367                 \r
//
// Parses a unary pre-processor expression from the front of `s':
// zero or more `!' operators followed by a primary expression.
//
// The operand of `!' is itself a unary expression, so `!!A' and `! !A'
// are accepted.  A leading `!=' is rejected, as is an empty string; both
// report an invalid directive and yield false.  On return `s' holds the
// text that was not consumed.
//
bool pp_unary (ref string s)
{
        s = s.Trim ();
        int len = s.Length;

        if (len == 0){
                Error_InvalidDirective ();
                return false;
        }

        if (s [0] != '!')
                return pp_primary (ref s);

        // `!=' is a binary operator and cannot start an operand.
        if (len > 1 && s [1] == '='){
                Error_InvalidDirective ();
                return false;
        }

        s = s.Substring (1);
        return !pp_unary (ref s);
}
1388                 \r
//
// Parses an equality pre-processor expression from the front of `s':
// a unary expression followed by any number of `== unary' or
// `!= unary' tails, combined left to right.
//
// A lone `=' (or `==' with nothing after it) reports an invalid
// directive and yields false.  On return `s' holds the text that was not
// consumed.
//
bool pp_eq (ref string s)
{
        bool result = pp_unary (ref s);

        // Every iteration consumes a two-character operator, so the
        // loop ends once the remaining text no longer starts with one.
        for (;;){
                s = s.Trim ();
                int len = s.Length;

                if (len == 0)
                        return result;

                if (s [0] == '='){
                        if (len <= 2 || s [1] != '='){
                                Error_InvalidDirective ();
                                return false;
                        }
                        s = s.Substring (2);
                        bool rhs = pp_unary (ref s);
                        result = (result == rhs);
                } else if (s [0] == '!' && len > 1 && s [1] == '='){
                        s = s.Substring (2);
                        bool rhs = pp_unary (ref s);
                        result = (result != rhs);
                } else
                        return result;
        }
}
1415                 \r
//
// Parses a conditional-and pre-processor expression from the front of
// `s': an equality expression followed by any number of `&& equality'
// tails, so `A && B && C' is accepted.
//
// A lone `&' (or `&&' with nothing after it) reports an invalid
// directive and yields false.  On return `s' holds the text that was not
// consumed.
//
bool pp_and (ref string s)
{
        bool result = pp_eq (ref s);

        for (;;){
                s = s.Trim ();
                int len = s.Length;

                if (len == 0 || s [0] != '&')
                        return result;

                if (len <= 2 || s [1] != '&'){
                        Error_InvalidDirective ();
                        return false;
                }

                s = s.Substring (2);

                // The right operand is always parsed, even when the
                // result is already false, so that its text is consumed.
                bool rhs = pp_eq (ref s);
                result = result & rhs;
        }
}
1435                 \r
1436                 //\r
1437                 // Evaluates an expression for `#if' or `#elif'\r
1438                 //\r
//
// Parses `and-expression [ || expression ]' from the front of `s'.
//
// A lone `|' (or `||' with nothing after it) reports an invalid
// directive and yields false.  On return `s' holds the text that was not
// consumed.
//
bool pp_expr (ref string s)
{
        bool lhs = pp_and (ref s);

        s = s.Trim ();
        if (s.Length == 0 || s [0] != '|')
                return lhs;

        if (s.Length <= 2 || s [1] != '|'){
                Error_InvalidDirective ();
                return false;
        }

        s = s.Substring (2);

        // Always parse the right-hand side so that its text is consumed.
        bool rhs = pp_expr (ref s);
        return lhs | rhs;
}
1460 \r
//
// Evaluates a complete pre-processor expression.  Text left over after
// the expression (other than blanks) reports an invalid directive and
// makes the result false.
//
bool eval (string s)
{
        bool result = pp_expr (ref s);

        if (s.Trim ().Length == 0)
                return result;

        Error_InvalidDirective ();
        return false;
}
1472                 \r
//
// Reports error 1517 at the current location.
//
void Error_InvalidDirective ()
{
        const string message = "Invalid pre-processor directive";

        Report.Error (1517, Location, message);
}
1477 \r
//
// Reports error 1028 at the current location; `extra' is appended to the
// message in parentheses.
//
void Error_UnexpectedDirective (string extra)
{
        string message = "Unexpected processor directive (" + extra + ")";

        Report.Error (1028, Location, message);
}
1484 \r
//
// Reports error 1032 at the current location.
//
void Error_TokensSeen ()
{
        const string message =
                "Cannot define or undefine pre-processor symbols after a token in the file";

        Report.Error (1032, Location, message);
}
1491                 \r
1492                 //\r
1493                 // if true, then the code continues processing the code\r
1494                 // if false, the code stays in a loop until another directive is\r
1495                 // reached.\r
1496                 //\r
//
// Reads the directive name and argument with get_cmd_arg () and acts on
// them.
//
//   caller_is_taking: true when the caller is tokenizing the surrounding
//                     source, false when it is skipping it.
//
// Conditional directives (#if, #elif, #else, #endif, #region,
// #endregion) maintain `ifstack', whose entries are bit masks built from
// TAKING, TAKEN_BEFORE, ELSE_SEEN, PARENT_TAKING and REGION.  #line and
// #pragma never change whether source is being taken, so they hand
// `caller_is_taking' back.  #define, #undef, #error and #warning are
// only acted upon when `caller_is_taking' is true.
//
bool handle_preprocessing_directive (bool caller_is_taking)
{
        string cmd, arg;
        bool region_directive = false;

        get_cmd_arg (out cmd, out arg);

        // Eat any trailing whitespaces and single-line comments
        int comment_start = arg.IndexOf ("//");
        if (comment_start != -1)
                arg = arg.Substring (0, comment_start);
        arg = arg.TrimEnd (' ', '\t');

        //
        // The first group of pre-processing instructions is always processed
        //
        switch (cmd){
        case "pragma":
                // Accepted and ignored in V2 mode; it must not switch a
                // skipped block back on.  Otherwise it is handled like
                // any unknown directive below.
                if (RootContext.V2)
                        return caller_is_taking;
                break;

        case "line":
                if (!PreProcessLine (arg))
                        Report.Error (
                                1576, Location,
                                "Argument to #line directive is missing or invalid");
                // #line does not open or close a block: keep skipping if
                // the caller was skipping.
                return caller_is_taking;

        case "region":
                // A region is tracked as an `#if true' block flagged REGION.
                region_directive = true;
                arg = "true";
                goto case "if";

        case "endregion":
                region_directive = true;
                goto case "endif";

        case "if":
                if (arg == ""){
                        Error_InvalidDirective ();
                        return true;
                }
                bool taking = false;
                if (ifstack == null)
                        ifstack = new Stack ();

                // The new block can only be taken if the enclosing one is.
                if (ifstack.Count == 0){
                        taking = true;
                } else {
                        int state = (int) ifstack.Peek ();
                        if ((state & TAKING) != 0)
                                taking = true;
                }

                if (eval (arg) && taking){
                        int push = TAKING | TAKEN_BEFORE | PARENT_TAKING;
                        if (region_directive)
                                push |= REGION;
                        ifstack.Push (push);
                        return true;
                } else {
                        int push = (taking ? PARENT_TAKING : 0);
                        if (region_directive)
                                push |= REGION;
                        ifstack.Push (push);
                        return false;
                }

        case "endif":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #endif");
                        return true;
                } else {
                        int pop = (int) ifstack.Pop ();

                        // #region must be closed by #endregion and #if by #endif.
                        if (region_directive && ((pop & REGION) == 0))
                                Report.Error (1027, Location, "#endif directive expected");
                        else if (!region_directive && ((pop & REGION) != 0))
                                Report.Error (1038, Location, "#endregion directive expected");

                        if (ifstack.Count == 0)
                                return true;
                        else {
                                // Resume whatever the enclosing block was doing.
                                int state = (int) ifstack.Peek ();

                                if ((state & TAKING) != 0)
                                        return true;
                                else
                                        return false;
                        }
                }

        case "elif":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #elif");
                        return true;
                } else {
                        int state = (int) ifstack.Peek ();

                        if ((state & REGION) != 0) {
                                Report.Error (1038, Location, "#endregion directive expected");
                                return true;
                        }

                        if ((state & ELSE_SEEN) != 0){
                                Error_UnexpectedDirective ("#elif not valid after #else");
                                return true;
                        }

                        if ((state & (TAKEN_BEFORE | TAKING)) != 0){
                                // An earlier branch was taken, so this one is
                                // skipped.  Clear TAKING so that an #if nested
                                // in the skipped branch sees a non-taking parent.
                                ifstack.Pop ();
                                ifstack.Push (state & ~TAKING);
                                return false;
                        }

                        if (eval (arg) && ((state & PARENT_TAKING) != 0)){
                                state = (int) ifstack.Pop ();
                                ifstack.Push (state | TAKING | TAKEN_BEFORE);
                                return true;
                        } else
                                return false;
                }

        case "else":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #else");
                        return true;
                } else {
                        int state = (int) ifstack.Peek ();

                        if ((state & REGION) != 0) {
                                Report.Error (1038, Location, "#endregion directive expected");
                                return true;
                        }

                        if ((state & ELSE_SEEN) != 0){
                                Error_UnexpectedDirective ("#else within #else");
                                return true;
                        }

                        ifstack.Pop ();

                        // The #else branch is taken only when no earlier
                        // branch was and the enclosing block is being taken.
                        bool ret;
                        if ((state & TAKEN_BEFORE) == 0){
                                ret = ((state & PARENT_TAKING) != 0);
                        } else
                                ret = false;

                        if (ret)
                                state |= TAKING;
                        else
                                state &= ~TAKING;

                        ifstack.Push (state | ELSE_SEEN);

                        return ret;
                }
        }

        //
        // These are only processed if we are in a `taking' block
        //
        if (!caller_is_taking)
                return false;

        switch (cmd){
        case "define":
                if (any_token_seen){
                        Error_TokensSeen ();
                        return true;
                }
                PreProcessDefinition (true, arg);
                return true;

        case "undef":
                if (any_token_seen){
                        Error_TokensSeen ();
                        return true;
                }
                PreProcessDefinition (false, arg);
                return true;

        case "error":
                Report.Error (1029, Location, "#error: '" + arg + "'");
                return true;

        case "warning":
                Report.Warning (1030, Location, "#warning: '" + arg + "'");
                return true;
        }

        Report.Error (1024, Location, "Preprocessor directive expected (got: " + cmd + ")");
        return true;

}
1691 \r
//
// Reads characters up to the closing double quote into `string_builder'
// and stores the resulting text in `val'.
//
//   quoted: when true a doubled `""' stands for one quote character,
//           newlines are accepted silently and escape () is not applied
//           (presumably the @"..." form -- confirm against the caller).
//           When false every character goes through escape () and a
//           newline reports error 1010.
//
// Returns Token.LITERAL_STRING on success, Token.ERROR when escape ()
// yields -1, and Token.EOF (after reporting error 1039) when the input
// ends before the closing quote.
//
private int consume_string (bool quoted)
{
        string_builder.Length = 0;

        for (;;){
                int ch = getChar ();
                if (ch == -1)
                        break;

                if (ch == '"'){
                        // peekChar () is only consulted for `quoted' strings.
                        bool doubled = quoted && peekChar () == '"';
                        if (!doubled){
                                val = string_builder.ToString ();
                                return Token.LITERAL_STRING;
                        }

                        // Keep one quote and swallow the second one.
                        string_builder.Append ((char) ch);
                        getChar ();
                        continue;
                }

                if (ch != '\n')
                        col++;
                else {
                        if (!quoted)
                                Report.Error (1010, Location, "Newline in constant");
                        line++;
                        ref_line++;
                        col = 0;
                }

                if (!quoted){
                        ch = escape (ch);
                        if (ch == -1)
                                return Token.ERROR;
                }

                string_builder.Append ((char) ch);
        }

        Report.Error (1039, Location, "Unterminated string literal");
        return Token.EOF;
}
1729 \r
//
// Reads the rest of an identifier whose first character `s' has already
// been consumed by the caller, and stores its text in `val'.
//
//   s:      first character of the identifier.
//   quoted: when true a keyword match is ignored and the text is
//           returned as a plain identifier.
//
// Returns the keyword token when the text is a keyword (and `quoted' is
// false), Token.IDENTIFIER otherwise, or Token.ERROR after reporting
// error 645 when the identifier reaches `max_id_size' characters.
// The first character that does not belong to the identifier is left in
// `putback_char'.
//
private int consume_identifier (int s, bool quoted)
{
        int length = 1;

        id_builder [0] = (char) s;

        for (;;){
                int next = reader.Read ();
                if (next == -1)
                        break;

                if (!is_identifier_part_character ((char) next)){
                        putback_char = next;
                        break;
                }

                if (length == max_id_size){
                        Report.Error (645, Location, "Identifier too long (limit is 512 chars)");
                        return Token.ERROR;
                }

                id_builder [length++] = (char) next;
                putback_char = -1;
                col++;
        }

        //
        // Optimization: the keyword lookup is only attempted when the
        // first character is `a' or above, which leaves out uppercase
        // letters and `_'.
        //
        if (s >= 'a'){
                int keyword = GetKeyword (id_builder, length);
                if (!quoted && keyword != -1)
                        return keyword;
        }

        //
        // Identifier strings are cached in one table per length so that
        // a repeated identifier does not allocate a new string.
        //
        if (identifiers [length] == null)
                identifiers [length] = new CharArrayHashtable (length);
        else {
                val = identifiers [length][id_builder];
                if (val != null)
                        return Token.IDENTIFIER;
        }

        val = new String (id_builder, 0, length);

        // The table key must be a private copy: id_builder is reused.
        char [] key = new char [length];
        Array.Copy (id_builder, key, length);
        identifiers [length] [key] = val;

        return Token.IDENTIFIER;
}
1786                 \r
1787                 public int xtoken ()\r
1788                 {\r
1789                         int t;\r
1790                         bool doread = false;\r
1791                         int c;\r
1792 \r
1793                         val = null;\r
1794                         // optimization: eliminate col and implement #directive semantic correctly.\r
1795                         for (;(c = getChar ()) != -1; col++) {\r
1796                                 if (c == ' ' || c == '\t' || c == '\f' || c == '\v' || c == '\r' || c == 0xa0){\r
1797                                         \r
1798                                         if (c == '\t')\r
1799                                                 col = (((col + 8) / 8) * 8) - 1;\r
1800                                         continue;\r
1801                                 }\r
1802 \r
1803                                 // Handle double-slash comments.\r
1804                                 if (c == '/'){\r
1805                                         int d = peekChar ();\r
1806                                 \r
1807                                         if (d == '/'){\r
1808                                                 getChar ();\r
1809                                                 while ((d = getChar ()) != -1 && (d != '\n') && d != '\r')\r
1810                                                         col++;\r
1811                                                 if (d == '\n'){\r
1812                                                         line++;\r
1813                                                         ref_line++;\r
1814                                                         col = 0;\r
1815                                                 }\r
1816                                                 any_token_seen |= tokens_seen;\r
1817                                                 tokens_seen = false;\r
1818                                                 continue;\r
1819                                         } else if (d == '*'){\r
1820                                                 getChar ();\r
1821 \r
1822                                                 while ((d = getChar ()) != -1){\r
1823                                                         if (d == '*' && peekChar () == '/'){\r
1824                                                                 getChar ();\r
1825                                                                 col++;\r
1826                                                                 break;\r
1827                                                         }\r
1828                                                         if (d == '\n'){\r
1829                                                                 line++;\r
1830                                                                 ref_line++;\r
1831                                                                 col = 0;\r
1832                                                                 any_token_seen |= tokens_seen;\r
1833                                                                 tokens_seen = false;\r
1834                                                         }\r
1835                                                 }\r
1836                                                 continue;\r
1837                                         }\r
1838                                         goto is_punct_label;\r
1839                                 }\r
1840 \r
1841                                 \r
1842                                 if (is_identifier_start_character ((char)c)){\r
1843                                         tokens_seen = true;\r
1844                                         return consume_identifier (c, false);\r
1845                                 }\r
1846 \r
1847                         is_punct_label:\r
1848                                 if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){\r
1849                                         tokens_seen = true;\r
1850                                         if (doread){\r
1851                                                 getChar ();\r
1852                                                 col++;\r
1853                                         }\r
1854                                         return t;\r
1855                                 }\r
1856 \r
1857                                 // white space\r
1858                                 if (c == '\n'){\r
1859                                         line++;\r
1860                                         ref_line++;\r
1861                                         col = 0;\r
1862                                         any_token_seen |= tokens_seen;\r
1863                                         tokens_seen = false;\r
1864                                         continue;\r
1865                                 }\r
1866 \r
1867                                 if (c >= '0' && c <= '9'){\r
1868                                         tokens_seen = true;\r
1869                                         return is_number (c);\r
1870                                 }\r
1871 \r
1872                                 if (c == '.'){\r
1873                                         tokens_seen = true;\r
1874                                         int peek = peekChar ();\r
1875                                         if (peek >= '0' && peek <= '9')\r
1876                                                 return is_number (c);\r
1877                                         return Token.DOT;\r
1878                                 }\r
1879                                 \r
1880                                 /* For now, ignore pre-processor commands */\r
1881                                 // FIXME: In C# the '#' is not limited to appear\r
1882                                 // on the first column.\r
1883                                 if (c == '#' && !tokens_seen){\r
1884                                         bool cont = true;\r
1885                                         \r
1886                                 start_again:\r
1887                                         \r
1888                                         cont = handle_preprocessing_directive (cont);\r
1889 \r
1890                                         if (cont){\r
1891                                                 col = 0;\r
1892                                                 continue;\r
1893                                         }\r
1894                                         col = 1;\r
1895 \r
1896                                         bool skipping = false;\r
1897                                         for (;(c = getChar ()) != -1; col++){\r
1898                                                 if (c == '\n'){\r
1899                                                         col = 0;\r
1900                                                         line++;\r
1901                                                         ref_line++;\r
1902                                                         skipping = false;\r
1903                                                 } else if (c == ' ' || c == '\t' || c == '\v' || c == '\r' || c == 0xa0)\r
1904                                                         continue;\r
1905                                                 else if (c != '#')\r
1906                                                         skipping = true;\r
1907                                                 if (c == '#' && !skipping)\r
1908                                                         goto start_again;\r
1909                                         }\r
1910                                         any_token_seen |= tokens_seen;\r
1911                                         tokens_seen = false;\r
1912                                         if (c == -1)\r
1913                                                 Report.Error (1027, Location, "#endif/#endregion expected");\r
1914                                         continue;\r
1915                                 }\r
1916                                 \r
1917                                 if (c == '"') \r
1918                                         return consume_string (false);\r
1919 \r
1920                                 if (c == '\''){\r
1921                                         c = getChar ();\r
1922                                         tokens_seen = true;\r
1923                                         if (c == '\''){\r
1924                                                 error_details = "Empty character literal";\r
1925                                                 Report.Error (1011, Location, error_details);\r
1926                                                 return Token.ERROR;\r
1927                                         }\r
1928                                         c = escape (c);\r
1929                                         if (c == -1)\r
1930                                                 return Token.ERROR;\r
1931                                         val = new System.Char ();\r
1932                                         val = (char) c;\r
1933                                         c = getChar ();\r
1934 \r
1935                                         if (c != '\''){\r
1936                                                 error_details = "Too many characters in character literal";\r
1937                                                 Report.Error (1012, Location, error_details);\r
1938 \r
1939                                                 // Try to recover, read until newline or next "'"\r
1940                                                 while ((c = getChar ()) != -1){\r
1941                                                         if (c == '\n' || c == '\''){\r
1942                                                                 line++;\r
1943                                                                 ref_line++;\r
1944                                                                 col = 0;\r
1945                                                                 break;\r
1946                                                         } else\r
1947                                                                 col++;\r
1948                                                         \r
1949                                                 }\r
1950                                                 return Token.ERROR;\r
1951                                         }\r
1952                                         return Token.LITERAL_CHARACTER;\r
1953                                 }\r
1954                                 \r
1955                                 if (c == '@') {\r
1956                                         c = getChar ();\r
1957                                         if (c == '"') {\r
1958                                                 tokens_seen = true;\r
1959                                                 return consume_string (true);\r
1960                                         } else if (is_identifier_start_character ((char) c)){\r
1961                                                 return consume_identifier (c, true);\r
1962                                         } else {\r
1963                                                 Report.Error (1033, Location, "'@' must be followed by string constant or identifier");\r
1964                                         }\r
1965                                 }\r
1966 \r
1967                                 if (c == '#') {\r
1968                                         error_details = "Preprocessor directives must appear as the first non-whitespace " +\r
1969                                                 "character on a line.";\r
1970 \r
1971                                         Report.Error (1040, Location, error_details);\r
1972 \r
1973                                         return Token.ERROR;\r
1974                                 }\r
1975 \r
1976                                 error_details = ((char)c).ToString ();\r
1977                                 \r
1978                                 return Token.ERROR;\r
1979                         }\r
1980 \r
1981                         return Token.EOF;\r
1982                 }\r
1983 \r
/// <summary>
///   Reports a conditional or region directive that is still open
///   when this method is called.
/// </summary>
/// <remarks>
///   Only the top-most entry of <c>ifstack</c> is popped and examined,
///   so at most one diagnostic is issued per call: error 1038 when the
///   entry has the REGION bit set, error 1027 otherwise.  Nothing is
///   reported when <c>ifstack</c> is null or empty.
/// </remarks>
public void cleanup ()
{
        if (ifstack == null || ifstack.Count < 1)
                return;

        int state = (int) ifstack.Pop ();

        // Pass Location, as the other Report.Error calls in this
        // tokenizer do, so the diagnostic carries the tokenizer's
        // current position instead of being reported without one.
        if ((state & REGION) != 0)
                Report.Error (1038, Location, "#endregion directive expected");
        else
                Report.Error (1027, Location, "#endif directive expected");
}
1995         }\r
1996 }\r
1997 \r