2004-01-17 Miguel de Icaza <miguel@ximian.com>
[mono.git] / mcs / mcs / cs-tokenizer.cs
1 //\r
2 // cs-tokenizer.cs: The Tokenizer for the C# compiler\r
3 //                  This also implements the preprocessor\r
4 //\r
5 // Author: Miguel de Icaza (miguel@gnu.org)\r
6 //\r
7 // Licensed under the terms of the GNU GPL\r
8 //\r
9 // (C) 2001, 2002 Ximian, Inc (http://www.ximian.com)\r
10 //\r
11 \r
12 /*\r
13  * TODO:\r
14  *   Make sure we accept the proper Unicode ranges, per the spec.\r
15  *   Report error 1032\r
16 */\r
17 \r
18 using System;\r
19 using System.Text;\r
20 using System.Collections;\r
21 using System.IO;\r
22 using System.Globalization;\r
23 using System.Reflection;\r
24 \r
25 namespace Mono.CSharp\r
26 {\r
27         /// <summary>\r
28         ///    Tokenizer for C# source code. \r
29         /// </summary>\r
30 \r
31         public class Tokenizer : yyParser.yyInput\r
32         {\r
33                 SeekableStreamReader reader;\r
34                 public SourceFile ref_name;\r
35                 public SourceFile file_name;\r
36                 public int ref_line = 1;\r
37                 public int line = 1;\r
38                 public int col = 1;\r
39                 public int current_token;\r
40                 bool handle_get_set = false;\r
41                 bool handle_remove_add = false;\r
42                 bool handle_assembly = false;\r
43 \r
44                 //\r
45                 // Whether tokens have been seen on this line\r
46                 //\r
47                 bool tokens_seen = false;\r
48 \r
49                 //\r
50                 // Whether a token has been seen on the file\r
51                 // This is needed because `define' is not allowed to be used\r
52                 // after a token has been seen.\r
53                 //\r
54                 bool any_token_seen = false;\r
55                 static Hashtable tokenValues;\r
56                 \r
57                 private static Hashtable TokenValueName\r
58                 {\r
59                         get {\r
60                                 if (tokenValues == null)\r
61                                         tokenValues = GetTokenValueNameHash ();\r
62 \r
63                                 return tokenValues;\r
64                         }\r
65                 }\r
66 \r
67                 private static Hashtable GetTokenValueNameHash ()\r
68                 {\r
69                         Type t = typeof (Token);\r
70                         FieldInfo [] fields = t.GetFields ();\r
71                         Hashtable hash = new Hashtable ();\r
72                         foreach (FieldInfo field in fields) {\r
73                                 if (field.IsLiteral && field.IsStatic && field.FieldType == typeof (int))\r
74                                         hash.Add (field.GetValue (null), field.Name);\r
75                         }\r
76                         return hash;\r
77                 }\r
78                 \r
79                 //\r
80                 // Returns a verbose representation of the current location\r
81                 //\r
82                 public string location {\r
83                         get {\r
84                                 string det;\r
85 \r
86                                 if (current_token == Token.ERROR)\r
87                                         det = "detail: " + error_details;\r
88                                 else\r
89                                         det = "";\r
90                                 \r
91                                 // return "Line:     "+line+" Col: "+col + "\n" +\r
92                                 //       "VirtLine: "+ref_line +\r
93                                 //       " Token: "+current_token + " " + det;\r
94                                 string current_token_name = TokenValueName [current_token] as string;\r
95                                 if (current_token_name == null)\r
96                                         current_token_name = current_token.ToString ();\r
97 \r
98                                 return String.Format ("{0} ({1},{2}), Token: {3} {4}", ref_name.Name,\r
99                                                                                        ref_line,\r
100                                                                                        col,\r
101                                                                                        current_token_name,\r
102                                                                                        det);\r
103                         }\r
104                 }\r
105 \r
106                 public bool PropertyParsing {\r
107                         get {\r
108                                 return handle_get_set;\r
109                         }\r
110 \r
111                         set {\r
112                                 handle_get_set = value;\r
113                         }\r
114                 }\r
115 \r
116                 public bool AssemblyTargetParsing {\r
117                         get {\r
118                                 return handle_assembly;\r
119                         }\r
120 \r
121                         set {\r
122                                 handle_assembly = value;\r
123                         }\r
124                 }\r
125 \r
126                 public bool EventParsing {\r
127                         get {\r
128                                 return handle_remove_add;\r
129                         }\r
130 \r
131                         set {\r
132                                 handle_remove_add = value;\r
133                         }\r
134                 }\r
135                 \r
136                 //\r
137                 // Class variables\r
138                 // \r
139                 static CharArrayHashtable[] keywords;\r
140                 static NumberStyles styles;\r
141                 static NumberFormatInfo csharp_format_info;\r
142                 \r
143                 //\r
144                 // Values for the associated token returned\r
145                 //\r
146                 int putback_char;\r
147                 Object val;\r
148 \r
149                 //\r
150                 // Pre-processor\r
151                 //\r
152                 Hashtable defines;\r
153 \r
154                 const int TAKING        = 1;\r
155                 const int TAKEN_BEFORE  = 2;\r
156                 const int ELSE_SEEN     = 4;\r
157                 const int PARENT_TAKING = 8;\r
158                 const int REGION        = 16;           \r
159 \r
160                 //\r
161                 // pre-processor if stack state:\r
162                 //\r
163                 Stack ifstack;\r
164 \r
165                 static System.Text.StringBuilder string_builder;\r
166 \r
167                 const int max_id_size = 512;\r
168                 static char [] id_builder = new char [max_id_size];\r
169 \r
170                 static CharArrayHashtable [] identifiers = new CharArrayHashtable [max_id_size + 1];\r
171 \r
172                 const int max_number_size = 128;\r
173                 static char [] number_builder = new char [max_number_size];\r
174                 static int number_pos;\r
175                 \r
176                 //\r
177                 // Details about the error encountered by the tokenizer\r
178                 //\r
179                 string error_details;\r
180                 \r
181                 public string error {\r
182                         get {\r
183                                 return error_details;\r
184                         }\r
185                 }\r
186                 \r
187                 public int Line {\r
188                         get {\r
189                                 return ref_line;\r
190                         }\r
191                 }\r
192 \r
193                 public int Col {\r
194                         get {\r
195                                 return col;\r
196                         }\r
197                 }\r
198 \r
199                 static void AddKeyword (string kw, int token) {\r
200                         if (keywords [kw.Length] == null) {\r
201                                 keywords [kw.Length] = new CharArrayHashtable (kw.Length);\r
202                         }\r
203                         keywords [kw.Length] [kw.ToCharArray ()] = token;\r
204                 }\r
205 \r
206                 static void InitTokens ()\r
207                 {\r
208                         keywords = new CharArrayHashtable [64];\r
209 \r
210                         AddKeyword ("abstract", Token.ABSTRACT);\r
211                         AddKeyword ("as", Token.AS);\r
212                         AddKeyword ("add", Token.ADD);\r
213                         AddKeyword ("assembly", Token.ASSEMBLY);\r
214                         AddKeyword ("base", Token.BASE);\r
215                         AddKeyword ("bool", Token.BOOL);\r
216                         AddKeyword ("break", Token.BREAK);\r
217                         AddKeyword ("byte", Token.BYTE);\r
218                         AddKeyword ("case", Token.CASE);\r
219                         AddKeyword ("catch", Token.CATCH);\r
220                         AddKeyword ("char", Token.CHAR);\r
221                         AddKeyword ("checked", Token.CHECKED);\r
222                         AddKeyword ("class", Token.CLASS);\r
223                         AddKeyword ("const", Token.CONST);\r
224                         AddKeyword ("continue", Token.CONTINUE);\r
225                         AddKeyword ("decimal", Token.DECIMAL);\r
226                         AddKeyword ("default", Token.DEFAULT);\r
227                         AddKeyword ("delegate", Token.DELEGATE);\r
228                         AddKeyword ("do", Token.DO);\r
229                         AddKeyword ("double", Token.DOUBLE);\r
230                         AddKeyword ("else", Token.ELSE);\r
231                         AddKeyword ("enum", Token.ENUM);\r
232                         AddKeyword ("event", Token.EVENT);\r
233                         AddKeyword ("explicit", Token.EXPLICIT);\r
234                         AddKeyword ("extern", Token.EXTERN);\r
235                         AddKeyword ("false", Token.FALSE);\r
236                         AddKeyword ("finally", Token.FINALLY);\r
237                         AddKeyword ("fixed", Token.FIXED);\r
238                         AddKeyword ("float", Token.FLOAT);\r
239                         AddKeyword ("for", Token.FOR);\r
240                         AddKeyword ("foreach", Token.FOREACH);\r
241                         AddKeyword ("goto", Token.GOTO);\r
242                         AddKeyword ("get", Token.GET);\r
243                         AddKeyword ("if", Token.IF);\r
244                         AddKeyword ("implicit", Token.IMPLICIT);\r
245                         AddKeyword ("in", Token.IN);\r
246                         AddKeyword ("int", Token.INT);\r
247                         AddKeyword ("interface", Token.INTERFACE);\r
248                         AddKeyword ("internal", Token.INTERNAL);\r
249                         AddKeyword ("is", Token.IS);\r
250                         AddKeyword ("lock", Token.LOCK);\r
251                         AddKeyword ("long", Token.LONG);\r
252                         AddKeyword ("namespace", Token.NAMESPACE);\r
253                         AddKeyword ("new", Token.NEW);\r
254                         AddKeyword ("null", Token.NULL);\r
255                         AddKeyword ("object", Token.OBJECT);\r
256                         AddKeyword ("operator", Token.OPERATOR);\r
257                         AddKeyword ("out", Token.OUT);\r
258                         AddKeyword ("override", Token.OVERRIDE);\r
259                         AddKeyword ("params", Token.PARAMS);\r
260                         AddKeyword ("private", Token.PRIVATE);\r
261                         AddKeyword ("protected", Token.PROTECTED);\r
262                         AddKeyword ("public", Token.PUBLIC);\r
263                         AddKeyword ("readonly", Token.READONLY);\r
264                         AddKeyword ("ref", Token.REF);\r
265                         AddKeyword ("remove", Token.REMOVE);\r
266                         AddKeyword ("return", Token.RETURN);\r
267                         AddKeyword ("sbyte", Token.SBYTE);\r
268                         AddKeyword ("sealed", Token.SEALED);\r
269                         AddKeyword ("set", Token.SET);\r
270                         AddKeyword ("short", Token.SHORT);\r
271                         AddKeyword ("sizeof", Token.SIZEOF);\r
272                         AddKeyword ("stackalloc", Token.STACKALLOC);\r
273                         AddKeyword ("static", Token.STATIC);\r
274                         AddKeyword ("string", Token.STRING);\r
275                         AddKeyword ("struct", Token.STRUCT);\r
276                         AddKeyword ("switch", Token.SWITCH);\r
277                         AddKeyword ("this", Token.THIS);\r
278                         AddKeyword ("throw", Token.THROW);\r
279                         AddKeyword ("true", Token.TRUE);\r
280                         AddKeyword ("try", Token.TRY);\r
281                         AddKeyword ("typeof", Token.TYPEOF);\r
282                         AddKeyword ("uint", Token.UINT);\r
283                         AddKeyword ("ulong", Token.ULONG);\r
284                         AddKeyword ("unchecked", Token.UNCHECKED);\r
285                         AddKeyword ("unsafe", Token.UNSAFE);\r
286                         AddKeyword ("ushort", Token.USHORT);\r
287                         AddKeyword ("using", Token.USING);\r
288                         AddKeyword ("virtual", Token.VIRTUAL);\r
289                         AddKeyword ("void", Token.VOID);\r
290                         AddKeyword ("volatile", Token.VOLATILE);\r
291                         AddKeyword ("while", Token.WHILE);\r
292 \r
293                         if (RootContext.V2){\r
294                                 AddKeyword ("__yield", Token.YIELD);\r
295                                 AddKeyword ("yield", Token.YIELD);\r
296                         }\r
297                 }\r
298 \r
299                 //\r
300                 // Class initializer\r
301                 // \r
302                 static Tokenizer ()\r
303                 {\r
304                         InitTokens ();\r
305                         csharp_format_info = NumberFormatInfo.InvariantInfo;\r
306                         styles = NumberStyles.Float;\r
307                         \r
308                         string_builder = new System.Text.StringBuilder ();\r
309                 }\r
310 \r
311                 int GetKeyword (char[] id, int id_len)\r
312                 {\r
313                         /*\r
314                          * Keywords are stored in an array of hashtables grouped by their\r
315                          * length.\r
316                          */\r
317 \r
318                         if ((id_len >= keywords.Length) || (keywords [id_len] == null))\r
319                                 return -1;\r
320                         object o = keywords [id_len] [id];\r
321 \r
322                         if (o == null)\r
323                                 return -1;\r
324                         \r
325                         int res = (int) o;\r
326 \r
327                         if (handle_get_set == false && (res == Token.GET || res == Token.SET))\r
328                                 return -1;\r
329                         if (handle_remove_add == false && (res == Token.REMOVE || res == Token.ADD))\r
330                                 return -1;\r
331                         if (handle_assembly == false && res == Token.ASSEMBLY)\r
332                                 return -1;\r
333                         return res;\r
334                         \r
335                 }\r
336 \r
337                 public Location Location {\r
338                         get {\r
339                                 return new Location (ref_line);\r
340                         }\r
341                 }\r
342 \r
343                 void define (string def)\r
344                 {\r
345                         if (!RootContext.AllDefines.Contains (def)){\r
346                                 RootContext.AllDefines [def] = true;\r
347                         }\r
348                         if (defines.Contains (def))\r
349                                 return;\r
350                         defines [def] = true;\r
351                 }\r
352                 \r
353                 public Tokenizer (SeekableStreamReader input, SourceFile file, ArrayList defs)\r
354                 {\r
355                         this.ref_name = file;\r
356                         this.file_name = file;\r
357                         reader = input;\r
358                         \r
359                         putback_char = -1;\r
360 \r
361                         if (defs != null){\r
362                                 defines = new Hashtable ();\r
363                                 foreach (string def in defs)\r
364                                         define (def);\r
365                         }\r
366 \r
367                         //\r
368                         // FIXME: This could be `Location.Push' but we have to\r
369                         // find out why the MS compiler allows this\r
370                         //\r
371                         Mono.CSharp.Location.Push (file);\r
372                 }\r
373 \r
374                 public static void Cleanup () {\r
375                         identifiers = null;\r
376                 }\r
377 \r
378                 bool is_identifier_start_character (char c)\r
379                 {\r
380                         return (c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z') || c == '_' || Char.IsLetter (c);\r
381                 }\r
382 \r
383                 bool is_identifier_part_character (char c)\r
384                 {\r
385                         return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || (c >= '0' && c <= '9') || Char.IsLetter (c);\r
386                 }\r
387 \r
388                 int is_punct (char c, ref bool doread)\r
389                 {\r
390                         int d;\r
391                         int t;\r
392 \r
393                         doread = false;\r
394 \r
395                         switch (c){\r
396                         case '{':\r
397                                 return Token.OPEN_BRACE;\r
398                         case '}':\r
399                                 return Token.CLOSE_BRACE;\r
400                         case '[':\r
401                                 return Token.OPEN_BRACKET;\r
402                         case ']':\r
403                                 return Token.CLOSE_BRACKET;\r
404                         case '(':\r
405                                 return Token.OPEN_PARENS;\r
406                         case ')': {\r
407                                 if (deambiguate_close_parens == 0)\r
408                                         return Token.CLOSE_PARENS;\r
409 \r
410                                 --deambiguate_close_parens;\r
411 \r
412                                 // Save current position and parse next token.\r
413                                 int old = reader.Position;\r
414                                 int new_token = token ();\r
415                                 reader.Position = old;\r
416                                 putback_char = -1;\r
417 \r
418                                 if (new_token == Token.OPEN_PARENS)\r
419                                         return Token.CLOSE_PARENS_OPEN_PARENS;\r
420                                 else if (new_token == Token.MINUS)\r
421                                         return Token.CLOSE_PARENS_MINUS;\r
422                                 else if (IsCastToken (new_token))\r
423                                         return Token.CLOSE_PARENS_CAST;\r
424                                 else\r
425                                         return Token.CLOSE_PARENS_NO_CAST;\r
426                         }\r
427 \r
428                         case ',':\r
429                                 return Token.COMMA;\r
430                         case ':':\r
431                                 return Token.COLON;\r
432                         case ';':\r
433                                 return Token.SEMICOLON;\r
434                         case '~':\r
435                                 return Token.TILDE;\r
436                         case '?':\r
437                                 return Token.INTERR;\r
438                         }\r
439 \r
440                         d = peekChar ();\r
441                         if (c == '+'){\r
442                                 \r
443                                 if (d == '+')\r
444                                         t = Token.OP_INC;\r
445                                 else if (d == '=')\r
446                                         t = Token.OP_ADD_ASSIGN;\r
447                                 else\r
448                                         return Token.PLUS;\r
449                                 doread = true;\r
450                                 return t;\r
451                         }\r
452                         if (c == '-'){\r
453                                 if (d == '-')\r
454                                         t = Token.OP_DEC;\r
455                                 else if (d == '=')\r
456                                         t = Token.OP_SUB_ASSIGN;\r
457                                 else if (d == '>')\r
458                                         t = Token.OP_PTR;\r
459                                 else\r
460                                         return Token.MINUS;\r
461                                 doread = true;\r
462                                 return t;\r
463                         }\r
464 \r
465                         if (c == '!'){\r
466                                 if (d == '='){\r
467                                         doread = true;\r
468                                         return Token.OP_NE;\r
469                                 }\r
470                                 return Token.BANG;\r
471                         }\r
472 \r
473                         if (c == '='){\r
474                                 if (d == '='){\r
475                                         doread = true;\r
476                                         return Token.OP_EQ;\r
477                                 }\r
478                                 return Token.ASSIGN;\r
479                         }\r
480 \r
481                         if (c == '&'){\r
482                                 if (d == '&'){\r
483                                         doread = true;\r
484                                         return Token.OP_AND;\r
485                                 } else if (d == '='){\r
486                                         doread = true;\r
487                                         return Token.OP_AND_ASSIGN;\r
488                                 }\r
489                                 return Token.BITWISE_AND;\r
490                         }\r
491 \r
492                         if (c == '|'){\r
493                                 if (d == '|'){\r
494                                         doread = true;\r
495                                         return Token.OP_OR;\r
496                                 } else if (d == '='){\r
497                                         doread = true;\r
498                                         return Token.OP_OR_ASSIGN;\r
499                                 }\r
500                                 return Token.BITWISE_OR;\r
501                         }\r
502 \r
503                         if (c == '*'){\r
504                                 if (d == '='){\r
505                                         doread = true;\r
506                                         return Token.OP_MULT_ASSIGN;\r
507                                 }\r
508                                 return Token.STAR;\r
509                         }\r
510 \r
511                         if (c == '/'){\r
512                                 if (d == '='){\r
513                                         doread = true;\r
514                                         return Token.OP_DIV_ASSIGN;\r
515                                 }\r
516                                 return Token.DIV;\r
517                         }\r
518 \r
519                         if (c == '%'){\r
520                                 if (d == '='){\r
521                                         doread = true;\r
522                                         return Token.OP_MOD_ASSIGN;\r
523                                 }\r
524                                 return Token.PERCENT;\r
525                         }\r
526 \r
527                         if (c == '^'){\r
528                                 if (d == '='){\r
529                                         doread = true;\r
530                                         return Token.OP_XOR_ASSIGN;\r
531                                 }\r
532                                 return Token.CARRET;\r
533                         }\r
534 \r
535                         if (c == '<'){\r
536                                 if (d == '<'){\r
537                                         getChar ();\r
538                                         d = peekChar ();\r
539 \r
540                                         if (d == '='){\r
541                                                 doread = true;\r
542                                                 return Token.OP_SHIFT_LEFT_ASSIGN;\r
543                                         }\r
544                                         return Token.OP_SHIFT_LEFT;\r
545                                 } else if (d == '='){\r
546                                         doread = true;\r
547                                         return Token.OP_LE;\r
548                                 }\r
549                                 return Token.OP_LT;\r
550                         }\r
551 \r
552                         if (c == '>'){\r
553                                 if (d == '>'){\r
554                                         getChar ();\r
555                                         d = peekChar ();\r
556 \r
557                                         if (d == '='){\r
558                                                 doread = true;\r
559                                                 return Token.OP_SHIFT_RIGHT_ASSIGN;\r
560                                         }\r
561                                         return Token.OP_SHIFT_RIGHT;\r
562                                 } else if (d == '='){\r
563                                         doread = true;\r
564                                         return Token.OP_GE;\r
565                                 }\r
566                                 return Token.OP_GT;\r
567                         }\r
568                         return Token.ERROR;\r
569                 }\r
570 \r
571                 int deambiguate_close_parens = 0;\r
572 \r
573                 public void Deambiguate_CloseParens ()\r
574                 {\r
575                         putback (')');\r
576                         deambiguate_close_parens++;\r
577                 }\r
578 \r
579                 void Error_NumericConstantTooLong ()\r
580                 {\r
581                         Report.Error (1021, Location, "Numeric constant too long");                     \r
582                 }\r
583                 \r
584                 bool decimal_digits (int c)\r
585                 {\r
586                         int d;\r
587                         bool seen_digits = false;\r
588                         \r
589                         if (c != -1){\r
590                                 if (number_pos == max_number_size)\r
591                                         Error_NumericConstantTooLong ();\r
592                                 number_builder [number_pos++] = (char) c;\r
593                         }\r
594                         \r
595                         //\r
596                         // We use peekChar2, because decimal_digits needs to do a \r
597                         // 2-character look-ahead (5.ToString for example).\r
598                         //\r
599                         while ((d = peekChar2 ()) != -1){\r
600                                 if (d >= '0' && d <= '9'){\r
601                                         if (number_pos == max_number_size)\r
602                                                 Error_NumericConstantTooLong ();\r
603                                         number_builder [number_pos++] = (char) d;\r
604                                         getChar ();\r
605                                         seen_digits = true;\r
606                                 } else\r
607                                         break;\r
608                         }\r
609                         \r
610                         return seen_digits;\r
611                 }\r
612 \r
613                 bool is_hex (int e)\r
614                 {\r
615                         return (e >= '0' && e <= '9') || (e >= 'A' && e <= 'F') || (e >= 'a' && e <= 'f');\r
616                 }\r
617                 \r
618                 void hex_digits (int c)\r
619                 {\r
620                         if (c != -1)\r
621                                 number_builder [number_pos++] = (char) c;\r
622                         \r
623                 }\r
624                 \r
625                 int real_type_suffix (int c)\r
626                 {\r
627                         int t;\r
628 \r
629                         switch (c){\r
630                         case 'F': case 'f':\r
631                                 t =  Token.LITERAL_FLOAT;\r
632                                 break;\r
633                         case 'D': case 'd':\r
634                                 t = Token.LITERAL_DOUBLE;\r
635                                 break;\r
636                         case 'M': case 'm':\r
637                                  t= Token.LITERAL_DECIMAL;\r
638                                 break;\r
639                         default:\r
640                                 return Token.NONE;\r
641                         }\r
642                         return t;\r
643                 }\r
644 \r
//
// Consumes the optional U/u/L/l suffix that follows an integer
// literal and stores the literal in `val', boxed as the narrowest
// type the suffix allows.
//
// `ul' is the literal's magnitude; `c' is the next unread input
// character, or -1 to skip suffix scanning altogether.
// Always returns Token.LITERAL_INTEGER.
//
int integer_type_suffix (ulong ul, int c)
{
        bool is_unsigned = false;
        bool is_long = false;

        if (c != -1){
                for (bool more = true; more; ){
                        if (c == 'U' || c == 'u'){
                                // A repeated suffix letter is still consumed, but ends the scan.
                                if (is_unsigned)
                                        more = false;
                                is_unsigned = true;
                                getChar ();
                        } else if (c == 'L' || c == 'l'){
                                //
                                // Lower-case `l' with no `u' seen before it
                                // earns the readability warning.
                                //
                                if (c == 'l' && !is_unsigned){
                                        Report.Warning (
                                                78, Location,
                                                "the 'l' suffix is easily confused with digit `1'," +
                                                " use 'L' for clarity");
                                }
                                if (is_long)
                                        more = false;
                                is_long = true;
                                getChar ();
                        } else {
                                more = false;
                        }

                        // Refresh the look-ahead on every pass, including the last one.
                        c = peekChar ();
                }
        }

        bool beyond_32_bits = ul > UInt32.MaxValue;

        if (is_unsigned){
                // `UL': always ulong.  `U': uint if possible, ulong otherwise.
                if (is_long || beyond_32_bits)
                        val = ul;
                else
                        val = (uint) ul;
        } else if (is_long || beyond_32_bits){
                // long if possible, ulong otherwise
                if (ul > (ulong) Int64.MaxValue)
                        val = ul;
                else
                        val = (long) ul;
        } else if (ul > (ulong) Int32.MaxValue){
                // fits in 32 bits but not in a signed int
                val = (uint) ul;
        } else {
                val = (int) ul;
        }

        return Token.LITERAL_INTEGER;
}
723                                 \r
//
// Converts the decimal digits collected in `number_builder' into a
// value and hands it, together with `c' (the next unread input
// character, or -1), to integer_type_suffix, which picks the final
// representation.
//
// Nine digits or fewer are accumulated in a uint (999,999,999 fits);
// longer literals are accumulated in a ulong.  An arithmetic
// overflow is reported as error 1021 and the token value becomes 0.
//
int adjust_int (int c)
{
        try {
                int idx = 1;

                if (number_pos > 9){
                        ulong wide = (uint) (number_builder [0] - '0');

                        while (idx < number_pos){
                                wide = checked ((wide * 10) + ((uint)(number_builder [idx] - '0')));
                                idx++;
                        }
                        return integer_type_suffix (wide, c);
                }

                uint narrow = (uint) (number_builder [0] - '0');

                while (idx < number_pos){
                        narrow = checked ((narrow * 10) + ((uint)(number_builder [idx] - '0')));
                        idx++;
                }
                return integer_type_suffix (narrow, c);
        } catch (OverflowException) {
                error_details = "Integral constant is too large";
                Report.Error (1021, Location, error_details);
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }
}
754                 \r
//
// Reports error 594 for a real literal that does not fit in
// `type_name' and stores `fallback' as the token value.
//
void Error_RealConstantOutOfRange (string type_name, object fallback)
{
        val = fallback;
        error_details = "Floating-point constant is outside the range of the type '" + type_name + "'";
        Report.Error (594, Location, error_details);
}

//
// Parses the text collected in `number_builder' as a real literal of
// the kind selected by `t' (a Token.LITERAL_* value, or Token.NONE
// for an unsuffixed literal, which is treated as double) and stores
// the result in `val'.
//
// Returns the literal's token; Token.NONE is mapped to
// Token.LITERAL_DOUBLE.  Any other `t' is returned untouched and
// `val' is left alone.
//
int adjust_real (int t)
{
        string s = new String (number_builder, 0, number_pos);

        switch (t){
        case Token.LITERAL_DECIMAL:
                try {
                        val = System.Decimal.Parse (s, styles, csharp_format_info);
                } catch (OverflowException) {
                        Error_RealConstantOutOfRange ("decimal", 0m);
                }
                break;

        case Token.LITERAL_FLOAT:
                try {
                        float f = (float) System.Double.Parse (s, styles, csharp_format_info);

                        //
                        // Narrowing an out-of-range double to float yields
                        // an infinity instead of throwing.  A literal can
                        // never spell infinity, so this means overflow.
                        //
                        if (Single.IsInfinity (f))
                                Error_RealConstantOutOfRange ("float", 0.0f);
                        else
                                val = f;
                } catch (OverflowException) {
                        Error_RealConstantOutOfRange ("float", 0.0f);
                }
                break;

        case Token.LITERAL_DOUBLE:
        case Token.NONE:
                t = Token.LITERAL_DOUBLE;
                try {
                        double d = System.Double.Parse (s, styles, csharp_format_info);

                        // Some runtimes return an infinity rather than throwing.
                        if (Double.IsInfinity (d))
                                Error_RealConstantOutOfRange ("double", 0.0);
                        else
                                val = d;
                } catch (OverflowException) {
                        Error_RealConstantOutOfRange ("double", 0.0);
                }
                break;
        }
        return t;
}
793 \r
//
// Scans a hexadecimal integer literal.  is_number calls this after
// reading the leading `0' and peeking at the `x'/`X'.
//
// The hex digits are collected in `number_builder', converted, and
// passed to integer_type_suffix, which consumes any U/L suffix and
// stores the value in `val'.  On error the value is set to 0 and
// Token.LITERAL_INTEGER is still returned.
//
int handle_hex ()
{
        int d;
        ulong ul;

        // Drop the pending `x' / `X'.
        getChar ();
        while ((d = peekChar ()) != -1 && is_hex (d)){
                // Same bound check is_number performs before writing to the buffer.
                if (number_pos == max_number_size)
                        Error_NumericConstantTooLong ();
                number_builder [number_pos++] = (char) d;
                getChar ();
        }

        //
        // "0x" with no digits: parsing the empty string would throw a
        // FormatException that nothing catches, so report it here.
        //
        if (number_pos == 0){
                error_details = "Invalid number";
                Report.Error (1013, Location, error_details);
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }

        string s = new String (number_builder, 0, number_pos);
        try {
                // Up to eight hex digits always fit in 32 bits.
                if (number_pos <= 8)
                        ul = System.UInt32.Parse (s, NumberStyles.HexNumber);
                else
                        ul = System.UInt64.Parse (s, NumberStyles.HexNumber);
        } catch (OverflowException){
                error_details = "Integral constant is too large";
                Report.Error (1021, Location, error_details);
                val = 0ul;
                return Token.LITERAL_INTEGER;
        }

        return integer_type_suffix (ul, peekChar ());
}
823 \r
//
// Invoked if we know we have .digits or digits
//
// `c' is the first character of the literal.  The digits, fraction
// and exponent are collected in `number_builder'; the literal is
// then classified and converted by handle_hex, adjust_int or
// adjust_real.  Returns the token produced by whichever of those
// handled the literal.
//
int is_number (int c)
{
        bool is_real = false;

        number_pos = 0;

        if (c >= '0' && c <= '9'){
                if (c == '0'){
                        int peek = peekChar ();

                        if (peek == 'x' || peek == 'X')
                                return handle_hex ();
                }
                decimal_digits (c);
                c = getChar ();
        }

        //
        // We need to handle the case of
        // "1.1" vs "1.string" (LITERAL_FLOAT vs NUMBER DOT IDENTIFIER)
        //
        if (c == '.'){
                if (decimal_digits ('.')){
                        is_real = true;
                        c = getChar ();
                } else {
                        // Not a fraction: give the dot back and drop it from the buffer.
                        putback ('.');
                        number_pos--;
                        return adjust_int (-1);
                }
        }

        if (c == 'e' || c == 'E'){
                is_real = true;
                if (number_pos == max_number_size)
                        Error_NumericConstantTooLong ();
                number_builder [number_pos++] = 'e';
                c = getChar ();

                //
                // The exponent is always stored with an explicit sign.
                // When the sign was present in the input, `c' is set to
                // -1 so that it is not handed to decimal_digits.
                //
                if (number_pos == max_number_size)
                        Error_NumericConstantTooLong ();
                if (c == '-'){
                        number_builder [number_pos++] = '-';
                        c = -1;
                } else {
                        number_builder [number_pos++] = '+';
                        if (c == '+')
                                c = -1;
                }

                decimal_digits (c);
                c = getChar ();
        }

        int type = real_type_suffix (c);

        if (type == Token.NONE){
                // `c' is not a suffix, so it belongs to whatever comes next.
                putback (c);
                if (!is_real)
                        return adjust_int (c);
        }

        // A fraction, an exponent or a real suffix makes the literal real.
        return adjust_real (type);
}
904 \r
//
// Reads the hex digits of an escape sequence.
//
// The first character read is discarded (escape calls this while the
// escape letter is still pending).  With `count' of 4 or 8 exactly
// that many hex digits are required; with `count' of -1 between one
// and four digits are accepted, stopping at the first non-hex
// character.
//
// Returns the decoded value.  `error' is set, and 0 returned, when a
// required digit is missing or the value is above 0x10FFFF.
//
int getHex (int count, out bool error)
{
        //
        // Accumulate in a long: eight hex digits can exceed
        // Int32.MaxValue and would otherwise wrap, down to -1 for
        // FFFFFFFF, the same value getChar/peekChar use for end of input.
        //
        long total = 0;
        int top = count != -1 ? count : 4;

        // Skip the pending escape letter.
        getChar ();
        error = false;
        for (int i = 0; i < top; i++){
                int c = getChar ();
                int digit;

                if (c >= '0' && c <= '9')
                        digit = c - '0';
                else if (c >= 'A' && c <= 'F')
                        digit = c - 'A' + 10;
                else if (c >= 'a' && c <= 'f')
                        digit = c - 'a' + 10;
                else {
                        error = true;
                        return 0;
                }

                total = (total * 16) + digit;
                if (count == -1){
                        // Variable-length form: stop before the first non-hex character.
                        int p = peekChar ();
                        if (p == -1)
                                break;
                        if (!is_hex ((char)p))
                                break;
                }
        }

        // Nothing above U+10FFFF is a valid code point.
        if (total > 0x10FFFF){
                error = true;
                return 0;
        }
        return (int) total;
}
942 \r
//
// Translates an escape sequence.  `c' is the character just read; if
// it is not a backslash it is returned unchanged.  Otherwise the
// character after it selects the escape: simple escapes are consumed
// and mapped to their value, \x, \u and \U are decoded by getHex.
//
// An unknown or malformed escape reports error 1009 and returns the
// character that followed the backslash.
//
int escape (int c)
{
        // Position-matched tables: escape letter -> character value.
        const string simple_keys   = "abntvr\\f0\"'";
        const string simple_values = "\a\b\n\t\v\r\\\f\0\"'";

        // The look-ahead is taken even when `c' is not a backslash.
        int next = peekChar ();
        if (c != '\\')
                return c;

        // Digit-count argument for getHex; 0 means "not a hex escape".
        int hex_digits = 0;
        if (next == 'x')
                hex_digits = -1;
        else if (next == 'u')
                hex_digits = 4;
        else if (next == 'U')
                hex_digits = 8;

        if (hex_digits != 0){
                bool bad;
                int code = getHex (hex_digits, out bad);

                if (!bad)
                        return code;
        } else {
                int slot = next < 0 ? -1 : simple_keys.IndexOf ((char) next);

                if (slot >= 0){
                        getChar ();
                        return simple_values [slot];
                }
        }

        Report.Error (1009, Location, "Unrecognized escape sequence in " + (char)next);
        return next;
}
998 \r
//
// Returns the next input character: the pending put-back character
// if there is one (clearing it), otherwise a fresh read from
// `reader'.
//
int getChar ()
{
        if (putback_char == -1)
                return reader.Read ();

        int pending = putback_char;
        putback_char = -1;
        return pending;
}
1009 \r
//
// Returns the next input character without consuming it.  If no
// character is pending, one is read from `reader' and parked in
// `putback_char' so that the next getChar returns it.
//
int peekChar ()
{
        if (putback_char == -1)
                putback_char = reader.Read ();

        return putback_char;
}
1017 \r
//
// Like peekChar, but never touches `putback_char': when nothing is
// pending it asks `reader' to peek instead of reading.
//
int peekChar2 ()
{
        return putback_char != -1 ? putback_char : reader.Peek ();
}
1024                 \r
//
// Pushes `c' back so the next getChar/peekChar returns it.  Only one
// character can be pending; a second put-back dumps the tokenizer
// position to the console and throws.
//
void putback (int c)
{
        if (putback_char == -1){
                putback_char = c;
                return;
        }

        Console.WriteLine ("Col: " + col);
        Console.WriteLine ("Row: " + line);
        Console.WriteLine ("Name: " + ref_name.Name);
        Console.WriteLine ("Current [{0}] putting back [{1}]  ", putback_char, c);
        throw new Exception ("This should not happen putback on putback");
}
1036 \r
//
// Returns true while there is still input left, i.e. the next
// character is not the -1 end-of-input marker.
//
public bool advance ()
{
        int next = peekChar ();

        return next != -1;
}
1041 \r
//
// The value stored in `val' by the scanner (for example the boxed
// number of a numeric literal).
//
public Object Value {
        get { return val; }
}
1047 \r
//
// Method form of the Value property; returns the same object.
// NOTE(review): presumably required by the yyParser.yyInput
// interface this class implements -- confirm.
//
public Object value ()
{
        return Value;
}
1052 \r
//
// Returns true when `token' is one of the tokens listed below.
// NOTE(review): judging by the name, these are the tokens that may
// follow a parenthesized type in a cast expression -- confirm
// against the caller.
//
bool IsCastToken (int token)
{
        bool listed;

        switch (token) {
        // unary operators
        case Token.BANG:
        case Token.TILDE:

        // identifiers and literals
        case Token.IDENTIFIER:
        case Token.LITERAL_CHARACTER:
        case Token.LITERAL_DECIMAL:
        case Token.LITERAL_DOUBLE:
        case Token.LITERAL_FLOAT:
        case Token.LITERAL_INTEGER:
        case Token.LITERAL_STRING:

        // keywords
        case Token.BASE:
        case Token.CHECKED:
        case Token.FALSE:
        case Token.FIXED:
        case Token.NEW:
        case Token.NULL:
        case Token.SIZEOF:
        case Token.THIS:
        case Token.THROW:
        case Token.TRUE:
        case Token.TYPEOF:
        case Token.UNCHECKED:
        case Token.UNSAFE:

        //
        // These can be part of a member access
        //
        case Token.CHAR:
        case Token.DOUBLE:
        case Token.FLOAT:
        case Token.INT:
        case Token.LONG:
        case Token.SHORT:
        case Token.UINT:
        case Token.ULONG:
        case Token.USHORT:
                listed = true;
                break;

        default:
                listed = false;
                break;
        }

        return listed;
}
1097 \r
//
// Scans the next token with xtoken, remembers it in `current_token'
// and returns it.
//
public int token ()
{
        return current_token = xtoken ();
}
1103 \r
// Scratch buffer shared by every get_cmd_arg call.
static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();

//
// Splits the rest of a pre-processor line into the directive name
// (`cmd': everything up to the first blank, tab, CR or LF) and its
// argument (`arg': the remainder of the line, trimmed; "" when there
// is none).
//
// Resets `tokens_seen'.  `line' and `ref_line' are bumped when the
// terminating LF is consumed, and `col' is reset on a CR.
//
void get_cmd_arg (out string cmd, out string arg)
{
        int c;

        tokens_seen = false;
        arg = "";
        static_cmd_arg.Length = 0;

        while ((c = getChar ()) != -1 && (c != '\n') && (c != ' ') && (c != '\t') && (c != '\r')){
                static_cmd_arg.Append ((char) c);
        }

        cmd = static_cmd_arg.ToString ();

        // Input ended right after the directive name: there is no argument.
        if (c == -1)
                return;

        if (c == '\n'){
                line++;
                ref_line++;
                return;
        } else if (c == '\r')
                col = 0;

        // skip over white space
        while ((c = getChar ()) != -1 && ((c == '\r') || (c == ' ') || (c == '\t')))
                ;

        //
        // Input ended inside the white space.  Without this check the
        // -1 marker would be cast to a char and returned as the argument.
        //
        if (c == -1)
                return;

        if (c == '\n'){
                line++;
                ref_line++;
                return;
        }

        // `c' is the first character of the argument.
        static_cmd_arg.Length = 0;
        static_cmd_arg.Append ((char) c);

        while ((c = getChar ()) != -1 && (c != '\n') && (c != '\r')){
                static_cmd_arg.Append ((char) c);
        }

        if (c == '\n'){
                line++;
                ref_line++;
        } else if (c == '\r')
                col = 0;
        arg = static_cmd_arg.ToString ().Trim ();
}
1154 \r
//
// Handles the #line directive
//
// `arg' is the directive's argument: "default", a line number, or a
// line number followed by a (possibly quoted) file name.  Updates
// `ref_line' and, when a file is named or "default" is given,
// `ref_name' (which is also pushed on Location).
//
// Returns false when the argument is empty or cannot be processed.
//
bool PreProcessLine (string arg)
{
        if (arg == "")
                return false;

        if (arg == "default"){
                ref_line = line;
                ref_name = file_name;
                Location.Push (ref_name);
                return true;
        }

        try {
                // The number and the file name may be separated by blanks or tabs.
                char [] separators = { ' ', '\t' };
                int pos = arg.IndexOfAny (separators);

                if (pos > 0){
                        ref_line = System.Int32.Parse (arg.Substring (0, pos));

                        char [] quotes = { '\"' };

                        //
                        // Strip the white space first.  With more than one
                        // separator the opening quote is not the first
                        // character, and Trim (quotes) would leave it in.
                        //
                        string name = arg.Substring (pos).Trim ().Trim (quotes);
                        ref_name = Location.LookupFile (name);
                        Location.Push (ref_name);
                } else {
                        ref_line = System.Int32.Parse (arg);
                }
        } catch {
                // Any failure (bad number, failed file lookup) rejects the directive.
                return false;
        }

        return true;
}
1191 \r
//
// Handles #define and #undef
//
// `arg' is the symbol named by the directive.  It must be a single
// identifier other than `true' or `false'; anything else is reported
// and ignored.  With `is_define' the symbol is passed to define,
// otherwise it is removed from `defines'.
//
void PreProcessDefinition (bool is_define, string arg)
{
        if (arg == "" || arg == "true" || arg == "false"){
                Report.Error (1001, Location, "Missing identifier to pre-processor directive");
                return;
        }

        char[] whitespace = { ' ', '\t' };
        if (arg.IndexOfAny (whitespace) != -1){
                Report.Error (1025, Location, "Single-line comment or end-of-line expected");
                return;
        }

        //
        // Validate the whole name, then report once and stop.  Falling
        // through after a bad first character would still define the
        // symbol and could report the same error twice.
        //
        bool valid = is_identifier_start_character (arg [0]);
        for (int i = 1; valid && i < arg.Length; i++)
                valid = is_identifier_part_character (arg [i]);

        if (!valid){
                Report.Error (1001, Location, "Identifier expected: " + arg);
                return;
        }

        if (is_define){
                if (defines == null)
                        defines = new Hashtable ();
                define (arg);
        } else if (defines != null){
                // Hashtable.Remove does nothing when the key is absent.
                defines.Remove (arg);
        }
}
1229 \r
//
// Evaluates a pre-processor operand: the literals `true' and `false'
// stand for themselves, any other name is true exactly when it is
// present in `defines'.
//
bool eval_val (string s)
{
        switch (s){
        case "true":
                return true;
        case "false":
                return false;
        }

        return defines != null && defines.Contains (s);
}
1244 \r
//
// Parses a primary pre-processor expression from the front of `s':
// either a parenthesized expression or a single identifier.  The
// consumed text is removed from `s'.
//
// Returns the value of the expression.  On a syntax error
// Error_InvalidDirective is called and false is returned.
//
bool pp_primary (ref string s)
{
        s = s.Trim ();

        if (s.Length == 0){
                Error_InvalidDirective ();
                return false;
        }

        char first = s [0];

        if (first == '('){
                s = s.Substring (1);
                bool inner = pp_expr (ref s);

                // The nested expression must be followed by the closing parenthesis.
                if (s.Length == 0 || s [0] != ')'){
                        Error_InvalidDirective ();
                        return false;
                }
                s = s.Substring (1);
                return inner;
        }

        if (!is_identifier_start_character (first)){
                Error_InvalidDirective ();
                return false;
        }

        // Find the end of the identifier.
        int end = 1;
        while (end < s.Length && is_identifier_part_character (s [end]))
                end++;

        bool defined = eval_val (s.Substring (0, end));
        s = s.Substring (end);
        return defined;
}
1286                 \r
//
// Parses a unary pre-processor expression from the front of `s':
// any number of `!' operators followed by a primary expression.
// The consumed text is removed from `s'.
//
// Returns the value of the expression.  On a syntax error
// Error_InvalidDirective is called and false is returned.
//
bool pp_unary (ref string s)
{
        s = s.Trim ();
        int len = s.Length;

        if (len == 0){
                Error_InvalidDirective ();
                return false;
        }

        if (s [0] != '!')
                return pp_primary (ref s);

        // `!=' cannot start an operand.
        if (len > 1 && s [1] == '='){
                Error_InvalidDirective ();
                return false;
        }

        //
        // The operand of `!' is itself a unary expression, so that
        // `!!X' and `! !X' are accepted.
        //
        s = s.Substring (1);
        return !pp_unary (ref s);
}
1307                 \r
//
// Parses an equality-level pre-processor expression: unary operands
// joined by `==' or `!=', evaluated left to right.
//
// `s' holds the unparsed remainder of the directive argument and is
// advanced past everything consumed here.
//
// Reports an invalid directive and returns false for a lone `=' or
// for an `==' that has nothing after it.
//
bool pp_eq (ref string s)
{
        bool va = pp_unary (ref s);

        //
        // Loop so that chains like `A == B != C' are consumed completely;
        // every iteration removes one two-character operator from `s'.
        //
        for (;;){
                s = s.Trim ();
                int len = s.Length;
                if (len == 0)
                        return va;

                if (s [0] == '='){
                        if (len <= 2 || s [1] != '='){
                                Error_InvalidDirective ();
                                return false;
                        }
                        s = s.Substring (2);
                        va = (va == pp_unary (ref s));
                } else if (s [0] == '!' && len > 1 && s [1] == '='){
                        s = s.Substring (2);
                        va = (va != pp_unary (ref s));
                } else
                        return va;
        }
}
1334                 \r
//
// Parses a conjunction: equality-level operands joined by `&&'.
//
// `s' holds the unparsed remainder of the directive argument and is
// advanced past everything consumed here.
//
// Reports an invalid directive and returns false for a single `&'
// or for an `&&' that has nothing after it.
//
bool pp_and (ref string s)
{
        bool va = pp_eq (ref s);

        //
        // Keep consuming operands while another `&&' follows, otherwise
        // `A && B && C' would leave `&& C' behind and be rejected by eval.
        //
        for (;;){
                s = s.Trim ();
                int len = s.Length;

                if (len == 0 || s [0] != '&')
                        return va;

                if (len <= 2 || s [1] != '&'){
                        Error_InvalidDirective ();
                        return false;
                }

                s = s.Substring (2);

                // Not short-circuited: the right operand must always be
                // parsed so that its text is removed from `s'.
                va &= pp_eq (ref s);
        }
}
1354                 \r
//
// Evaluates an expression for `#if' or `#elif'
//
// This is the lowest-precedence level: conjunctions (pp_and) joined
// by `||'.  `s' is advanced past the text that was consumed.  A
// single `|', or a `||' with nothing after it, is reported as an
// invalid directive and yields false.
//
bool pp_expr (ref string s)
{
        bool lhs = pp_and (ref s);

        s = s.Trim ();
        if (s.Length == 0 || s [0] != '|')
                return lhs;

        if (s.Length <= 2 || s [1] != '|'){
                Error_InvalidDirective ();
                return false;
        }

        // Not short-circuited: the right-hand side is always parsed so
        // that its text is consumed from `s'.
        s = s.Substring (2);
        return lhs | pp_expr (ref s);
}
1379 \r
//
// Evaluates a complete pre-processor expression.  Anything other
// than whitespace left over after parsing is reported as an invalid
// directive, and the result is then false.
//
bool eval (string s)
{
        bool result = pp_expr (ref s);

        if (s.Trim ().Length == 0)
                return result;

        Error_InvalidDirective ();
        return false;
}
1391                 \r
//
// Reports error 1517 at the current location.
//
void Error_InvalidDirective ()
{
        const int code = 1517;

        Report.Error (code, Location, "Invalid pre-processor directive");
}
1396 \r
//
// Reports error 1028 at the current location; `extra' is placed in
// parentheses at the end of the message.
//
void Error_UnexpectedDirective (string extra)
{
        string message = "Unexpected processor directive (" + extra + ")";

        Report.Error (1028, Location, message);
}
1403 \r
//
// Reports error 1032 at the current location.
//
void Error_TokensSeen ()
{
        const string message =
                "Cannot define or undefine pre-processor symbols after a token in the file";

        Report.Error (1032, Location, message);
}
1410                 \r
//
// Handles a single pre-processor directive; the directive name and
// its argument are obtained from get_cmd_arg.
//
// #pragma, #line and the conditional directives (#if, #elif, #else,
// #endif, #region, #endregion) are always processed.  #define,
// #undef, #error and #warning are only processed when
// `caller_is_taking' is true.
//
// Every entry on `ifstack' is a bit mask built from TAKING,
// TAKEN_BEFORE, PARENT_TAKING, ELSE_SEEN and REGION and describes
// one open #if or #region.
//
// if true, then the code continues processing the code
// if false, the code stays in a loop until another directive is
// reached.
//
bool handle_preprocessing_directive (bool caller_is_taking)
{
        string cmd, arg;
        bool region_directive = false;

        get_cmd_arg (out cmd, out arg);

        // Eat any trailing whitespaces and single-line comments
        int comment_start = arg.IndexOf ("//");
        if (comment_start != -1)
                arg = arg.Substring (0, comment_start);
        arg = arg.TrimEnd (' ', '\t');

        //
        // The first group of pre-processing instructions is always processed
        //
        switch (cmd){
        case "pragma":
                if (RootContext.V2)
                        return true;
                break;

        case "line":
                if (!PreProcessLine (arg))
                        Report.Error (
                                1576, Location,
                                "Argument to #line directive is missing or invalid");
                return true;

        case "region":
                // A region is tracked as an `#if true' flagged with REGION
                region_directive = true;
                arg = "true";
                goto case "if";

        case "endregion":
                region_directive = true;
                goto case "endif";

        case "if":
                if (arg == ""){
                        Error_InvalidDirective ();
                        return true;
                }
                bool taking = false;
                if (ifstack == null)
                        ifstack = new Stack ();

                // We can only take this branch if the enclosing block is live
                if (ifstack.Count == 0){
                        taking = true;
                } else {
                        int state = (int) ifstack.Peek ();
                        if ((state & TAKING) != 0)
                                taking = true;
                }

                if (eval (arg) && taking){
                        int push = TAKING | TAKEN_BEFORE | PARENT_TAKING;
                        if (region_directive)
                                push |= REGION;
                        ifstack.Push (push);
                        return true;
                } else {
                        int push = (taking ? PARENT_TAKING : 0);
                        if (region_directive)
                                push |= REGION;
                        ifstack.Push (push);
                        return false;
                }

        case "endif":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #endif");
                        return true;
                } else {
                        int pop = (int) ifstack.Pop ();

                        // #if must be closed by #endif, #region by #endregion
                        if (region_directive && ((pop & REGION) == 0))
                                Report.Error (1027, Location, "#endif directive expected");
                        else if (!region_directive && ((pop & REGION) != 0))
                                Report.Error (1038, Location, "#endregion directive expected");

                        if (ifstack.Count == 0)
                                return true;
                        else {
                                // Resume according to the enclosing block
                                int state = (int) ifstack.Peek ();

                                if ((state & TAKING) != 0)
                                        return true;
                                else
                                        return false;
                        }
                }

        case "elif":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #elif");
                        return true;
                } else {
                        int state = (int) ifstack.Peek ();

                        if ((state & REGION) != 0) {
                                Report.Error (1038, Location, "#endregion directive expected");
                                return true;
                        }

                        if ((state & ELSE_SEEN) != 0){
                                Error_UnexpectedDirective ("#elif not valid after #else");
                                return true;
                        }

                        if ((state & (TAKEN_BEFORE | TAKING)) != 0){
                                //
                                // An earlier branch was taken, so this one is
                                // skipped.  TAKING has to be cleared, otherwise a
                                // nested #if inside the skipped branch would see a
                                // live parent and start taking code again.
                                //
                                ifstack.Pop ();
                                ifstack.Push (state & ~TAKING);
                                return false;
                        }

                        if (eval (arg) && ((state & PARENT_TAKING) != 0)){
                                state = (int) ifstack.Pop ();
                                ifstack.Push (state | TAKING | TAKEN_BEFORE);
                                return true;
                        } else
                                return false;
                }

        case "else":
                if (ifstack == null || ifstack.Count == 0){
                        Error_UnexpectedDirective ("no #if for this #else");
                        return true;
                } else {
                        int state = (int) ifstack.Peek ();

                        if ((state & REGION) != 0) {
                                Report.Error (1038, Location, "#endregion directive expected");
                                return true;
                        }

                        if ((state & ELSE_SEEN) != 0){
                                Error_UnexpectedDirective ("#else within #else");
                                return true;
                        }

                        ifstack.Pop ();

                        // The #else branch is live only if no earlier branch
                        // was taken and the enclosing block is live
                        bool ret;
                        if ((state & TAKEN_BEFORE) == 0){
                                ret = ((state & PARENT_TAKING) != 0);
                        } else
                                ret = false;

                        if (ret)
                                state |= TAKING;
                        else
                                state &= ~TAKING;

                        ifstack.Push (state | ELSE_SEEN);

                        return ret;
                }
        }

        //
        // These are only processed if we are in a `taking' block
        //
        if (!caller_is_taking)
                return false;

        switch (cmd){
        case "define":
                if (any_token_seen){
                        Error_TokensSeen ();
                        return true;
                }
                PreProcessDefinition (true, arg);
                return true;

        case "undef":
                if (any_token_seen){
                        Error_TokensSeen ();
                        return true;
                }
                PreProcessDefinition (false, arg);
                return true;

        case "error":
                Report.Error (1029, Location, "#error: '" + arg + "'");
                return true;

        case "warning":
                Report.Warning (1030, Location, "#warning: '" + arg + "'");
                return true;
        }

        Report.Error (1024, Location, "Preprocessor directive expected (got: " + cmd + ")");
        return true;

}
1610 \r
//
// Reads the body of a string literal, up to and including the
// closing double quote, and stores the text in `val'.
//
// `quoted' selects the @"..." form: a doubled "" stands for one
// quote character, escape () is not applied and newlines are
// accepted.  In the regular form a newline is reported as error
// 1010 and each character goes through escape ().
//
// Returns Token.LITERAL_STRING on success, Token.ERROR if escape ()
// fails, or Token.EOF (after reporting error 1039) if the input ends
// before the closing quote.
//
private int consume_string (bool quoted)
{
        string_builder.Length = 0;

        for (;;){
                int ch = getChar ();
                if (ch == -1)
                        break;

                if (ch == '"'){
                        bool doubled = quoted && peekChar () == '"';
                        if (!doubled){
                                val = string_builder.ToString ();
                                return Token.LITERAL_STRING;
                        }

                        // Keep one quote and drop its twin
                        string_builder.Append ('"');
                        getChar ();
                        continue;
                }

                if (ch != '\n')
                        col++;
                else {
                        if (!quoted)
                                Report.Error (1010, Location, "Newline in constant");
                        line++;
                        ref_line++;
                        col = 0;
                }

                if (!quoted){
                        ch = escape (ch);
                        if (ch == -1)
                                return Token.ERROR;
                }
                string_builder.Append ((char) ch);
        }

        Report.Error (1039, Location, "Unterminated string literal");
        return Token.EOF;
}
1648 \r
//
// Reads the rest of an identifier whose first character `s' has
// already been consumed, and classifies it.
//
// Returns the keyword token when the text is a keyword and `quoted'
// is false; otherwise stores the identifier string in `val' and
// returns Token.IDENTIFIER.  Returns Token.ERROR (after reporting
// error 645) when the identifier does not fit in `id_builder'.
//
private int consume_identifier (int s, bool quoted)
{
        int length = 1;

        id_builder [0] = (char) s;

        for (;;){
                int next = reader.Read ();
                if (next == -1)
                        break;

                if (!is_identifier_part_character ((char) next)){
                        // Not ours: keep it around for the next read
                        putback_char = next;
                        break;
                }

                if (length == max_id_size){
                        Report.Error (645, Location, "Identifier too long (limit is 512 chars)");
                        return Token.ERROR;
                }

                id_builder [length++] = (char) next;
                putback_char = -1;
                col++;
        }

        //
        // Optimization: avoids doing the keyword lookup
        // on uppercase letters and _
        //
        if (s >= 'a'){
                int keyword = GetKeyword (id_builder, length);
                if (!quoted && keyword != -1)
                        return keyword;
        }

        //
        // Identifier strings are cached in one table per length so that
        // an identifier seen before does not allocate a new string.
        //
        if (identifiers [length] == null)
                identifiers [length] = new CharArrayHashtable (length);
        else {
                val = identifiers [length][id_builder];
                if (val != null)
                        return Token.IDENTIFIER;
        }

        string name = new String (id_builder, 0, length);
        val = name;

        // The key must be a private copy, id_builder is reused
        char [] key = new char [length];
        Array.Copy (id_builder, key, length);
        identifiers [length] [key] = name;

        return Token.IDENTIFIER;
}
1705                 \r
1706                 public int xtoken ()\r
1707                 {\r
1708                         int t;\r
1709                         bool doread = false;\r
1710                         int c;\r
1711 \r
1712                         val = null;\r
1713                         // optimization: eliminate col and implement #directive semantic correctly.\r
1714                         for (;(c = getChar ()) != -1; col++) {\r
1715                                 if (c == ' ' || c == '\t' || c == '\f' || c == '\v' || c == '\r' || c == 0xa0){\r
1716                                         \r
1717                                         if (c == '\t')\r
1718                                                 col = (((col + 8) / 8) * 8) - 1;\r
1719                                         continue;\r
1720                                 }\r
1721 \r
1722                                 // Handle double-slash comments.\r
1723                                 if (c == '/'){\r
1724                                         int d = peekChar ();\r
1725                                 \r
1726                                         if (d == '/'){\r
1727                                                 getChar ();\r
1728                                                 while ((d = getChar ()) != -1 && (d != '\n') && d != '\r')\r
1729                                                         col++;\r
1730                                                 if (d == '\n'){\r
1731                                                         line++;\r
1732                                                         ref_line++;\r
1733                                                         col = 0;\r
1734                                                 }\r
1735                                                 any_token_seen |= tokens_seen;\r
1736                                                 tokens_seen = false;\r
1737                                                 continue;\r
1738                                         } else if (d == '*'){\r
1739                                                 getChar ();\r
1740 \r
1741                                                 while ((d = getChar ()) != -1){\r
1742                                                         if (d == '*' && peekChar () == '/'){\r
1743                                                                 getChar ();\r
1744                                                                 col++;\r
1745                                                                 break;\r
1746                                                         }\r
1747                                                         if (d == '\n'){\r
1748                                                                 line++;\r
1749                                                                 ref_line++;\r
1750                                                                 col = 0;\r
1751                                                                 any_token_seen |= tokens_seen;\r
1752                                                                 tokens_seen = false;\r
1753                                                         }\r
1754                                                 }\r
1755                                                 continue;\r
1756                                         }\r
1757                                         goto is_punct_label;\r
1758                                 }\r
1759 \r
1760                                 \r
1761                                 if (is_identifier_start_character ((char)c)){\r
1762                                         tokens_seen = true;\r
1763                                         return consume_identifier (c, false);\r
1764                                 }\r
1765 \r
1766                         is_punct_label:\r
1767                                 if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){\r
1768                                         tokens_seen = true;\r
1769                                         if (doread){\r
1770                                                 getChar ();\r
1771                                                 col++;\r
1772                                         }\r
1773                                         return t;\r
1774                                 }\r
1775 \r
1776                                 // white space\r
1777                                 if (c == '\n'){\r
1778                                         line++;\r
1779                                         ref_line++;\r
1780                                         col = 0;\r
1781                                         any_token_seen |= tokens_seen;\r
1782                                         tokens_seen = false;\r
1783                                         continue;\r
1784                                 }\r
1785 \r
1786                                 if (c >= '0' && c <= '9'){\r
1787                                         tokens_seen = true;\r
1788                                         return is_number (c);\r
1789                                 }\r
1790 \r
1791                                 if (c == '.'){\r
1792                                         tokens_seen = true;\r
1793                                         int peek = peekChar ();\r
1794                                         if (peek >= '0' && peek <= '9')\r
1795                                                 return is_number (c);\r
1796                                         return Token.DOT;\r
1797                                 }\r
1798                                 \r
1799                                 /* For now, ignore pre-processor commands */\r
1800                                 // FIXME: In C# the '#' is not limited to appear\r
1801                                 // on the first column.\r
1802                                 if (c == '#' && !tokens_seen){\r
1803                                         bool cont = true;\r
1804                                         \r
1805                                 start_again:\r
1806                                         \r
1807                                         cont = handle_preprocessing_directive (cont);\r
1808 \r
1809                                         if (cont){\r
1810                                                 col = 0;\r
1811                                                 continue;\r
1812                                         }\r
1813                                         col = 1;\r
1814 \r
1815                                         bool skipping = false;\r
1816                                         for (;(c = getChar ()) != -1; col++){\r
1817                                                 if (c == '\n'){\r
1818                                                         col = 0;\r
1819                                                         line++;\r
1820                                                         ref_line++;\r
1821                                                         skipping = false;\r
1822                                                 } else if (c == ' ' || c == '\t' || c == '\v' || c == '\r' || c == 0xa0)\r
1823                                                         continue;\r
1824                                                 else if (c != '#')\r
1825                                                         skipping = true;\r
1826                                                 if (c == '#' && !skipping)\r
1827                                                         goto start_again;\r
1828                                         }\r
1829                                         any_token_seen |= tokens_seen;\r
1830                                         tokens_seen = false;\r
1831                                         if (c == -1)\r
1832                                                 Report.Error (1027, Location, "#endif/#endregion expected");\r
1833                                         continue;\r
1834                                 }\r
1835                                 \r
1836                                 if (c == '"') \r
1837                                         return consume_string (false);\r
1838 \r
1839                                 if (c == '\''){\r
1840                                         c = getChar ();\r
1841                                         tokens_seen = true;\r
1842                                         if (c == '\''){\r
1843                                                 error_details = "Empty character literal";\r
1844                                                 Report.Error (1011, Location, error_details);\r
1845                                                 return Token.ERROR;\r
1846                                         }\r
1847                                         c = escape (c);\r
1848                                         if (c == -1)\r
1849                                                 return Token.ERROR;\r
1850                                         val = new System.Char ();\r
1851                                         val = (char) c;\r
1852                                         c = getChar ();\r
1853 \r
1854                                         if (c != '\''){\r
1855                                                 error_details = "Too many characters in character literal";\r
1856                                                 Report.Error (1012, Location, error_details);\r
1857 \r
1858                                                 // Try to recover, read until newline or next "'"\r
1859                                                 while ((c = getChar ()) != -1){\r
1860                                                         if (c == '\n' || c == '\''){\r
1861                                                                 line++;\r
1862                                                                 ref_line++;\r
1863                                                                 col = 0;\r
1864                                                                 break;\r
1865                                                         } else\r
1866                                                                 col++;\r
1867                                                         \r
1868                                                 }\r
1869                                                 return Token.ERROR;\r
1870                                         }\r
1871                                         return Token.LITERAL_CHARACTER;\r
1872                                 }\r
1873                                 \r
1874                                 if (c == '@') {\r
1875                                         c = getChar ();\r
1876                                         if (c == '"') {\r
1877                                                 tokens_seen = true;\r
1878                                                 return consume_string (true);\r
1879                                         } else if (is_identifier_start_character ((char) c)){\r
1880                                                 return consume_identifier (c, true);\r
1881                                         } else {\r
1882                                                 Report.Error (1033, Location, "'@' must be followed by string constant or identifier");\r
1883                                         }\r
1884                                 }\r
1885 \r
1886                                 if (c == '#') {\r
1887                                         error_details = "Preprocessor directives must appear as the first non-whitespace " +\r
1888                                                 "character on a line.";\r
1889 \r
1890                                         Report.Error (1040, Location, error_details);\r
1891 \r
1892                                         return Token.ERROR;\r
1893                                 }\r
1894 \r
1895                                 error_details = ((char)c).ToString ();\r
1896                                 \r
1897                                 return Token.ERROR;\r
1898                         }\r
1899 \r
1900                         return Token.EOF;\r
1901                 }\r
1902 \r
1903                 public void cleanup ()\r
1904                 {\r
1905                         if (ifstack != null && ifstack.Count >= 1) {\r
1906                                 int state = (int) ifstack.Pop ();\r
1907                                 if ((state & REGION) != 0)\r
1908                                         Report.Error (1038, "#endregion directive expected");\r
1909                                 else \r
1910                                         Report.Error (1027, "#endif directive expected");\r
1911                         }\r
1912                                 \r
1913                 }\r
1914         }\r
1915 }\r
1916 \r