2004-08-06 Bernie Solomon <bernard@ugsolutions.com>
[mono.git] / mcs / mbas / mb-tokenizer.cs
index ff7330e3348e22f2f9a6437b84e233b66d820087..4cfe33c3d50e9a2ae49e9eb5a2c4348830539b52 100644 (file)
@@ -18,7 +18,7 @@ namespace Mono.MonoBASIC
        using System.IO;
        using System.Globalization;
        using Mono.Languages;
-       using Mono.CSharp;
+       using Mono.MonoBASIC;
        
        /// <summary>
        ///    Tokenizer for MonoBASIC source code. 
@@ -27,14 +27,14 @@ namespace Mono.MonoBASIC
        public class Tokenizer : yyParser.yyInput
        {
                TextReader reader;
-               // TODO: public SourceFile file_name;
-               public string file_name;
-               public string ref_name;
-               public int ref_line = 1;
-               public int line = 1;
-               public int col = 1;
-               public int current_token = Token.EOL;
+               string file_name;
+               string ref_name;
+               int ref_line = 0;
+               int line = 0;
+               int col = 1;
+               public int current_token = Token.ERROR;
                bool handle_get_set = false;
+               bool cant_have_a_type_character = false;
 
                public int ExpandedTabsSize = 4; 
 
@@ -70,27 +70,11 @@ namespace Mono.MonoBASIC
                static NumberStyles styles;
                static NumberFormatInfo csharp_format_info;
                
-               //
-               // Pre-processor
-               //
-               Hashtable defines;
-
-               const int TAKING        = 1;
-               const int TAKEN_BEFORE  = 2;
-               const int ELSE_SEEN     = 4;
-               const int PARENT_TAKING = 8;
-               const int REGION        = 16;           
-
-               //
-               // pre-processor if stack state:
-               //
-               Stack ifstack;
-
                //
                // Values for the associated token returned
                //
-               System.Text.StringBuilder number;
-               int putback_char;
+               StringBuilder number;
+               int putback_char = -1;
                Object val;
                
                //
@@ -103,13 +87,45 @@ namespace Mono.MonoBASIC
                                return error_details;
                        }
                }
+
                
+               /// <summary>
+               ///    Name of the source being tokenized (file_name). Assigning it also
+               ///    sets the effective name (ref_name) to the same value and passes the
+               ///    name to Location.SetCurrentSource.
+               /// </summary>
+               public string Source {
+                       get { return file_name; }
+
+                       set {
+                               ref_name = file_name = value;
+                               Location.SetCurrentSource (value);
+                       }
+               }
+
+               /// <summary>
+               ///    The effective source name (ref_name). The setter stores the new name
+               ///    and passes it to Location.SetCurrentSource; file_name is not changed.
+               /// </summary>
+               public string EffectiveSource {
+                       get { return ref_name; }
+
+                       set {
+                               ref_name = value;
+                               Location.SetCurrentSource (value);
+                       }
+               }
+
                public int Line {
                        get {
                                return line;
                        }
                }
 
+               /// <summary>
+               ///    The effective line number (ref_line), which is the line value the
+               ///    Location property is built from. Unlike Line, it can be assigned.
+               /// </summary>
+               public int EffectiveLine {
+                       get { return ref_line; }
+                       set { ref_line = value; }
+               }
+
                public int Col {
                        get {
                                return col;
@@ -129,7 +145,7 @@ namespace Mono.MonoBASIC
                        keywords.Add ("as", Token.AS);
                        keywords.Add ("assembly", Token.ASSEMBLY);
                        keywords.Add ("auto", Token.AUTO);
-                       keywords.Add ("binary", Token.BINARY);
+                       keywords.Add ("binary", Token.BINARY); // Not a VB.NET Keyword 
                        keywords.Add ("boolean", Token.BOOLEAN);
                        keywords.Add ("byref", Token.BYREF);
                        keywords.Add ("byte", Token.BYTE);
@@ -148,37 +164,40 @@ namespace Mono.MonoBASIC
                        keywords.Add ("class", Token.CLASS);
                        keywords.Add ("clng", Token.CLNG);
                        keywords.Add ("cobj", Token.COBJ);
-                       keywords.Add ("compare", Token.COMPARE);
+                       keywords.Add ("compare", Token.COMPARE); // Not a VB.NET Keyword
                        keywords.Add ("const", Token.CONST);
                        keywords.Add ("cshort", Token.CSHORT);
                        keywords.Add ("csng", Token.CSNG);
                        keywords.Add ("cstr", Token.CSTR);
                        keywords.Add ("ctype", Token.CTYPE);
-                       //keywords.Add ("date", Token.DATE);
+                       keywords.Add ("date", Token.DATE);
                        keywords.Add ("decimal", Token.DECIMAL);
                        keywords.Add ("declare", Token.DECLARE);
                        keywords.Add ("default", Token.DEFAULT);
                        keywords.Add ("delegate", Token.DELEGATE);
                        keywords.Add ("dim", Token.DIM);
+                       keywords.Add ("directcast", Token.DIRECTCAST);                  
                        keywords.Add ("do", Token.DO);
                        keywords.Add ("double", Token.DOUBLE);
                        keywords.Add ("each", Token.EACH);
                        keywords.Add ("else", Token.ELSE);
                        keywords.Add ("elseif", Token.ELSEIF);
                        keywords.Add ("end", Token.END);
+                       keywords.Add ("endif", Token.ENDIF); // An unused VB.NET keyword
                        keywords.Add ("enum", Token.ENUM);
                        keywords.Add ("erase", Token.ERASE);
                        keywords.Add ("error", Token.ERROR);
                        keywords.Add ("event", Token.EVENT);
                        keywords.Add ("exit", Token.EXIT);
-                       keywords.Add ("explicit", Token.EXPLICIT);
+                       keywords.Add ("explicit", Token.EXPLICIT); // Not a VB.NET keyword 
                        keywords.Add ("false", Token.FALSE);
                        keywords.Add ("finally", Token.FINALLY);
                        keywords.Add ("for", Token.FOR);
                        keywords.Add ("friend", Token.FRIEND);
                        keywords.Add ("function", Token.FUNCTION);
                        keywords.Add ("get", Token.GET);
-                       //keywords.Add ("gettype", Token.GETTYPE);
+                       keywords.Add ("gettype", Token.GETTYPE);
+                       keywords.Add ("gosub", Token.GOSUB); // An unused VB.NET keyword 
                        keywords.Add ("goto", Token.GOTO);
                        keywords.Add ("handles", Token.HANDLES);
                        keywords.Add ("if", Token.IF);
@@ -189,7 +208,7 @@ namespace Mono.MonoBASIC
                        keywords.Add ("integer", Token.INTEGER);
                        keywords.Add ("interface", Token.INTERFACE);
                        keywords.Add ("is", Token.IS);
-                       keywords.Add ("let ", Token.LET );
+                       keywords.Add ("let ", Token.LET ); // An unused VB.NET keyword
                        keywords.Add ("lib ", Token.LIB );
                        keywords.Add ("like ", Token.LIKE );
                        keywords.Add ("long", Token.LONG);
@@ -209,7 +228,7 @@ namespace Mono.MonoBASIC
                        keywords.Add ("notinheritable", Token.NOTINHERITABLE);
                        keywords.Add ("notoverridable", Token.NOTOVERRIDABLE);
                        keywords.Add ("object", Token.OBJECT);
-                       keywords.Add ("off", Token.OFF);
+                       keywords.Add ("off", Token.OFF); // Not a VB.NET Keyword 
                        keywords.Add ("on", Token.ON);
                        keywords.Add ("option", Token.OPTION);
                        keywords.Add ("optional", Token.OPTIONAL);
@@ -237,16 +256,16 @@ namespace Mono.MonoBASIC
                        keywords.Add ("shared", Token.SHARED);
                        keywords.Add ("short", Token.SHORT);
                        keywords.Add ("single", Token.SINGLE);
-                       keywords.Add ("sizeof", Token.SIZEOF);
+                       keywords.Add ("sizeof", Token.SIZEOF); // Not a VB.NET Keyword 
                        keywords.Add ("static", Token.STATIC);
                        keywords.Add ("step", Token.STEP);
                        keywords.Add ("stop", Token.STOP);
-                       keywords.Add ("strict", Token.STRICT);
+                       keywords.Add ("strict", Token.STRICT); // Not a VB.NET Keyword 
                        keywords.Add ("string", Token.STRING);
                        keywords.Add ("structure", Token.STRUCTURE);
                        keywords.Add ("sub", Token.SUB);
                        keywords.Add ("synclock", Token.SYNCLOCK);
-                       keywords.Add ("text", Token.TEXT);
+                       keywords.Add ("text", Token.TEXT); // Not a VB.NET Keyword
                        keywords.Add ("then", Token.THEN);
                        keywords.Add ("throw", Token.THROW);
                        keywords.Add ("to", Token.TO);
@@ -255,7 +274,8 @@ namespace Mono.MonoBASIC
                        keywords.Add ("typeof", Token.TYPEOF);
                        keywords.Add ("unicode", Token.UNICODE);
                        keywords.Add ("until", Token.UNTIL);
-                       keywords.Add ("variant", Token.VARIANT);
+                       keywords.Add ("variant", Token.VARIANT); // An unused VB.NET keyword
+                       keywords.Add ("wend", Token.WEND); // An unused VB.NET keyword
                        keywords.Add ("when", Token.WHEN);
                        keywords.Add ("while", Token.WHILE);
                        keywords.Add ("with", Token.WITH);
@@ -269,9 +289,6 @@ namespace Mono.MonoBASIC
 
                }
 
-               //
-               // Class initializer
-               // 
                static Tokenizer ()
                {
                        initTokens ();
@@ -280,12 +297,24 @@ namespace Mono.MonoBASIC
                        styles = NumberStyles.AllowExponent | NumberStyles.AllowDecimalPoint;
                }
 
+               /// <summary>
+               ///    Creates a tokenizer over <paramref name="input"/>.
+               /// </summary>
+               /// <param name="input">Text reader stored in the reader field.</param>
+               /// <param name="fname">Source name, assigned through the Source property.</param>
+               /// <param name="defines">Not referenced by this constructor.</param>
+               public Tokenizer (System.IO.TextReader input, string fname, ArrayList defines)
+               {
+                       reader = input;
+                       Source = fname;
+
+                       // Begin the stream with a synthetic end-of-line, so that a pre-processor
+                       // directive placed on the very first line of a vb file follows an EOL.
+                       putback ('\n');
+               }
+
+               //
+               // Returns true when `name' is a keyword. The lookup ignores case: the name
+               // is lower-cased with the invariant culture (so the result does not depend
+               // on the user's locale) before it is looked up in the keywords table.
+               // "get" and "set" are reported as keywords only while handle_get_set is on.
+               //
                bool is_keyword (string name)
                {
                        bool res;
+                       name = name.ToLower (CultureInfo.InvariantCulture);
 
-                       res = keywords.Contains(name.ToLower());
+                       res = keywords.Contains(name);
+                       // name is lower-case here, so it must be compared with lower-case text.
                        if ((name == "get" || name == "set") && handle_get_set == false)
                                return false;
                        return res;
                }
@@ -297,20 +326,10 @@ namespace Mono.MonoBASIC
                
                public Location Location {
                        get {
-                               return new Location (ref_line);
+                               return new Location (ref_line, col);
                        }
                }
                
-               void define (string def)
-               {
-                       if (!RootContext.AllDefines.Contains(def)){
-                               RootContext.AllDefines [def] = true;
-                       }
-                       if (defines.Contains (def))
-                               return;
-                       defines [def] = true;
-               }
-
                public bool PropertyParsing {
                        get {
                                return handle_get_set;
@@ -333,12 +352,15 @@ namespace Mono.MonoBASIC
 
                int is_punct (char c, ref bool doread)
                {
-                       int idx = "{}[](),:;~+-*/%&|^!=<>?".IndexOf (c);
                        int d;
                        int t;
 
                        doread = false;
-
+                       
+                       error_details = c.ToString();
+                       
+                       d = peekChar ();
+                       
                        switch (c){
                        case '[':
                                return Token.OPEN_BRACKET;
@@ -354,17 +376,52 @@ namespace Mono.MonoBASIC
                                return Token.CLOSE_PARENS;
                        case ',':
                                return Token.COMMA;
-                       //case ':':
-                       //      return Token.COLON;
                        case '?':
                                return Token.INTERR;
-                       //case '&':
-                       //      return Token.OP_CONCAT;                         
+                       case '!':
+                               if (is_identifier_start_character((char)d) || cant_have_a_type_character)
+                                       return Token.EXCLAMATION;
+                               return Token.SINGLETYPECHAR;
+                       case '$':
+                               if (cant_have_a_type_character)
+                                       return Token.ERROR;
+                               return Token.DOLAR_SIGN;
+                       case '@':
+                               if (cant_have_a_type_character)
+                                       return Token.ERROR;
+                               return Token.AT_SIGN;
+                       case '%':
+                               if (cant_have_a_type_character)
+                                       return Token.ERROR;
+                               return Token.PERCENT;
+                       case '#':
+                               if(tokens_seen)
+                               {
+                                       if (cant_have_a_type_character) 
+                                               return ExtractDateTimeLiteral();
+                                       else
+                                               return Token.NUMBER_SIGN;
+                               }
+                               else 
+                               {
+                                       tokens_seen = true;
+                                       return Token.HASH;
+                               } 
+                       case '&':
+                               if (!cant_have_a_type_character)
+                                       return Token.LONGTYPECHAR;
+                               t = handle_integer_literal_in_other_bases(d);
+                               if (t == Token.NONE) {
+                                       if (d == '=') {
+                                               doread = true;
+                                               t = Token.OP_CONCAT_ASSIGN;
+                                       } else 
+                                               t = Token.OP_CONCAT;
+                               }
+                               return t;                       
                        }
 
-                       d = peekChar ();
                        if (c == '+'){
-                               
                                if (d == '+')
                                        t = Token.OP_INC;
                                else if (d == '=')
@@ -374,14 +431,6 @@ namespace Mono.MonoBASIC
                                doread = true;
                                return t;
                        }
-                       if (c == '&'){
-                               if (d == '=')
-                                       t = Token.OP_CONCAT_ASSIGN;
-                               else
-                                       return Token.OP_CONCAT;
-                               doread = true;
-                               return t;
-                       }                       
                        if (c == '-'){
                                if (d == '=')
                                        t = Token.OP_SUB_ASSIGN;
@@ -392,10 +441,6 @@ namespace Mono.MonoBASIC
                        }
 
                        if (c == '='){
-                               /*if (d == '='){
-                                       doread = true;
-                                       return Token.OP_EQ;
-                               }*/
                                return Token.ASSIGN;
                        }
 
@@ -441,6 +486,11 @@ namespace Mono.MonoBASIC
                                        doread = true;
                                        return Token.OP_LE;
                                }
+                               if (d == '<')
+                               {
+                                       doread = true;
+                                       return Token.OP_SHIFT_LEFT;
+                               }
                                return Token.OP_LT;
                        }
 
@@ -449,8 +499,14 @@ namespace Mono.MonoBASIC
                                        doread = true;
                                        return Token.OP_GE;
                                }
+                               if (d == '>')
+                               {
+                                       doread = true;
+                                       return Token.OP_SHIFT_RIGHT;
+                               }
                                return Token.OP_GT;
                        }
+                       
                        if (c == ':'){
                                if (d == '='){
                                        doread = true;
@@ -458,6 +514,7 @@ namespace Mono.MonoBASIC
                                }
                                return Token.COLON;
                        }                       
+                       
                        return Token.ERROR;
                }
 
@@ -480,23 +537,6 @@ namespace Mono.MonoBASIC
                        return seen_digits;
                }
 
-               void hex_digits (int c)
-               {
-                       int d;
-
-                       if (c != -1)
-                               number.Append ((char) c);
-                       while ((d = peekChar ()) != -1){
-                               char e = Char.ToUpper ((char) d);
-                               
-                               if (Char.IsDigit (e) ||
-                                   (e >= 'A' && e <= 'F')){
-                                       number.Append ((char) e);
-                                       getChar ();
-                               } else
-                                       break;
-                       }
-               }
                
                int real_type_suffix (int c)
                {
@@ -506,10 +546,10 @@ namespace Mono.MonoBASIC
                        case 'F': case 'f':
                                t =  Token.LITERAL_SINGLE;
                                break;
-                       case 'D': case 'd':
+                       case 'R': case 'r':
                                t = Token.LITERAL_DOUBLE;
                                break;
-                       case 'M': case 'm':
+                       case 'D': case 'd':
                                 t= Token.LITERAL_DECIMAL;
                                break;
                        default:
@@ -521,23 +561,45 @@ namespace Mono.MonoBASIC
 
+               //
+               // Converts `val' according to the integer literal suffix `c' and returns the
+               // token for the literal. S, I and L (either case) convert val to Int16, Int32
+               // and Int64 respectively and the suffix character is read off the input.
+               // With any other character nothing is read: val becomes an Int32 when it
+               // lies within the Int32 range and an Int64 otherwise. An exception raised
+               // while converting is stored in val as text and Token.ERROR is returned.
+               //
                int integer_type_suffix (int c)
                {
-                       // FIXME: Handle U and L suffixes.
-                       // We also need to see in which kind of
-                       // Int the thing fits better according to the spec.
-                       return Token.LITERAL_INTEGER;
+                       try {
+                               bool suffix_present = true;
+
+                               switch (c){
+                               case 'S': case 's':
+                                       val = ((IConvertible) val).ToInt16 (null);
+                                       break;
+                               case 'I': case 'i':
+                                       val = ((IConvertible) val).ToInt32 (null);
+                                       break;
+                               case 'L': case 'l':
+                                       val = ((IConvertible) val).ToInt64 (null);
+                                       break;
+                               default:
+                                       suffix_present = false;
+
+                                       long literal_value = (long) val;
+                                       if (literal_value > System.Int32.MaxValue ||
+                                               literal_value < System.Int32.MinValue)
+                                               val = ((IConvertible) val).ToInt64 (null);
+                                       else
+                                               val = ((IConvertible) val).ToInt32 (null);
+                                       break;
+                               }
+
+                               // Only an explicit suffix character is consumed.
+                               if (suffix_present)
+                                       getChar ();
+
+                               // Short, Integer and Long literals all share one token for now.
+                               return Token.LITERAL_INTEGER;
+                       } catch (Exception e) {
+                               val = e.ToString ();
+                               return Token.ERROR;
+                       }
                }
                
-               void adjust_int (int t)
-               {
-                       val = new System.Int32();
-                       val = System.Int32.Parse (number.ToString (), 0);
-               }
-
                int adjust_real (int t)
                {
                        string s = number.ToString ();
 
-                       Console.WriteLine (s);
                        switch (t){
                        case Token.LITERAL_DECIMAL:
                                val = new System.Decimal ();
@@ -565,42 +627,89 @@ namespace Mono.MonoBASIC
                        return t;
                }
 
+               //
+               // Reads the run of hexadecimal digits at the current input position and
+               // returns its value. Only the ASCII characters 0-9, a-f and A-F count as
+               // digits; the first other character ends the run and is not consumed.
+               //
+               // Int64.Parse raises FormatException when the run is empty and
+               // OverflowException when the digits do not fit in 64 bits.
+               //
+               long hex_digits ()
+               {
+                       StringBuilder hexNumber = new StringBuilder ();
+                       int d;
+
+                       while ((d = peekChar ()) != -1){
+                               char e = (char) d;
+
+                               // Char.IsDigit is not used: it also accepts non-ASCII decimal
+                               // digits, which Int64.Parse rejects under NumberStyles.HexNumber.
+                               bool is_hex = (e >= '0' && e <= '9') ||
+                                             (e >= 'a' && e <= 'f') ||
+                                             (e >= 'A' && e <= 'F');
+                               if (!is_hex)
+                                       break;
+
+                               hexNumber.Append (e);
+                               getChar ();
+                       }
+
+                       return System.Int64.Parse (hexNumber.ToString (), NumberStyles.HexNumber,
+                                                  CultureInfo.InvariantCulture);
+               }
+
+               //
+               // Reads the run of octal digits (0-7) at the current input position and
+               // returns the accumulated value, or zero when no octal digit is present.
+               // The first character that is not an octal digit is not consumed.
+               //
+               long octal_digits ()
+               {
+                       long total = 0;
+
+                       for (int d = peekChar (); d != -1; d = peekChar ()){
+                               char digit = (char) d;
+
+                               if (digit < '0' || digit > '7')
+                                       break;
+
+                               total = total * 8 + (d - (int)'0');
+                               getChar ();
+                       }
+
+                       return total;
+               }
+
+               //
+               // Called after a '&' with `peek' holding the character that follows it.
+               // "&H" introduces a hexadecimal literal and "&O" an octal one (either
+               // case): the base letter and the digits are consumed, val receives the
+               // value, and the token chosen by integer_type_suffix is returned.
+               // Returns Token.NONE, consuming nothing, when `peek' is not a base letter.
+               //
+               // A literal whose digits cannot be parsed (for instance "&H" with no hex
+               // digit after it, or a value too large for 64 bits) yields Token.ERROR with
+               // the exception text in val, the way integer_type_suffix reports failures,
+               // instead of letting the exception escape from the tokenizer.
+               //
+               int handle_integer_literal_in_other_bases(int peek)
+               {
+                       bool is_hex = (peek == 'h' || peek == 'H');
+                       bool is_octal = (peek == 'o' || peek == 'O');
+
+                       if (!is_hex && !is_octal)
+                               return Token.NONE;
+
+                       getChar ();     // consume the base letter
+
+                       try {
+                               if (is_hex)
+                                       val = hex_digits ();
+                               else
+                                       val = octal_digits ();
+                       } catch (FormatException e) {
+                               val = e.ToString ();
+                               return Token.ERROR;
+                       } catch (OverflowException e) {
+                               val = e.ToString ();
+                               return Token.ERROR;
+                       }
+
+                       return integer_type_suffix (peekChar ());
+               }
+               
                //
                // Invoked if we know we have .digits or digits
                //
                int is_number (int c)
                {
                        bool is_real = false;
-                       number = new System.Text.StringBuilder ();
+                       number = new StringBuilder ();
                        int type;
 
                        number.Length = 0;
 
                        if (Char.IsDigit ((char)c)){
-                               if (c == '0' && peekChar () == 'x' || peekChar () == 'X'){
-                                       getChar ();
-                                       hex_digits (-1);
-                                       val = new System.Int32 ();
-                                       val = System.Int32.Parse (number.ToString (), NumberStyles.HexNumber);
-                                       return integer_type_suffix (peekChar ());
-                               }
                                decimal_digits (c);
-                               c = getChar ();
+                               c = peekChar ();
                        }
 
                        //
                        // We need to handle the case of
-                       // "1.1" vs "1.string" (LITERAL_SINGLE vs NUMBER DOT IDENTIFIER)
+                       // "1.1" vs "1.ToString()" (LITERAL_SINGLE vs NUMBER DOT IDENTIFIER)
                        //
                        if (c == '.'){
-                               if (decimal_digits ('.')){
+                               if (decimal_digits (getChar())){
                                        is_real = true;
                                        c = peekChar ();
                                } else {
                                        putback ('.');
                                        number.Length -= 1;
-                                       adjust_int (Token.LITERAL_INTEGER);
-                                       return Token.LITERAL_INTEGER;
+                                       val = System.Int64.Parse(number.ToString());
+                                       return integer_type_suffix('.');
                                }
                        }
                        
@@ -625,25 +734,13 @@ namespace Mono.MonoBASIC
 
                        type = real_type_suffix (c);
                        if (type == Token.NONE && !is_real){
-                               type = integer_type_suffix (c);
-                               adjust_int (type);
-                               putback (c);
-                               return type;
-                       } else
-                               is_real = true;
-
-                       if (is_real)
-                               return adjust_real (type);
-
-                       Console.WriteLine ("This should not be reached");
-                       throw new Exception ("Is Number should never reach this point");
-               }
+                               val = System.Int64.Parse(number.ToString());
+                               return integer_type_suffix(c);
+                       }
                        
-               int escape (int c)
-               {
-                       return peekChar ();
+                       return adjust_real (type);
                }
-
+                       
                int getChar ()
                {
                        if (putback_char != -1){
@@ -687,14 +784,23 @@ namespace Mono.MonoBASIC
 
+               //
+               // Tells whether currentChar ends a line: CR (a directly following LF is
+               // consumed along with it), LF, U+2028, U+2029 or end of input (-1).
+               // When it does, nextLine () is called before returning, so a successful
+               // test has the side effect of updating the line bookkeeping.
+               //
                private bool IsEOL(int currentChar)
                {
-                       if (currentChar ==  0x0D)
-                       {
+                       bool at_line_end = true;
+
+                       if (currentChar ==  0x0D) {
                                if (peekChar() ==  0x0A) // if it is a CR-LF pair consume LF also
                                        getChar();
 
-                               return true;
+                       } else if (currentChar != -1 && currentChar != 0x0A &&
+                                  currentChar != 0x2028 && currentChar != 0x2029) {
+                               at_line_end = false;
                        }
-                       return (currentChar ==  -1 || currentChar ==  0x0A || currentChar ==  0x2028 || currentChar ==  0x2029);
+
+                       if (!at_line_end)
+                               return false;
+
+                       nextLine ();
+                       return true;
                }
 
                private int DropComments()              
@@ -702,9 +808,6 @@ namespace Mono.MonoBASIC
                        int d;
                        while (!IsEOL(d = getChar ()))
                                col++;
-                       line++;
-                       ref_line++;
-                       col = 0;
 
                        return Token.EOL;
                }       
@@ -735,7 +838,7 @@ namespace Mono.MonoBASIC
 
                private string GetIdentifier(int c)
                {
-                       System.Text.StringBuilder id = new System.Text.StringBuilder ();
+                       StringBuilder id = new StringBuilder ();
 
                        id.Append ((char) c);
                                
@@ -749,11 +852,34 @@ namespace Mono.MonoBASIC
                                else 
                                        break;
                        }
-
-                       return id.ToString ();
+                       
+                       cant_have_a_type_character = false;
+                       
+                       return id.ToString();
                }
 
+               //
+               // True for the ASCII double quote and for the Unicode left (U+201C) and
+               // right (U+201D) double quotation marks.
+               //
+               private bool is_doublequote(int currentChar)
+               {
+                       switch (currentChar){
+                       case '"':
+                       case 0x201C:
+                       case 0x201D:
+                               return true;
+                       default:
+                               return false;
+                       }
+               }
+               
+               //
+               // True for the blank characters that separate tokens: space, tab,
+               // vertical tab and no-break space (0xA0).
+               //
+               // Carriage return is deliberately not part of this set. It is a line
+               // terminator that IsEOL handles (swallowing the LF of a CR-LF pair), and
+               // xtoken tests for white space before it tests for end of line. Treating
+               // CR as a blank would hide it from IsEOL, so a source with bare-CR line
+               // ends would never produce an end of line.
+               //
+               private bool is_whitespace(int c)
+               {
+                       return (c == ' ' || c == '\t' || c == '\v' || c == 0xa0);
+               }
+               
                private bool tokens_seen = false;
+               
+               //
+               // Bookkeeping for a line break: advances both the physical (line) and the
+               // effective (ref_line) counters, puts the column back to zero and resets
+               // the per-line flags (no token seen yet, cant_have_a_type_character set).
+               //
+               private void nextLine()
+               {
+                       ++line;
+                       ++ref_line;
+                       col = 0;
+
+                       tokens_seen = false;
+                       cant_have_a_type_character = true;
+               }
 
                public int xtoken ()
                {
@@ -764,27 +890,32 @@ namespace Mono.MonoBASIC
                        val = null;
                        for (;(c = getChar ()) != -1; col++) {
                        
-                               // Handle line comments.
-                               if (c == '\'')
-                                       return Token.REM;
-                                       
                                // Handle line continuation character
                                if (c == '_') 
                                {
-                                       int d = getChar();
-                                       putback(d);
+                                       int d = peekChar();
                                        if (!is_identifier_part_character((char)d)) {
                                                while ((c = getChar ()) != -1 && !IsEOL(c)) {}
                                                c = getChar ();                 
                                        }               
                                }
+
+                               // white space
+                               if (is_whitespace(c)) {
+                                       // expand tabs for location
+                                       if (c == '\t')
+                                               col = (((col + ExpandedTabsSize) / ExpandedTabsSize) * ExpandedTabsSize) - 1;
+                                       cant_have_a_type_character = true;
+                                       continue;
+                               }
+                               
+                               // Handle line comments.
+                               if (c == '\'')
+                                       return Token.REM;                                       
+                               
                                // Handle EOL.
                                if (IsEOL(c))
                                {
-                                       line++;
-                                       ref_line++;
-                                       col = 0;
-                                       tokens_seen = false;
                                        if (current_token == Token.EOL) // if last token was also EOL keep skipping
                                                continue;
                                        return Token.EOL;
@@ -814,9 +945,16 @@ namespace Mono.MonoBASIC
                                        return Token.IDENTIFIER;
                                }
 
+                               // Treat string literals
+                               if (is_doublequote(c)) {
+                                       cant_have_a_type_character = true;
+                                       return ExtractStringOrCharLiteral(c);
+                               }
+                       
                                // handle numeric literals
                                if (c == '.')
                                {
+                                       cant_have_a_type_character = true;
                                        tokens_seen = true;
                                        if (Char.IsDigit ((char) peekChar ()))
                                                return is_number (c);
@@ -825,52 +963,17 @@ namespace Mono.MonoBASIC
                                
                                if (Char.IsDigit ((char) c))
                                {
+                                       cant_have_a_type_character = true;
                                        tokens_seen = true;
                                        return is_number (c);
                                }
 
-                               if (c == '#' && !tokens_seen)
-                               {
-                                       bool cont = true;
-                                       
-                               start_again:
-                                       
-                                       cont = handle_preprocessing_directive (cont);
+                               if ((t = is_punct ((char)c, ref doread)) != Token.ERROR) {
+                                       cant_have_a_type_character = true;
 
-                                       if (cont)
-                                       {
-                                               col = 0;
+                                       if (t == Token.NONE)
                                                continue;
-                                       }
-                                       col = 1;
-
-                                       bool skipping = false;
-                                       for (;(c = getChar ()) != -1; col++)
-                                       {
-                                               if (IsEOL(c))
-                                               {
-                                                       col = 0;
-                                                       line++;
-                                                       ref_line++;
-                                                       skipping = false;
-                                               } 
-                                               else if (c == ' ' || c == '\t' || c == '\v' || c == '\r' || c == 0xa0)
-                                                       continue;
-                                               else if (c != '#')
-                                               {
-                                                       skipping = true;
-                                                       continue;
-                                               }       
-                                               if (c == '#' && !skipping)
-                                                       goto start_again;
-                                       }
-                                       tokens_seen = false;
-                                       if (c == -1)
-                                               Report.Error (1027, Location, "#endif/#endregion expected");
-                                       continue;
-                               }
-                               
-                               if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){
+                                               
                                        if (doread){
                                                getChar ();
                                                col++;
@@ -879,42 +982,7 @@ namespace Mono.MonoBASIC
                                        return t;
                                }
                                
-                               // Treat string literals
-                               if (c == '"'){
-                                       System.Text.StringBuilder s = new System.Text.StringBuilder ();
-
-                                       tokens_seen = true;
-
-                                       while ((c = getChar ()) != -1){
-                                               if (c == '"'){
-                                                       if (peekChar() == '"')
-                                                               getChar();
-                                                       else {
-                                                               val = s.ToString ();
-                                                               return Token.LITERAL_STRING;
-                                                       }
-                                               }
-
-                                               if (IsEOL(c))
-                                                       return Token.ERROR;
-                                                       
-                                               s.Append ((char) c);
-                                       }
-                               }
-                       
-                               // expand tabs for location and ignore it as whitespace
-                               if (c == '\t')
-                               {
-                                       col = (((col + ExpandedTabsSize) / ExpandedTabsSize) * ExpandedTabsSize) - 1;
-                                       continue;
-                               }
-
-                               // white space
-                               if (c == ' ' || c == '\f' || c == '\v')
-                                       continue;
-
                                error_details = ((char)c).ToString ();
-                               
                                return Token.ERROR;
                        }
 
@@ -924,536 +992,101 @@ namespace Mono.MonoBASIC
                        return Token.EOF;
                }
 
-               public void cleanup ()
-               {
-/* borrowed from mcs - have to work it to have preprocessing in mbas
-
-                       if (ifstack != null && ifstack.Count >= 1) {
-                               int state = (int) ifstack.Pop ();
-                               if ((state & REGION) != 0)
-                                       Report.Error (1038, "#endregion directive expected");
-                               else 
-                                       Report.Error (1027, "#endif directive expected");
-                       }
-*/                             
-               }
-
-               public Tokenizer (System.IO.TextReader input, string fname, ArrayList defines)
-               {
-                       this.ref_name = fname;
-                       reader = input;
-                       putback_char = -1;
-                       
-                       Location.Push (fname);
-               }
-
-               static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();
-               
-               void get_cmd_arg (out string cmd, out string arg)
+               private int ExtractDateTimeLiteral()
                {
                        int c;
                        
-                       tokens_seen = false;
-                       arg = "";
-                       static_cmd_arg.Length = 0;
-                               
-                       while ((c = getChar ()) != -1 && (c != '\n') && (c != ' ') && (c != '\t') && (c != '\r')){
-                               static_cmd_arg.Append ((char) c);
-                       }
-
-                       cmd = static_cmd_arg.ToString ();
-
-                       if (c == '\n'){
-                               line++;
-                               ref_line++;
-                               return;
-                       } else if (c == '\r')
-                               col = 0;
-
-                       // skip over white space
-                       while ((c = getChar ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))
-                               ;
-
-                       if (c == '\n'){
-                               line++;
-                               ref_line++;
-                               return;
-                       } else if (c == '\r'){
-                               col = 0;
-                               return;
-                       }
-                       
-                       static_cmd_arg.Length = 0;
-                       static_cmd_arg.Append ((char) c);
-                       
-                       while ((c = getChar ()) != -1 && (c != '\n') && (c != '\r')){
-                               static_cmd_arg.Append ((char) c);
-                       }
-
-                       if (c == '\n'){
-                               line++;
-                               ref_line++;
-                       } else if (c == '\r')
-                               col = 0;
-                       arg = static_cmd_arg.ToString ().Trim ();
-                       
-                       if (cmd == "End" && arg == "Region") {
-                               cmd = "End Region";
-                               arg = "";       
-                       }
-                       if (cmd == "End" && arg == "If") {
-                               cmd = "End If";
-                               arg = "";       
-                       }                       
-                               
-               }
-
-               //
-               // Handles the #line directive
-               //
-               bool PreProcessLine (string arg)
-               {
-                       if (arg == "")
-                               return false;
-
-                       if (arg == "default"){
-                               ref_line = line;
-                               ref_name = file_name;
-                               Location.Push (ref_name);
-                               return true;
-                       }
-                       
-                       try {
-                               int pos;
-
-                               if ((pos = arg.IndexOf (' ')) != -1 && pos != 0){
-                                       ref_line = System.Int32.Parse (arg.Substring (0, pos));
-                                       pos++;
-                                       
-                                       char [] quotes = { '\"' };
-                                       
-                                       string name = arg.Substring (pos). Trim (quotes);
-                                       ref_name = name; // TODO: Synchronize with mcs: Location.LookupFile (name);
-                                       Location.Push (ref_name);
-                               } else {
-                                       ref_line = System.Int32.Parse (arg);
-                               }
-                       } catch {
-                               return false;
-                       }
-                       
-                       return true;
-               }
-
-               //
-               // Handles #define and #undef
-               //
-               void PreProcessDefinition (bool is_define, string arg)
-               {
-                       if (arg == "" || arg == "true" || arg == "false"){
-                               Report.Error (1001, Location, "Missing identifer to pre-processor directive");
-                               return;
-                       }
-
-                       char[] whitespace = { ' ', '\t' };
-                       if (arg.IndexOfAny (whitespace) != -1){
-                               Report.Error (1025, Location, "Single-line comment or end-of-line expected");
-                               return;
-                       }
-
-                       foreach (char c in arg){
-                               if (!Char.IsLetter (c) && (c != '_')){
-                                       Report.Error (1001, Location, "Identifier expected");
-                                       return;
+                       StringBuilder sb = new StringBuilder();
+                       for (;(c = getChar ()) != -1; col++)
+                       {
+                               if (c == '#') {
+                                       val = ParseDateLiteral(sb);
+                                       return Token.LITERAL_DATE;
                                }
+                               if (IsEOL(c)) {
+                                       break;
+                               } 
+                               if (c == '-')
+                                       c = '/';
+                               sb.Append((char)c);
                        }
-
-                       if (is_define){
-                               if (defines == null)
-                                       defines = new Hashtable ();
-                               define (arg);
-                       } else {
-                               if (defines == null)
-                                       return;
-                               if (defines.Contains (arg))
-                                       defines.Remove (arg);
-                       }
-               }
-
-               bool eval_val (string s)
-               {
-                       if (s == "true")
-                               return true;
-                       if (s == "false")
-                               return false;
-                       
-                       if (defines == null)
-                               return false;
-                       if (defines.Contains (s))
-                               return true;
-
-                       return false;
+                       return Token.ERROR;
                }
-
-               bool pp_primary (ref string s)
+               
+               private int ExtractStringOrCharLiteral(int c)
                {
-                       s = s.Trim ();
-                       int len = s.Length;
+                       StringBuilder s = new StringBuilder ();
 
-                       if (len > 0){
-                               char c = s [0];
-                               
-                               if (c == '('){
-                                       s = s.Substring (1);
-                                       bool val = pp_expr (ref s);
-                                       if (s.Length > 0 && s [0] == ')'){
-                                               s = s.Substring (1);
-                                               return val;
-                                       }
-                                       Error_InvalidDirective ();
-                                       return false;
-                               }
-                               
-                               if (is_identifier_start_character (c)){
-                                       int j = 1;
+                       tokens_seen = true;
 
-                                       while (j < len){
-                                               c = s [j];
-                                               
-                                               if (is_identifier_part_character (c)){
-                                                       j++;
-                                                       continue;
+                       while ((c = getChar ()) != -1){
+                               if (is_doublequote(c)){
+                                       if (is_doublequote(peekChar()))
+                                               getChar();
+                                       else {
+                                               //handle Char Literals
+                                               if (peekChar() == 'C' || peekChar() == 'c') {
+                                                       getChar();
+                                                       if (s.Length == 1) {
+                                                               val = s[0];
+                                                               return Token.LITERAL_CHARACTER;
+                                                       } else {
+                                                               val = "Incorrect length for a character literal";
+                                                               return Token.ERROR;
+                                                       }                                                       
+                                               } else {
+                                                       val = s.ToString ();
+                                                       return Token.LITERAL_STRING;
                                                }
-                                               bool v = eval_val (s.Substring (0, j));
-                                               s = s.Substring (j);
-                                               return v;
                                        }
-                                       bool vv = eval_val (s);
-                                       s = "";
-                                       return vv;
                                }
-                       }
-                       Error_InvalidDirective ();
-                       return false;
-               }
-               
-               bool pp_unary (ref string s)
-               {
-                       s = s.Trim ();
-                       int len = s.Length;
-
-                       if (len > 0){
-                               if (s [0] == '!'){
-                                       if (len > 1 && s [1] == '='){
-                                               Error_InvalidDirective ();
-                                               return false;
-                                       }
-                                       s = s.Substring (1);
-                                       return ! pp_primary (ref s);
-                               } else
-                                       return pp_primary (ref s);
-                       } else {
-                               Error_InvalidDirective ();
-                               return false;
-                       }
-               }
-               
-               bool pp_eq (ref string s)
-               {
-                       bool va = pp_unary (ref s);
-
-                       s = s.Trim ();
-                       int len = s.Length;
-                       if (len > 0){
-                               if (s [0] == '='){
-                                       if (len > 2 && s [1] == '='){
-                                               s = s.Substring (2);
-                                               return va == pp_unary (ref s);
-                                       } else {
-                                               Error_InvalidDirective ();
-                                               return false;
-                                       }
-                               } else if (s [0] == '!' && len > 1 && s [1] == '='){
-                                       s = s.Substring (2);
-
-                                       return va != pp_unary (ref s);
 
-                               } 
-                       }
-
-                       return va;
-                               
-               }
-               
-               bool pp_and (ref string s)
-               {
-                       bool va = pp_eq (ref s);
-
-                       s = s.Trim ();
-                       int len = s.Length;
-                       if (len > 0){
-                               if (s [0] == '&'){
-                                       if (len > 2 && s [1] == '&'){
-                                               s = s.Substring (2);
-                                               return (va & pp_eq (ref s));
-                                       } else {
-                                               Error_InvalidDirective ();
-                                               return false;
-                                       }
-                               } 
-                       }
-                       return va;
-               }
-               
-               //
-               // Evaluates an expression for `#if' or `#elif'
-               //
-               bool pp_expr (ref string s)
-               {
-                       bool va = pp_and (ref s);
-                       s = s.Trim ();
-                       int len = s.Length;
-                       if (len > 0){
-                               char c = s [0];
-                               
-                               if (c == '|'){
-                                       if (len > 2 && s [1] == '|'){
-                                               s = s.Substring (2);
-                                               return va | pp_expr (ref s);
-                                       } else {
-                                               Error_InvalidDirective ();
-                                               return false;
-                                       }
-                               } 
-                       }
+                               if (IsEOL(c)) {
+                                       return Token.ERROR;
+                               }
                        
-                       return va;
-               }
-
-               bool eval (string s)
-               {
-                       bool v = pp_expr (ref s);
-                       s = s.Trim ();
-                       if (s.Length != 0){
-                               Error_InvalidDirective ();
-                               return false;
+                               s.Append ((char) c);
                        }
-
-                       return v;
-               }
-               
-               void Error_InvalidDirective ()
-               {
-                       Report.Error (1517, Location, "Invalid pre-processor directive");
+                                       
+                       return Token.ERROR;
                }
 
-               void Error_UnexpectedDirective (string extra)
-               {
-                       Report.Error (
-                               1028, Location,
-                               "Unexpected processor directive (" + extra + ")");
-               }
+               static IFormatProvider enUSculture = new CultureInfo("en-US", true);
 
-               void Error_TokensSeen ()
+               private DateTime ParseDateLiteral(StringBuilder value)
                {
-                       Report.Error (
-                               1032, Location,
-                               "Cannot define or undefine pre-processor symbols after a token in the file");
+                       try
+                       {
+                               return DateTime.Parse(value.ToString(),
+                                                 enUSculture,
+                                                 DateTimeStyles.NoCurrentDateDefault | DateTimeStyles.AllowWhiteSpaces);
+                       }
+                       catch (FormatException ex)
+                       {
+                               //TODO: What is the correct error number and message?
+                               Report.Error (1, Location, string.Format("Invalid date literal '{0}'", value.ToString()) 
+                                       + Environment.NewLine + ex.ToString());
+                       }
+                       catch (Exception)
+                       {
+                               Report.Error (1, Location, "Error parsing date literal");       //TODO: What is the correct error number and message?
+                       }
+                       return new DateTime();
                }
-               
-               //
-               // if true, then the code continues processing the code
-               // if false, the code stays in a loop until another directive is
-               // reached.
-               //
-               bool handle_preprocessing_directive (bool caller_is_taking)
+               public void PositionCursorAtNextPreProcessorDirective()
                {
-                       char [] blank = { ' ', '\t' };
-                       string cmd, arg;
-                       bool region_directive = false;
-
-                       get_cmd_arg (out cmd, out arg);
-                       // Eat any trailing whitespaces and single-line comments
-                       if (arg.IndexOf ("//") != -1)
-                               arg = arg.Substring (0, arg.IndexOf ("//"));
-                       arg = arg.TrimEnd (' ', '\t');
-
-                       //
-                       // The first group of pre-processing instructions is always processed
-                       //
-                       switch (cmd){
-                       case "line":
-                               if (!PreProcessLine (arg))
-                                       Report.Error (
-                                               1576, Location,
-                                               "Argument to #line directive is missing or invalid");
-                               return true;
-
-                       case "Region":
-                               region_directive = true;
-                               arg = "true";
-                               goto case "If";
-
-                       case "End Region":
-                               region_directive = true;
-                               goto case "End If";
-                               
-                       case "If":
-                               if (arg == ""){
-                                       Error_InvalidDirective ();
-                                       return true;
-                               }
-                               bool taking = false;
-                               if (ifstack == null)
-                                       ifstack = new Stack ();
-
-                               if (ifstack.Count == 0){
-                                       taking = true;
-                               } else {
-                                       int state = (int) ifstack.Peek ();
-                                       if ((state & TAKING) != 0)
-                                               taking = true;
-                               }
-
-                               if (eval (arg) && taking){
-                                       int push = TAKING | TAKEN_BEFORE | PARENT_TAKING;
-                                       if (region_directive)
-                                               push |= REGION;
-                                       ifstack.Push (push);
-                                       return true;
-                               } else {
-                                       int push = (taking ? PARENT_TAKING : 0);
-                                       if (region_directive)
-                                               push |= REGION;
-                                       ifstack.Push (push);
-                                       return false;
-                               }
-                               
-                       case "End If":
-                               if (ifstack == null || ifstack.Count == 0){
-                                       Error_UnexpectedDirective ("no #if for this #endif");
-                                       return true;
-                               } else {
-                                       int pop = (int) ifstack.Pop ();
-                                       
-                                       if (region_directive && ((pop & REGION) == 0))
-                                               Report.Error (1027, Location, "#endif directive expected");
-                                       else if (!region_directive && ((pop & REGION) != 0))
-                                               Report.Error (1038, Location, "#endregion directive expected");
-                                       
-                                       if (ifstack.Count == 0)
-                                               return true;
-                                       else {
-                                               int state = (int) ifstack.Peek ();
-
-                                               if ((state & TAKING) != 0)
-                                                       return true;
-                                               else
-                                                       return false;
-                                       }
-                               }
-
-                       case "ElseIf":
-                               if (ifstack == null || ifstack.Count == 0){
-                                       Error_UnexpectedDirective ("no #if for this #elif");
-                                       return true;
-                               } else {
-                                       int state = (int) ifstack.Peek ();
-
-                                       if ((state & REGION) != 0) {
-                                               Report.Error (1038, Location, "#endregion directive expected");
-                                               return true;
-                                       }
-
-                                       if ((state & ELSE_SEEN) != 0){
-                                               Error_UnexpectedDirective ("#elif not valid after #else");
-                                               return true;
-                                       }
-
-                                       if ((state & (TAKEN_BEFORE | TAKING)) != 0)
-                                               return false;
-
-                                       if (eval (arg) && ((state & PARENT_TAKING) != 0)){
-                                               state = (int) ifstack.Pop ();
-                                               ifstack.Push (state | TAKING | TAKEN_BEFORE);
-                                               return true;
-                                       } else 
-                                               return false;
-                               }
-
-                       case "Else":
-                               if (ifstack == null || ifstack.Count == 0){
-                                       Report.Error (
-                                               1028, Location,
-                                               "Unexpected processor directive (no #if for this #else)");
-                                       return true;
-                               } else {
-                                       int state = (int) ifstack.Peek ();
-
-                                       if ((state & REGION) != 0) {
-                                               Report.Error (1038, Location, "#endregion directive expected");
-                                               return true;
-                                       }
-
-                                       if ((state & ELSE_SEEN) != 0){
-                                               Error_UnexpectedDirective ("#else within #else");
-                                               return true;
-                                       }
-
-                                       ifstack.Pop ();
-
-                                       bool ret;
-                                       if ((state & TAKEN_BEFORE) == 0){
-                                               ret = ((state & PARENT_TAKING) != 0);
-                                       } else
-                                               ret = false;
-                                       
-                                       if (ret)
-                                               state |= TAKING;
-                                       else
-                                               state &= ~TAKING;
-                                       
-                                       ifstack.Push (state | ELSE_SEEN);
-                                       
-                                       return ret;
-                               }
-                       }
+                       int t;
+                       
+                       for(t = token(); t != Token.HASH && t != Token.EOF; t = token());
 
-                       //
-                       // These are only processed if we are in a `taking' block
-                       //
-                       if (!caller_is_taking)
-                               return false;
-                                       
-                       switch (cmd){
-                       case "define":
-                               /* if (any_token_seen){
-                                       Error_TokensSeen ();
-                                       return true;
-                               } */
-                               PreProcessDefinition (true, arg);
-                               return true;
-
-                       case "undef":
-                               /* if (any_token_seen){
-                                       Error_TokensSeen ();
-                                       return true;
-                               } */
-                               PreProcessDefinition (false, arg);
-                               return true;
-
-                       case "error":
-                               Report.Error (1029, Location, "#error: '" + arg + "'");
-                               return true;
-
-                       case "warning":
-                               Report.Warning (1030, Location, "#warning: '" + arg + "'");
-                               return true;
+                       if(t == Token.EOF)
+                               throw new ApplicationException("Unexpected EOF while looking for a pre-processor directive");
+                       
+                       if(t == Token.HASH) {
+                               tokens_seen = false;
+                               putback('#');
                        }
-
-                       Report.Error (1024, Location, "Preprocessor directive expected (got: " + cmd + ")");
-                       return true;
-
                }
 
        }