// This also implements the preprocessor
//
// Author: Miguel de Icaza (miguel@gnu.org)
-// Marek Safar (marek.safar@seznam.cz)
+// Marek Safar (marek.safar@gmail.com)
//
-// Licensed under the terms of the GNU GPL
-//
-// (C) 2001, 2002 Ximian, Inc (http://www.ximian.com)
-// (C) 2004 Novell, Inc
+// Dual licensed under the terms of the MIT X11 or GNU GPL
//
+// Copyright 2001, 2002 Ximian, Inc (http://www.ximian.com)
+// Copyright 2004-2008 Novell, Inc
+// Copyright 2011 Xamarin, Inc (http://www.xamarin.com)
//
using System;
using System.Text;
-using System.Collections;
-using System.IO;
+using System.Collections.Generic;
using System.Globalization;
-using System.Reflection;
+using System.Diagnostics;
namespace Mono.CSharp
{
public class Tokenizer : yyParser.yyInput
{
+ //
+ // A keyword table entry: the keyword characters, the token associated
+ // with them and a link to the next entry kept in the same table slot
+ //
+ class KeywordEntry<T>
+ {
+ // Token value associated with the keyword
+ public readonly T Token;
+ // Next entry sharing the same table slot, null for the last one
+ public KeywordEntry<T> Next;
+ // Keyword characters
+ public readonly char[] Value;
+
+ // Stores the characters of value together with its token
+ public KeywordEntry (string value, T token)
+ {
+ this.Value = value.ToCharArray ();
+ this.Token = token;
+ }
+ }
+
+ //
+ // Compares character buffers by their first `length' characters only.
+ // Neither method checks the array sizes, so every array passed in has
+ // to hold at least `length' characters
+ //
+ sealed class IdentifiersComparer : IEqualityComparer<char[]>
+ {
+ // Number of leading characters taken into account
+ readonly int length;
+
+ public IdentifiersComparer (int length)
+ {
+ this.length = length;
+ }
+
+ // True when the first `length' characters of x and y are the same
+ public bool Equals (char[] x, char[] y)
+ {
+ for (int i = 0; i < length; ++i)
+ if (x [i] != y [i])
+ return false;
+
+ return true;
+ }
+
+ // Hash over the first `length' characters; (h << 5) - h is h * 31
+ public int GetHashCode (char[] obj)
+ {
+ int h = 0;
+ for (int i = 0; i < length; ++i)
+ h = (h << 5) - h + obj [i];
+
+ return h;
+ }
+ }
+
+ //
+ // This class must be used by the parser only because it reuses token
+ // details after each parse
+ //
+ public class LocatedToken
+ {
+ // Position of the token and its optional text
+ int row, column;
+ string value;
+
+ // Shared pool of reusable instances and the index of the next slot to hand out
+ static LocatedToken[] buffer;
+ static int pos;
+
+ // Instances are obtained through the Create methods only
+ private LocatedToken ()
+ {
+ }
+
+ // Creates a token without a value at the given position
+ public static LocatedToken Create (int row, int column)
+ {
+ return Create (null, row, column);
+ }
+
+ // Creates a token with the given value at the row and column of loc
+ public static LocatedToken Create (string value, Location loc)
+ {
+ return Create (value, loc.Row, loc.Column);
+ }
+
+ //
+ // Returns an entry filled with the given details. While the pool has
+ // slots left the entry is taken from the pool (allocated on first use),
+ // otherwise a fresh instance is allocated and not stored. The pool is
+ // dereferenced without a null check, so Initialize has to be called
+ // before the first Create
+ //
+ public static LocatedToken Create (string value, int row, int column)
+ {
+ //
+ // TODO: I am not very happy about the logic but it's the best
+ // I could come up with for now.
+ // Ideally we should be using just a tiny buffer (256 elements) which
+ // is enough to hold all details for the current stack and recycle elements
+ // popped from the stack but there is a trick needed to recycle
+ // them properly.
+ //
+ LocatedToken entry;
+ if (pos >= buffer.Length) {
+ entry = new LocatedToken ();
+ } else {
+ entry = buffer [pos];
+ if (entry == null) {
+ entry = new LocatedToken ();
+ buffer [pos] = entry;
+ }
+
+ ++pos;
+ }
+ entry.value = value;
+ entry.row = row;
+ entry.column = column;
+ return entry;
+ }
+
+ //
+ // Used for token not required by expression evaluator
+ // Because of the Conditional attribute, calls are compiled only when
+ // the FULL_AST symbol is defined
+ //
+ [Conditional ("FULL_AST")]
+ public static void CreateOptional (int row, int col, ref object token)
+ {
+ token = Create (row, col);
+ }
+
+ //
+ // Allocates the pool (10000 slots) on the first call and rewinds it, so
+ // entries handed out earlier are overwritten by later Create calls
+ //
+ public static void Initialize ()
+ {
+ if (buffer == null)
+ buffer = new LocatedToken [10000];
+ pos = 0;
+ }
+
+ // Location built from the stored row and column
+ public Location Location {
+ get { return new Location (row, column); }
+ }
+
+ // Token text, null when the token was created without a value
+ public string Value {
+ get { return value; }
+ }
+ }
+
+ //
+ // Preprocessor directives. The low bits hold the directive number, the
+ // CustomArgumentsParsing and RequiresArgument bits are flags combined
+ // into the values of the directives which declare them
+ //
+ public enum PreprocessorDirective
+ {
+ Invalid = 0,
+
+ Region = 1,
+ Endregion = 2,
+ If = 3 | RequiresArgument,
+ Endif = 4,
+ Elif = 5 | RequiresArgument,
+ Else = 6,
+ Define = 7 | RequiresArgument,
+ Undef = 8 | RequiresArgument,
+ Error = 9,
+ Warning = 10,
+ Pragma = 11 | CustomArgumentsParsing,
+ Line = 12,
+
+ // Flag bits, placed above the directive numbers
+ CustomArgumentsParsing = 1 << 10,
+ RequiresArgument = 1 << 11
+ }
+
SeekableStreamReader reader;
SourceFile ref_name;
- SourceFile file_name;
+ CompilationSourceFile file_name;
+ CompilerContext context;
+ bool hidden = false;
int ref_line = 1;
int line = 1;
int col = 0;
int previous_col;
int current_token;
+ int tab_size;
bool handle_get_set = false;
bool handle_remove_add = false;
- bool handle_assembly = false;
bool handle_where = false;
bool handle_typeof = false;
bool lambda_arguments_parsing;
- Location current_location;
- Location current_comment_location = Location.Null;
- ArrayList escaped_identifiers = new ArrayList ();
+ List<Location> escaped_identifiers;
+ int parsing_generic_less_than;
+ readonly bool doc_processing;
+
+ //
+ // Used mainly for parser optimizations. Some expressions, for instance,
+ // can appear only in block scope (including initializer and base
+ // initializer)
+ //
public int parsing_block;
-
-#if GMCS_SOURCE
- bool query_parsing;
-#endif
+ internal bool query_parsing;
- static bool IsLinqEnabled {
- get {
- return RootContext.Version == LanguageVersion.LINQ;
- }
- }
+ //
+ // When parsing type only, useful for ambiguous nullable types
+ //
+ public int parsing_type;
+
+ //
+ // Set when parsing generic declaration (type or method header)
+ //
+ public bool parsing_generic_declaration;
+ public bool parsing_generic_declaration_doc;
+
+ //
+ // The value indicates that we have not reached any declaration or
+ // namespace yet
+ //
+ public int parsing_declaration;
+ public bool parsing_attribute_section;
+
+ public bool parsing_modifiers;
+
+ //
+ // The special characters to inject on streams to run the unit parser
+ // in the special expression mode. Using private characters from
+ // Plane Sixteen (U+100000 to U+10FFFD)
+ //
+ // These characters are only tested just before the tokenizer is about to
+ // report an error, so in the regular operation mode this addition has no
+ // impact on the tokenizer's performance.
+ //
+
+ public const int EvalStatementParserCharacter = 0x100000;
+ public const int EvalCompilationUnitParserCharacter = 0x100001;
+ public const int EvalUsingDeclarationsParserCharacter = 0x100002;
+ public const int DocumentationXref = 0x100003;
+
//
// XML documentation buffer. The save point is used to divide
// comments on types and comments on members.
//
bool tokens_seen = false;
+ //
+ // Set to true once the GENERATE_COMPLETION token has been
+ // returned. This helps produce one GENERATE_COMPLETION,
+ // as many COMPLETE_COMPLETION as necessary to complete the
+ // AST tree and one final EOF.
+ //
+ bool generated;
+
//
// Whether a token has been seen on the file
// This is needed because `define' is not allowed to be used
// after a token has been seen.
//
- bool any_token_seen = false;
-
- static Hashtable token_values;
- static readonly char[] simple_whitespaces = new char[] { ' ', '\t' };
-
- private static Hashtable TokenValueName
- {
- get {
- if (token_values == null)
- token_values = GetTokenValueNameHash ();
-
- return token_values;
- }
- }
+ bool any_token_seen;
- private static Hashtable GetTokenValueNameHash ()
- {
- Type t = typeof (Token);
- FieldInfo [] fields = t.GetFields ();
- Hashtable hash = new Hashtable ();
- foreach (FieldInfo field in fields) {
- if (field.IsLiteral && field.IsStatic && field.FieldType == typeof (int))
- hash.Add (field.GetValue (null), field.Name);
- }
- return hash;
- }
-
//
- // Returns a verbose representation of the current location
- //
- public string location {
- get {
- string det;
-
- if (current_token == Token.ERROR)
- det = "detail: " + error_details;
- else
- det = "";
-
- // return "Line: "+line+" Col: "+col + "\n" +
- // "VirtLine: "+ref_line +
- // " Token: "+current_token + " " + det;
- string current_token_name = TokenValueName [current_token] as string;
- if (current_token_name == null)
- current_token_name = current_token.ToString ();
+ // Class variables
+ //
+ static readonly KeywordEntry<int>[][] keywords;
+ static readonly KeywordEntry<PreprocessorDirective>[][] keywords_preprocessor;
+ static readonly Dictionary<string, object> keyword_strings; // TODO: HashSet
+ static readonly NumberStyles styles;
+ static readonly NumberFormatInfo csharp_format_info;
+
+ // Pragma arguments
+ static readonly char[] pragma_warning = "warning".ToCharArray ();
+ static readonly char[] pragma_warning_disable = "disable".ToCharArray ();
+ static readonly char[] pragma_warning_restore = "restore".ToCharArray ();
+ static readonly char[] pragma_checksum = "checksum".ToCharArray ();
- return String.Format ("{0} ({1},{2}), Token: {3} {4}", ref_name.Name,
- ref_line,
- col,
- current_token_name,
- det);
- }
- }
+ static readonly char[] simple_whitespaces = new char[] { ' ', '\t' };
public bool PropertyParsing {
get { return handle_get_set; }
set { handle_get_set = value; }
- }
-
- public bool AssemblyTargetParsing {
- get { return handle_assembly; }
- set { handle_assembly = value; }
}
public bool EventParsing {
get { return handle_typeof; }
set { handle_typeof = value; }
}
+
+ // Gets or sets the tab width kept in tab_size
+ public int TabSize {
+ get { return tab_size; }
+ set { tab_size = value; }
+ }
public XmlCommentState doc_state {
get { return xml_doc_state; }
}
}
- public bool IsEscapedIdentifier (Location loc)
+ //
+ // This is used to trigger completion generation on the parser
+ public bool CompleteOnEOF;
+
+ void AddEscapedIdentifier (Location loc)
{
- foreach (LocatedToken lt in escaped_identifiers)
- if (lt.Location.Equals (loc))
- return true;
- return false;
+ if (escaped_identifiers == null)
+ escaped_identifiers = new List<Location> ();
+
+ escaped_identifiers.Add (loc);
+ }
+
+ public bool IsEscapedIdentifier (ATypeNameExpression name)
+ {
+ return escaped_identifiers != null && escaped_identifiers.Contains (name.Location);
}
- //
- // Class variables
- //
- static CharArrayHashtable[] keywords;
- static Hashtable keyword_strings;
- static NumberStyles styles;
- static NumberFormatInfo csharp_format_info;
-
//
// Values for the associated token returned
//
- int putback_char;
- Object val;
+ internal int putback_char; // Used by repl only
+ object val;
//
// Pre-processor
//
- Hashtable defines;
-
const int TAKING = 1;
const int ELSE_SEEN = 4;
const int PARENT_TAKING = 8;
//
// pre-processor if stack state:
//
- Stack ifstack;
+ Stack<int> ifstack;
static System.Text.StringBuilder string_builder;
const int max_id_size = 512;
- static char [] id_builder = new char [max_id_size];
+ static readonly char [] id_builder = new char [max_id_size];
- static CharArrayHashtable [] identifiers = new CharArrayHashtable [max_id_size + 1];
+ public static Dictionary<char[], string>[] identifiers = new Dictionary<char[], string>[max_id_size + 1];
const int max_number_size = 512;
static char [] number_builder = new char [max_number_size];
static int number_pos;
-
- //
- // Details about the error encoutered by the tokenizer
- //
- string error_details;
-
- public string error {
- get {
- return error_details;
- }
- }
-
+
+ static char[] value_builder = new char[256];
+
public int Line {
get {
return ref_line;
}
}
- public int Col {
- get {
- return col;
- }
- }
-
//
// This is used when the tokenizer needs to save
// the current position as it needs to do some parsing
// on its own to deamiguate a token in behalf of the
// parser.
//
- Stack position_stack = new Stack (2);
+ Stack<Position> position_stack = new Stack<Position> (2);
+
class Position {
public int position;
+ public int line;
public int ref_line;
public int col;
+ public bool hidden;
public int putback_char;
public int previous_col;
- public Stack ifstack;
+ public Stack<int> ifstack;
public int parsing_generic_less_than;
public int current_token;
+ public object val;
public Position (Tokenizer t)
{
position = t.reader.Position;
+ line = t.line;
ref_line = t.ref_line;
col = t.col;
+ hidden = t.hidden;
putback_char = t.putback_char;
previous_col = t.previous_col;
- if (t.ifstack != null && t.ifstack.Count != 0)
- ifstack = (Stack)t.ifstack.Clone ();
+ if (t.ifstack != null && t.ifstack.Count != 0) {
+ // There is no simple way to clone Stack<T>; all
+ // methods reverse the order
+ var clone = t.ifstack.ToArray ();
+ Array.Reverse (clone);
+ ifstack = new Stack<int> (clone);
+ }
parsing_generic_less_than = t.parsing_generic_less_than;
current_token = t.current_token;
+ val = t.val;
}
}
+
+ //
+ // Creates a tokenizer reading from input. The file is used both as the
+ // referenced name (ref_name) and as the actual file name (file_name)
+ //
+ public Tokenizer (SeekableStreamReader input, CompilationSourceFile file, CompilerContext ctx)
+ {
+ this.ref_name = file;
+ this.file_name = file;
+ this.context = ctx;
+ reader = input;
+
+ // -1 means there is no character put back
+ putback_char = -1;
+
+ xml_comment_buffer = new StringBuilder ();
+ // Documentation processing is on when a documentation file is set
+ doc_processing = ctx.Settings.DocumentationFile != null;
+
+ // Default tab width: 4 on Windows NT, 8 on other platforms
+ if (Environment.OSVersion.Platform == PlatformID.Win32NT)
+ tab_size = 4;
+ else
+ tab_size = 8;
+
+ // NOTE(review): presumably makes file the current file for locations
+ // created afterwards - confirm against Location.Push
+ Mono.CSharp.Location.Push (file, file);
+ }
public void PushPosition ()
{
public void PopPosition ()
{
- Position p = (Position) position_stack.Pop ();
+ Position p = position_stack.Pop ();
reader.Position = p.position;
ref_line = p.ref_line;
+ line = p.line;
col = p.col;
+ hidden = p.hidden;
putback_char = p.putback_char;
previous_col = p.previous_col;
ifstack = p.ifstack;
parsing_generic_less_than = p.parsing_generic_less_than;
current_token = p.current_token;
+ val = p.val;
}
// Do not reset the position, ignore it.
static void AddKeyword (string kw, int token)
{
- keyword_strings.Add (kw, kw);
- if (keywords [kw.Length] == null) {
- keywords [kw.Length] = new CharArrayHashtable (kw.Length);
+ keyword_strings.Add (kw, null);
+
+ AddKeyword (keywords, kw, token);
+ }
+
+ // Registers a preprocessor directive name in the keywords_preprocessor table
+ static void AddPreprocessorKeyword (string kw, PreprocessorDirective directive)
+ {
+ AddKeyword (keywords_preprocessor, kw, directive);
+ }
+
+ static void AddKeyword<T> (KeywordEntry<T>[][] keywords, string kw, T token)
+ {
+ int length = kw.Length;
+ if (keywords[length] == null) {
+ keywords[length] = new KeywordEntry<T>['z' - '_' + 1];
+ }
+
+ int char_index = kw[0] - '_';
+ var kwe = keywords[length][char_index];
+ if (kwe == null) {
+ keywords[length][char_index] = new KeywordEntry<T> (kw, token);
+ return;
+ }
+
+ while (kwe.Next != null) {
+ kwe = kwe.Next;
}
- keywords [kw.Length] [kw.ToCharArray ()] = token;
+
+ kwe.Next = new KeywordEntry<T> (kw, token);
}
- static void InitTokens ()
+ //
+ // Class initializer
+ //
+ static Tokenizer ()
{
- keyword_strings = new Hashtable ();
- keywords = new CharArrayHashtable [64];
+ keyword_strings = new Dictionary<string, object> ();
+
+ // Indexed by keyword length; 11 slots cover keywords up to 10 characters, the longest for now
+ keywords = new KeywordEntry<int>[11][];
AddKeyword ("__arglist", Token.ARGLIST);
+ AddKeyword ("__makeref", Token.MAKEREF);
+ AddKeyword ("__reftype", Token.REFTYPE);
+ AddKeyword ("__refvalue", Token.REFVALUE);
AddKeyword ("abstract", Token.ABSTRACT);
AddKeyword ("as", Token.AS);
AddKeyword ("add", Token.ADD);
- AddKeyword ("assembly", Token.ASSEMBLY);
AddKeyword ("base", Token.BASE);
AddKeyword ("bool", Token.BOOL);
AddKeyword ("break", Token.BREAK);
AddKeyword ("volatile", Token.VOLATILE);
AddKeyword ("while", Token.WHILE);
AddKeyword ("partial", Token.PARTIAL);
-#if GMCS_SOURCE
AddKeyword ("where", Token.WHERE);
-#endif
- }
-#if GMCS_SOURCE
- public static void InitializeLinqKeywords ()
- {
+ // LINQ keywords
AddKeyword ("from", Token.FROM);
AddKeyword ("join", Token.JOIN);
AddKeyword ("on", Token.ON);
AddKeyword ("ascending", Token.ASCENDING);
AddKeyword ("descending", Token.DESCENDING);
AddKeyword ("into", Token.INTO);
- }
-#endif
- //
- // Class initializer
- //
- static Tokenizer ()
- {
- Reset ();
- }
+ // Contextual async keywords
+ AddKeyword ("async", Token.ASYNC);
+ AddKeyword ("await", Token.AWAIT);
+
+ keywords_preprocessor = new KeywordEntry<PreprocessorDirective>[10][];
+
+ AddPreprocessorKeyword ("region", PreprocessorDirective.Region);
+ AddPreprocessorKeyword ("endregion", PreprocessorDirective.Endregion);
+ AddPreprocessorKeyword ("if", PreprocessorDirective.If);
+ AddPreprocessorKeyword ("endif", PreprocessorDirective.Endif);
+ AddPreprocessorKeyword ("elif", PreprocessorDirective.Elif);
+ AddPreprocessorKeyword ("else", PreprocessorDirective.Else);
+ AddPreprocessorKeyword ("define", PreprocessorDirective.Define);
+ AddPreprocessorKeyword ("undef", PreprocessorDirective.Undef);
+ AddPreprocessorKeyword ("error", PreprocessorDirective.Error);
+ AddPreprocessorKeyword ("warning", PreprocessorDirective.Warning);
+ AddPreprocessorKeyword ("pragma", PreprocessorDirective.Pragma);
+ AddPreprocessorKeyword ("line", PreprocessorDirective.Line);
- public static void Reset ()
- {
- InitTokens ();
csharp_format_info = NumberFormatInfo.InvariantInfo;
styles = NumberStyles.Float;
int GetKeyword (char[] id, int id_len)
{
- /*
- * Keywords are stored in an array of hashtables grouped by their
- * length.
- */
-
- if ((id_len >= keywords.Length) || (keywords [id_len] == null))
+ //
+ // Keywords are stored in an array of arrays grouped by their
+ // length and then by the first character
+ //
+ if (id_len >= keywords.Length || keywords [id_len] == null)
return -1;
- object o = keywords [id_len] [id];
- if (o == null)
+ int first_index = id [0] - '_';
+ if (first_index > 'z' - '_')
return -1;
-
- int res = (int) o;
- if (!handle_get_set && (res == Token.GET || res == Token.SET))
- return -1;
- if (!handle_remove_add && (res == Token.REMOVE || res == Token.ADD))
+ var kwe = keywords [id_len] [first_index];
+ if (kwe == null)
return -1;
- if (!handle_assembly && res == Token.ASSEMBLY)
+
+ int res;
+ do {
+ res = kwe.Token;
+ for (int i = 1; i < id_len; ++i) {
+ if (id [i] != kwe.Value [i]) {
+ res = 0;
+ kwe = kwe.Next;
+ break;
+ }
+ }
+ } while (res == 0 && kwe != null);
+
+ if (res == 0)
return -1;
-#if GMCS_SOURCE
- if (IsLinqEnabled) {
+
+ int next_token;
+ switch (res) {
+ case Token.GET:
+ case Token.SET:
+ if (!handle_get_set)
+ res = -1;
+ break;
+ case Token.REMOVE:
+ case Token.ADD:
+ if (!handle_remove_add)
+ res = -1;
+ break;
+ case Token.EXTERN:
+ if (parsing_declaration == 0)
+ res = Token.EXTERN_ALIAS;
+ break;
+ case Token.DEFAULT:
+ if (peek_token () == Token.COLON) {
+ token ();
+ res = Token.DEFAULT_COLON;
+ }
+ break;
+ case Token.WHERE:
+ if (!handle_where && !query_parsing)
+ res = -1;
+ break;
+ case Token.FROM:
//
// A query expression is any expression that starts with `from identifier'
// followed by any token except ; , =
//
- if (!query_parsing && res == Token.FROM) {
+ if (!query_parsing) {
+ if (lambda_arguments_parsing) {
+ res = -1;
+ break;
+ }
+
PushPosition ();
- switch (token ()) {
- case Token.IDENTIFIER:
- case Token.INT:
- case Token.BOOL:
- case Token.BYTE:
- case Token.CHAR:
- case Token.DECIMAL:
- case Token.FLOAT:
- case Token.LONG:
- case Token.OBJECT:
- case Token.STRING:
- case Token.UINT:
- case Token.ULONG:
- int next_token = token ();
- query_parsing = next_token != Token.SEMICOLON && next_token != Token.COMMA &&
- next_token != Token.EQUALS;
- break;
- case Token.VOID:
- Expression.Error_VoidInvalidInTheContext (Location);
- break;
+ // HACK: to disable generics micro-parser, because PushPosition does not
+ // store identifiers array
+ parsing_generic_less_than = 1;
+ switch (xtoken ()) {
+ case Token.IDENTIFIER:
+ case Token.INT:
+ case Token.BOOL:
+ case Token.BYTE:
+ case Token.CHAR:
+ case Token.DECIMAL:
+ case Token.FLOAT:
+ case Token.LONG:
+ case Token.OBJECT:
+ case Token.STRING:
+ case Token.UINT:
+ case Token.ULONG:
+ next_token = xtoken ();
+ if (next_token == Token.SEMICOLON || next_token == Token.COMMA || next_token == Token.EQUALS)
+ goto default;
+
+ res = Token.FROM_FIRST;
+ query_parsing = true;
+ if (context.Settings.Version <= LanguageVersion.ISO_2)
+ Report.FeatureIsNotAvailable (context, Location, "query expressions");
+ break;
+ case Token.VOID:
+ Expression.Error_VoidInvalidInTheContext (Location, Report);
+ break;
+ default:
+ PopPosition ();
+ // HACK: A token is not a keyword so we need to restore identifiers buffer
+ // which has been overwritten before we grabbed the identifier
+ id_builder [0] = 'f'; id_builder [1] = 'r'; id_builder [2] = 'o'; id_builder [3] = 'm';
+ return -1;
}
PopPosition ();
}
+ break;
+ case Token.JOIN:
+ case Token.ON:
+ case Token.EQUALS:
+ case Token.SELECT:
+ case Token.GROUP:
+ case Token.BY:
+ case Token.LET:
+ case Token.ORDERBY:
+ case Token.ASCENDING:
+ case Token.DESCENDING:
+ case Token.INTO:
+ if (!query_parsing)
+ res = -1;
+ break;
+
+ case Token.USING:
+ case Token.NAMESPACE:
+ // TODO: some explanation needed
+ check_incorrect_doc_comment ();
+ break;
+
+ case Token.PARTIAL:
+ if (parsing_block > 0) {
+ res = -1;
+ break;
+ }
- if (!query_parsing && res > Token.QUERY_FIRST_TOKEN && res < Token.QUERY_LAST_TOKEN)
- return -1;
+ // Save current position and parse next token.
+ PushPosition ();
- return res;
- }
+ next_token = token ();
+ bool ok = (next_token == Token.CLASS) ||
+ (next_token == Token.STRUCT) ||
+ (next_token == Token.INTERFACE) ||
+ (next_token == Token.VOID);
- if (!handle_where && res == Token.WHERE)
- return -1;
-#endif
- return res;
-
- }
+ PopPosition ();
- public Location Location {
- get { return current_location; }
- }
+ if (ok) {
+ if (next_token == Token.VOID) {
+ if (context.Settings.Version <= LanguageVersion.ISO_2)
+ Report.FeatureIsNotAvailable (context, Location, "partial methods");
+ } else if (context.Settings.Version == LanguageVersion.ISO_1)
+ Report.FeatureIsNotAvailable (context, Location, "partial types");
- void define (string def)
- {
- if (!RootContext.AllDefines.Contains (def)){
- RootContext.AllDefines [def] = true;
- }
- if (defines.Contains (def))
- return;
- defines [def] = true;
- }
-
- public Tokenizer (SeekableStreamReader input, SourceFile file, ArrayList defs)
- {
- this.ref_name = file;
- this.file_name = file;
- reader = input;
-
- putback_char = -1;
+ return res;
+ }
+
+ if (next_token < Token.LAST_KEYWORD) {
+ Report.Error (267, Location,
+ "The `partial' modifier can be used only immediately before `class', `struct', `interface', or `void' keyword");
+ return token ();
+ }
+
+ res = -1;
+ break;
+
+ case Token.ASYNC:
+ if (parsing_modifiers) {
+ //
+ // Skip attributes section or constructor called async
+ //
+ if (parsing_attribute_section || peek_token () == Token.OPEN_PARENS) {
+ res = -1;
+ } else {
+ // async is keyword
+ }
+ } else if (parsing_block > 0) {
+ switch (peek_token ()) {
+ case Token.DELEGATE:
+ case Token.OPEN_PARENS_LAMBDA:
+ // async is keyword
+ break;
+ case Token.IDENTIFIER:
+ PushPosition ();
+ xtoken ();
+ if (xtoken () != Token.ARROW)
+ res = -1;
+
+ PopPosition ();
+ break;
+ default:
+ res = -1;
+ break;
+ }
+ } else {
+ res = -1;
+ }
+
+ if (res == Token.ASYNC && context.Settings.Version <= LanguageVersion.V_4) {
+ Report.FeatureIsNotAvailable (context, Location, "asynchronous functions");
+ }
+
+ break;
- if (defs != null){
- defines = new Hashtable ();
- foreach (string def in defs)
- define (def);
+ case Token.AWAIT:
+ if (parsing_block == 0)
+ res = -1;
+
+ break;
}
- xml_comment_buffer = new StringBuilder ();
+ return res;
+ }
+
+ static PreprocessorDirective GetPreprocessorDirective (char[] id, int id_len)
+ {
//
- // FIXME: This could be `Location.Push' but we have to
- // find out why the MS compiler allows this
+ // Keywords are stored in an array of arrays grouped by their
+ // length and then by the first character
//
- Mono.CSharp.Location.Push (file);
+ if (id_len >= keywords_preprocessor.Length || keywords_preprocessor[id_len] == null)
+ return PreprocessorDirective.Invalid;
+
+ int first_index = id[0] - '_';
+ if (first_index > 'z' - '_')
+ return PreprocessorDirective.Invalid;
+
+ var kwe = keywords_preprocessor[id_len][first_index];
+ if (kwe == null)
+ return PreprocessorDirective.Invalid;
+
+ PreprocessorDirective res = PreprocessorDirective.Invalid;
+ do {
+ res = kwe.Token;
+ for (int i = 1; i < id_len; ++i) {
+ if (id[i] != kwe.Value[i]) {
+ res = 0;
+ kwe = kwe.Next;
+ break;
+ }
+ }
+ } while (res == PreprocessorDirective.Invalid && kwe != null);
+
+ return res;
}
- static bool is_identifier_start_character (char c)
+ //
+ // Current position made of ref_line and the current column; the column
+ // is reported as -1 while the hidden flag is set
+ //
+ public Location Location {
+ get {
+ return new Location (ref_line, hidden ? -1 : col);
+ }
+ }
+
+ static bool is_identifier_start_character (int c)
{
- return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || Char.IsLetter (c);
+ return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || Char.IsLetter ((char)c);
}
static bool is_identifier_part_character (char c)
{
- return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || (c >= '0' && c <= '9') ||
- Char.IsLetter (c) || Char.GetUnicodeCategory (c) == UnicodeCategory.ConnectorPunctuation;
+ if (c >= 'a' && c <= 'z')
+ return true;
+
+ if (c >= 'A' && c <= 'Z')
+ return true;
+
+ if (c == '_' || (c >= '0' && c <= '9'))
+ return true;
+
+ if (c < 0x80)
+ return false;
+
+ return Char.IsLetter (c) || Char.GetUnicodeCategory (c) == UnicodeCategory.ConnectorPunctuation;
}
public static bool IsKeyword (string s)
{
- return keyword_strings [s] != null;
+ return keyword_strings.ContainsKey (s);
}
//
- // Tests whether '(' is beggining of lambda parameters
- //
- bool IsLambdaOpenParens ()
+ // Open parens micro parser. Detects both lambda and cast ambiguity.
+ //
+ int TokenizeOpenParens ()
{
- int ntoken;
- while ((ntoken = xtoken ()) != Token.EOF) {
- switch (ntoken) {
- case Token.CLOSE_PARENS:
- return xtoken () == Token.ARROW;
+ int ptoken;
+ current_token = -1;
- case Token.STAR:
- case Token.SEMICOLON:
- case Token.OPEN_PARENS:
- return false;
+ int bracket_level = 0;
+ bool is_type = false;
+ bool can_be_type = false;
+
+ while (true) {
+ ptoken = current_token;
+ token ();
+
+ switch (current_token) {
+ case Token.CLOSE_PARENS:
+ token ();
+
+ //
+ // Expression inside parens is lambda, (int i) =>
+ //
+ if (current_token == Token.ARROW)
+ return Token.OPEN_PARENS_LAMBDA;
+
+ //
+ // Expression inside parens is single type, (int[])
+ //
+ if (is_type)
+ return Token.OPEN_PARENS_CAST;
+
+ //
+ // Expression is possible cast, look at next token, (T)null
+ //
+ if (can_be_type) {
+ switch (current_token) {
+ case Token.OPEN_PARENS:
+ case Token.BANG:
+ case Token.TILDE:
+ case Token.IDENTIFIER:
+ case Token.LITERAL:
+ case Token.BASE:
+ case Token.CHECKED:
+ case Token.DELEGATE:
+ case Token.FALSE:
+ case Token.FIXED:
+ case Token.NEW:
+ case Token.NULL:
+ case Token.SIZEOF:
+ case Token.THIS:
+ case Token.THROW:
+ case Token.TRUE:
+ case Token.TYPEOF:
+ case Token.UNCHECKED:
+ case Token.UNSAFE:
+ case Token.DEFAULT:
+
+ //
+ // These can be part of a member access
+ //
+ case Token.INT:
+ case Token.UINT:
+ case Token.SHORT:
+ case Token.USHORT:
+ case Token.LONG:
+ case Token.ULONG:
+ case Token.DOUBLE:
+ case Token.FLOAT:
+ case Token.CHAR:
+ case Token.BYTE:
+ case Token.DECIMAL:
+ case Token.BOOL:
+ return Token.OPEN_PARENS_CAST;
+ }
+ }
+ return Token.OPEN_PARENS;
+
+ case Token.DOT:
+ case Token.DOUBLE_COLON:
+ if (ptoken != Token.IDENTIFIER && ptoken != Token.OP_GENERICS_GT)
+ goto default;
+
+ continue;
+
+ case Token.IDENTIFIER:
+ switch (ptoken) {
+ case Token.DOT:
+ if (bracket_level == 0) {
+ is_type = false;
+ can_be_type = true;
+ }
+
+ continue;
+ case Token.OP_GENERICS_LT:
+ case Token.COMMA:
+ case Token.DOUBLE_COLON:
+ case -1:
+ if (bracket_level == 0)
+ can_be_type = true;
+ continue;
+ default:
+ can_be_type = is_type = false;
+ continue;
+ }
+
+ case Token.OBJECT:
+ case Token.STRING:
+ case Token.BOOL:
+ case Token.DECIMAL:
+ case Token.FLOAT:
+ case Token.DOUBLE:
+ case Token.SBYTE:
+ case Token.BYTE:
+ case Token.SHORT:
+ case Token.USHORT:
+ case Token.INT:
+ case Token.UINT:
+ case Token.LONG:
+ case Token.ULONG:
+ case Token.CHAR:
+ case Token.VOID:
+ if (bracket_level == 0)
+ is_type = true;
+ continue;
+
+ case Token.COMMA:
+ if (bracket_level == 0) {
+ bracket_level = 100;
+ can_be_type = is_type = false;
+ }
+ continue;
+
+ case Token.OP_GENERICS_LT:
+ case Token.OPEN_BRACKET:
+ if (bracket_level++ == 0)
+ is_type = true;
+ continue;
+
+ case Token.OP_GENERICS_GT:
+ case Token.CLOSE_BRACKET:
+ --bracket_level;
+ continue;
+
+ case Token.INTERR_NULLABLE:
+ case Token.STAR:
+ if (bracket_level == 0)
+ is_type = true;
+ continue;
+
+ case Token.REF:
+ case Token.OUT:
+ can_be_type = is_type = false;
+ continue;
+
+ default:
+ return Token.OPEN_PARENS;
}
}
-
- Error_TokenExpected (")");
- return false;
}
public static bool IsValidIdentifier (string s)
the_token = token ();
} while (the_token != Token.CLOSE_BRACKET);
the_token = token ();
+ } else if (the_token == Token.IN || the_token == Token.OUT) {
+ the_token = token ();
}
switch (the_token) {
case Token.IDENTIFIER:
case Token.CHAR:
case Token.VOID:
break;
+ case Token.OP_GENERICS_GT:
+ case Token.IN:
+ case Token.OUT:
+ return true;
default:
return false;
return true;
else if (the_token == Token.COMMA || the_token == Token.DOT || the_token == Token.DOUBLE_COLON)
goto start;
- else if (the_token == Token.INTERR || the_token == Token.STAR)
+ else if (the_token == Token.INTERR_NULLABLE || the_token == Token.STAR)
goto again;
else if (the_token == Token.OP_GENERICS_LT) {
if (!parse_less_than ())
return false;
}
-#if GMCS_SOURCE
- public void PutbackNullable ()
- {
- if (nullable_pos < 0)
- throw new Exception ();
-
- current_token = -1;
- val = null;
- reader.Position = nullable_pos;
-
- putback_char = '?';
- }
-
- public void PutbackCloseParens ()
- {
- putback_char = ')';
- }
-
-
- int nullable_pos = -1;
-
- public void CheckNullable (bool is_nullable)
- {
- if (is_nullable)
- nullable_pos = reader.Position;
- else
- nullable_pos = -1;
- }
-
- public bool QueryParsing {
- set {
- query_parsing = value;
- }
- }
-
bool parse_generic_dimension (out int dimension)
{
dimension = 1;
}
return false;
- }
-#endif
+ }
public int peek_token ()
{
return the_token;
}
- int parsing_generic_less_than = 0;
-
- int is_punct (char c, ref bool doread)
+ //
+ // Tokenizes `?' using custom disambiguation rules to return one
+ // of the following tokens: INTERR_NULLABLE, OP_COALESCING, INTERR
+ //
+ // A tricky expression looks like:
+ //
+ // Foo ? a = x ? b : c;
+ //
+ int TokenizePossibleNullableType ()
{
- int d;
- int t;
-
- doread = false;
-
- switch (c){
- case '{':
- val = Location;
- return Token.OPEN_BRACE;
- case '}':
- val = Location;
- return Token.CLOSE_BRACE;
- case '[':
- // To block doccomment inside attribute declaration.
- if (doc_state == XmlCommentState.Allowed)
- doc_state = XmlCommentState.NotAllowed;
- return Token.OPEN_BRACKET;
- case ']':
- return Token.CLOSE_BRACKET;
- case '(':
- if (IsLinqEnabled && !lambda_arguments_parsing) {
- lambda_arguments_parsing = true;
- PushPosition ();
- bool lambda_start = IsLambdaOpenParens ();
- PopPosition ();
- lambda_arguments_parsing = false;
- if (lambda_start)
- return Token.OPEN_PARENS_LAMBDA;
- }
- return Token.OPEN_PARENS;
- case ')': {
- if (deambiguate_close_parens == 0)
- return Token.CLOSE_PARENS;
-
- --deambiguate_close_parens;
-
- PushPosition ();
-
- int new_token = xtoken ();
-
- PopPosition ();
-
- if (new_token == Token.OPEN_PARENS)
- return Token.CLOSE_PARENS_OPEN_PARENS;
- else if (new_token == Token.MINUS)
- return Token.CLOSE_PARENS_MINUS;
- else if (IsCastToken (new_token))
- return Token.CLOSE_PARENS_CAST;
- else
- return Token.CLOSE_PARENS_NO_CAST;
- }
-
- case ',':
- return Token.COMMA;
- case ';':
- val = Location;
- return Token.SEMICOLON;
- case '~':
- val = Location;
- return Token.TILDE;
- case '?':
-#if GMCS_SOURCE
- d = peek_char ();
- if (d == '?') {
- get_char ();
- return Token.OP_COALESCING;
- }
-#endif
- return Token.INTERR;
- }
-#if GMCS_SOURCE
- if (c == '<') {
- if (parsing_generic_less_than++ > 0)
- return Token.OP_GENERICS_LT;
-
- if (handle_typeof) {
- int dimension;
- PushPosition ();
- if (parse_generic_dimension (out dimension)) {
- val = dimension;
- DiscardPosition ();
- return Token.GENERIC_DIMENSION;
- }
- PopPosition ();
- }
-
- // Save current position and parse next token.
- PushPosition ();
- bool is_generic_lt = parse_less_than ();
- PopPosition ();
-
- if (is_generic_lt) {
- return Token.OP_GENERICS_LT;
- } else
- parsing_generic_less_than = 0;
-
- d = peek_char ();
- if (d == '<'){
- get_char ();
- d = peek_char ();
-
- if (d == '='){
- doread = true;
- return Token.OP_SHIFT_LEFT_ASSIGN;
- }
- return Token.OP_SHIFT_LEFT;
- } else if (d == '='){
- doread = true;
- return Token.OP_LE;
- }
- return Token.OP_LT;
- } else if (c == '>') {
- if (parsing_generic_less_than > 0) {
- parsing_generic_less_than--;
- return Token.OP_GENERICS_GT;
- }
-
- d = peek_char ();
- if (d == '>'){
- get_char ();
- d = peek_char ();
-
- if (d == '='){
- doread = true;
- return Token.OP_SHIFT_RIGHT_ASSIGN;
- }
- return Token.OP_SHIFT_RIGHT;
- } else if (d == '='){
- doread = true;
- return Token.OP_GE;
- }
- return Token.OP_GT;
- }
-#endif
- d = peek_char ();
- if (c == '+'){
-
- if (d == '+') {
- val = Location;
- t = Token.OP_INC;
- }
- else if (d == '=')
- t = Token.OP_ADD_ASSIGN;
- else {
- val = Location;
- return Token.PLUS;
- }
- doread = true;
- return t;
- }
- if (c == '-'){
- if (d == '-') {
- val = Location;
- t = Token.OP_DEC;
- }
- else if (d == '=')
- t = Token.OP_SUB_ASSIGN;
- else if (d == '>')
- t = Token.OP_PTR;
- else {
- val = Location;
- return Token.MINUS;
- }
- doread = true;
- return t;
- }
+ if (parsing_block == 0 || parsing_type > 0)
+ return Token.INTERR_NULLABLE;
- if (c == '!'){
- if (d == '='){
- doread = true;
- return Token.OP_NE;
- }
- val = Location;
- return Token.BANG;
+ int d = peek_char ();
+ if (d == '?') {
+ get_char ();
+ return Token.OP_COALESCING;
}
- if (c == '='){
- if (d == '='){
- doread = true;
- return Token.OP_EQ;
- }
- if (d == '>'){
- doread = true;
- val = Location;
- return Token.ARROW;
- }
-
- return Token.ASSIGN;
- }
-
- if (c == '&'){
- if (d == '&'){
- doread = true;
- return Token.OP_AND;
- } else if (d == '='){
- doread = true;
- return Token.OP_AND_ASSIGN;
- }
- val = Location;
- return Token.BITWISE_AND;
- }
-
- if (c == '|'){
- if (d == '|'){
- doread = true;
- return Token.OP_OR;
- } else if (d == '='){
- doread = true;
- return Token.OP_OR_ASSIGN;
- }
- return Token.BITWISE_OR;
- }
-
- if (c == '*'){
- if (d == '='){
- doread = true;
- return Token.OP_MULT_ASSIGN;
- }
- val = Location;
- return Token.STAR;
- }
-
- if (c == '/'){
- if (d == '='){
- doread = true;
- return Token.OP_DIV_ASSIGN;
- }
- return Token.DIV;
- }
-
- if (c == '%'){
- if (d == '='){
- doread = true;
- return Token.OP_MOD_ASSIGN;
- }
- return Token.PERCENT;
+ switch (current_token) {
+ case Token.CLOSE_PARENS:
+ case Token.TRUE:
+ case Token.FALSE:
+ case Token.NULL:
+ case Token.LITERAL:
+ return Token.INTERR;
}
- if (c == '^'){
- if (d == '='){
- doread = true;
- return Token.OP_XOR_ASSIGN;
- }
- return Token.CARRET;
+ if (d != ' ') {
+ if (d == ',' || d == ';' || d == '>')
+ return Token.INTERR_NULLABLE;
+ if (d == '*' || (d >= '0' && d <= '9'))
+ return Token.INTERR;
}
-#if !GMCS_SOURCE
- if (c == '<'){
- if (d == '<'){
- get_char ();
- d = peek_char ();
-
- if (d == '='){
- doread = true;
- return Token.OP_SHIFT_LEFT_ASSIGN;
- }
- return Token.OP_SHIFT_LEFT;
- } else if (d == '='){
- doread = true;
- return Token.OP_LE;
- }
- return Token.OP_LT;
+ PushPosition ();
+ current_token = Token.NONE;
+ int next_token;
+ switch (xtoken ()) {
+ case Token.LITERAL:
+ case Token.TRUE:
+ case Token.FALSE:
+ case Token.NULL:
+ case Token.THIS:
+ case Token.NEW:
+ next_token = Token.INTERR;
+ break;
+
+ case Token.SEMICOLON:
+ case Token.COMMA:
+ case Token.CLOSE_PARENS:
+ case Token.OPEN_BRACKET:
+ case Token.OP_GENERICS_GT:
+ case Token.INTERR:
+ next_token = Token.INTERR_NULLABLE;
+ break;
+
+ default:
+ next_token = -1;
+ break;
}
- if (c == '>'){
- if (d == '>'){
- get_char ();
- d = peek_char ();
-
- if (d == '='){
- doread = true;
- return Token.OP_SHIFT_RIGHT_ASSIGN;
+ if (next_token == -1) {
+ switch (xtoken ()) {
+ case Token.COMMA:
+ case Token.SEMICOLON:
+ case Token.OPEN_BRACE:
+ case Token.CLOSE_PARENS:
+ case Token.IN:
+ next_token = Token.INTERR_NULLABLE;
+ break;
+
+ case Token.COLON:
+ next_token = Token.INTERR;
+ break;
+
+ default:
+ int ntoken;
+ int interrs = 1;
+ int colons = 0;
+ //
+ // All shortcuts failed, do it the hard way
+ //
+ while ((ntoken = xtoken ()) != Token.EOF) {
+ if (ntoken == Token.SEMICOLON)
+ break;
+
+ if (ntoken == Token.COLON) {
+ if (++colons == interrs)
+ break;
+ continue;
+ }
+
+ if (ntoken == Token.INTERR) {
+ ++interrs;
+ continue;
+ }
}
- return Token.OP_SHIFT_RIGHT;
- } else if (d == '='){
- doread = true;
- return Token.OP_GE;
- }
- return Token.OP_GT;
- }
-#endif
- if (c == ':'){
- if (d == ':'){
- doread = true;
- return Token.DOUBLE_COLON;
+
+ next_token = colons != interrs ? Token.INTERR_NULLABLE : Token.INTERR;
+ break;
}
- val = Location;
- return Token.COLON;
}
-
- return Token.ERROR;
- }
-
- int deambiguate_close_parens = 0;
-
- public void Deambiguate_CloseParens (object expression)
- {
- putback (')');
-
- // When any binary operation is used we are sure it is not a cast
- if (expression is Binary)
- return;
-
- deambiguate_close_parens++;
+
+ PopPosition ();
+ return next_token;
}
bool decimal_digits (int c)
{
return (e >= '0' && e <= '9') || (e >= 'A' && e <= 'F') || (e >= 'a' && e <= 'f');
}
-
- static int real_type_suffix (int c)
- {
- int t;
+ static TypeCode real_type_suffix (int c)
+ {
switch (c){
case 'F': case 'f':
- t = Token.LITERAL_FLOAT;
- break;
+ return TypeCode.Single;
case 'D': case 'd':
- t = Token.LITERAL_DOUBLE;
- break;
+ return TypeCode.Double;
case 'M': case 'm':
- t= Token.LITERAL_DECIMAL;
- break;
+ return TypeCode.Decimal;
default:
- return Token.NONE;
+ return TypeCode.Empty;
}
- return t;
}
- int integer_type_suffix (ulong ul, int c)
+ ILiteralConstant integer_type_suffix (ulong ul, int c, Location loc)
{
bool is_unsigned = false;
bool is_long = false;
//
Report.Warning (78, 4, Location, "The 'l' suffix is easily confused with the digit '1' (use 'L' for clarity)");
}
- //
- // This goto statement causes the MS CLR 2.0 beta 1 csc to report an error, so
- // work around that.
- //
- //goto case 'L';
- if (is_long)
- scanning = false;
- is_long = true;
- get_char ();
- break;
+
+ goto case 'L';
case 'L':
if (is_long)
}
if (is_long && is_unsigned){
- val = ul;
- return Token.LITERAL_INTEGER;
- } else if (is_unsigned){
+ return new ULongLiteral (context.BuiltinTypes, ul, loc);
+ }
+
+ if (is_unsigned){
// uint if possible, or ulong else.
if ((ul & 0xffffffff00000000) == 0)
- val = (uint) ul;
+ return new UIntLiteral (context.BuiltinTypes, (uint) ul, loc);
else
- val = ul;
+ return new ULongLiteral (context.BuiltinTypes, ul, loc);
} else if (is_long){
// long if possible, ulong otherwise
if ((ul & 0x8000000000000000) != 0)
- val = ul;
+ return new ULongLiteral (context.BuiltinTypes, ul, loc);
else
- val = (long) ul;
+ return new LongLiteral (context.BuiltinTypes, (long) ul, loc);
} else {
// int, uint, long or ulong in that order
if ((ul & 0xffffffff00000000) == 0){
uint ui = (uint) ul;
if ((ui & 0x80000000) != 0)
- val = ui;
+ return new UIntLiteral (context.BuiltinTypes, ui, loc);
else
- val = (int) ui;
+ return new IntLiteral (context.BuiltinTypes, (int) ui, loc);
} else {
if ((ul & 0x8000000000000000) != 0)
- val = ul;
+ return new ULongLiteral (context.BuiltinTypes, ul, loc);
else
- val = (long) ul;
+ return new LongLiteral (context.BuiltinTypes, (long) ul, loc);
}
}
- return Token.LITERAL_INTEGER;
}
//
// we need to convert to a special type, and then choose
// the best representation for the integer
//
- int adjust_int (int c)
+ ILiteralConstant adjust_int (int c, Location loc)
{
try {
if (number_pos > 9){
for (int i = 1; i < number_pos; i++){
ul = checked ((ul * 10) + ((uint)(number_builder [i] - '0')));
}
- return integer_type_suffix (ul, c);
+
+ return integer_type_suffix (ul, c, loc);
} else {
uint ui = (uint) (number_builder [0] - '0');
for (int i = 1; i < number_pos; i++){
ui = checked ((ui * 10) + ((uint)(number_builder [i] - '0')));
}
- return integer_type_suffix (ui, c);
+
+ return integer_type_suffix (ui, c, loc);
}
} catch (OverflowException) {
- error_details = "Integral constant is too large";
- Report.Error (1021, Location, error_details);
- val = 0ul;
- return Token.LITERAL_INTEGER;
+ Error_NumericConstantTooLong ();
+ return new IntLiteral (context.BuiltinTypes, 0, loc);
}
catch (FormatException) {
Report.Error (1013, Location, "Invalid number");
- val = 0ul;
- return Token.LITERAL_INTEGER;
+ return new IntLiteral (context.BuiltinTypes, 0, loc);
}
}
- int adjust_real (int t)
+ ILiteralConstant adjust_real (TypeCode t, Location loc)
{
- string s = new String (number_builder, 0, number_pos);
+ string s = new string (number_builder, 0, number_pos);
const string error_details = "Floating-point constant is outside the range of type `{0}'";
switch (t){
- case Token.LITERAL_DECIMAL:
+ case TypeCode.Decimal:
try {
- val = System.Decimal.Parse (s, styles, csharp_format_info);
+ return new DecimalLiteral (context.BuiltinTypes, decimal.Parse (s, styles, csharp_format_info), loc);
} catch (OverflowException) {
- val = 0m;
Report.Error (594, Location, error_details, "decimal");
+ return new DecimalLiteral (context.BuiltinTypes, 0, loc);
}
- break;
- case Token.LITERAL_FLOAT:
+ case TypeCode.Single:
try {
- val = float.Parse (s, styles, csharp_format_info);
+ return new FloatLiteral (context.BuiltinTypes, float.Parse (s, styles, csharp_format_info), loc);
} catch (OverflowException) {
- val = 0.0f;
Report.Error (594, Location, error_details, "float");
+ return new FloatLiteral (context.BuiltinTypes, 0, loc);
}
- break;
-
- case Token.LITERAL_DOUBLE:
- case Token.NONE:
- t = Token.LITERAL_DOUBLE;
+ default:
try {
- val = System.Double.Parse (s, styles, csharp_format_info);
+ return new DoubleLiteral (context.BuiltinTypes, double.Parse (s, styles, csharp_format_info), loc);
} catch (OverflowException) {
- val = 0.0;
- Report.Error (594, Location, error_details, "double");
+ Report.Error (594, loc, error_details, "double");
+ return new DoubleLiteral (context.BuiltinTypes, 0, loc);
}
- break;
}
- return t;
}
- int handle_hex ()
+ ILiteralConstant handle_hex (Location loc)
{
int d;
ulong ul;
}
string s = new String (number_builder, 0, number_pos);
+
try {
if (number_pos <= 8)
ul = System.UInt32.Parse (s, NumberStyles.HexNumber);
else
ul = System.UInt64.Parse (s, NumberStyles.HexNumber);
+
+ return integer_type_suffix (ul, peek_char (), loc);
} catch (OverflowException){
- error_details = "Integral constant is too large";
- Report.Error (1021, Location, error_details);
- val = 0ul;
- return Token.LITERAL_INTEGER;
+ Error_NumericConstantTooLong ();
+ return new IntLiteral (context.BuiltinTypes, 0, loc);
}
catch (FormatException) {
Report.Error (1013, Location, "Invalid number");
- val = 0ul;
- return Token.LITERAL_INTEGER;
+ return new IntLiteral (context.BuiltinTypes, 0, loc);
}
-
- return integer_type_suffix (ul, peek_char ());
}
//
//
int is_number (int c)
{
- bool is_real = false;
- int type;
+ ILiteralConstant res;
+#if FULL_AST
+ int read_start = reader.Position - 1;
+#endif
number_pos = 0;
+ var loc = Location;
if (c >= '0' && c <= '9'){
if (c == '0'){
int peek = peek_char ();
- if (peek == 'x' || peek == 'X')
- return handle_hex ();
+ if (peek == 'x' || peek == 'X') {
+ val = res = handle_hex (loc);
+#if FULL_AST
+ res.ParsedValue = reader.ReadChars (read_start, reader.Position - 1);
+#endif
+
+ return Token.LITERAL;
+ }
}
decimal_digits (c);
c = get_char ();
// We need to handle the case of
// "1.1" vs "1.string" (LITERAL_FLOAT vs NUMBER DOT IDENTIFIER)
//
+ bool is_real = false;
if (c == '.'){
if (decimal_digits ('.')){
is_real = true;
} else {
putback ('.');
number_pos--;
- return adjust_int (-1);
+ val = res = adjust_int (-1, loc);
+
+#if FULL_AST
+ res.ParsedValue = reader.ReadChars (read_start, reader.Position - 1);
+#endif
+ return Token.LITERAL;
}
}
is_real = true;
if (number_pos == max_number_size)
Error_NumericConstantTooLong ();
- number_builder [number_pos++] = 'e';
+ number_builder [number_pos++] = (char) c;
c = get_char ();
if (c == '+'){
c = get_char ();
}
- type = real_type_suffix (c);
- if (type == Token.NONE && !is_real){
+ var type = real_type_suffix (c);
+ if (type == TypeCode.Empty && !is_real) {
putback (c);
- return adjust_int (c);
- } else
+ res = adjust_int (c, loc);
+ } else {
is_real = true;
- if (type == Token.NONE){
- putback (c);
+ if (type == TypeCode.Empty) {
+ putback (c);
+ }
+
+ res = adjust_real (type, loc);
}
-
- if (is_real)
- return adjust_real (type);
- Console.WriteLine ("This should not be reached");
- throw new Exception ("Is Number should never reach this point");
+ val = res;
+
+#if FULL_AST
+ res.ParsedValue = reader.ReadChars (read_start, reader.Position - (type == TypeCode.Empty ? 1 : 0));
+#endif
+
+ return Token.LITERAL;
}
//
// Accepts exactly count (4 or 8) hex, no more no less
//
- int getHex (int count, out bool error)
+ int getHex (int count, out int surrogate, out bool error)
{
int i;
int total = 0;
get_char ();
error = false;
+ surrogate = 0;
for (i = 0; i < top; i++){
c = get_char ();
-
+
if (c >= '0' && c <= '9')
c = (int) c - (int) '0';
else if (c >= 'A' && c <= 'F')
break;
}
}
+
+ if (top == 8) {
+ if (total > 0x0010FFFF) {
+ error = true;
+ return 0;
+ }
+
+ if (total >= 0x00010000) {
+ surrogate = ((total - 0x00010000) % 0x0400 + 0xDC00);
+ total = ((total - 0x00010000) / 0x0400 + 0xD800);
+ }
+ }
+
return total;
}
- int escape (int c)
+ int escape (int c, out int surrogate)
{
bool error;
int d;
int v;
d = peek_char ();
- if (c != '\\')
+ if (c != '\\') {
+ surrogate = 0;
return c;
+ }
switch (d){
case 'a':
case '\'':
v = '\''; break;
case 'x':
- v = getHex (-1, out error);
+ v = getHex (-1, out surrogate, out error);
if (error)
goto default;
return v;
case 'u':
- v = getHex (4, out error);
- if (error)
- goto default;
- return v;
case 'U':
- v = getHex (8, out error);
- if (error)
- goto default;
- return v;
+ return EscapeUnicode (d, out surrogate);
default:
+ surrogate = 0;
Report.Error (1009, Location, "Unrecognized escape sequence `\\{0}'", ((char)d).ToString ());
return d;
}
+
get_char ();
+ surrogate = 0;
return v;
}
+ int EscapeUnicode (int ch, out int surrogate)
+ {
+ bool error;
+ if (ch == 'U') {
+ ch = getHex (8, out surrogate, out error);
+ } else {
+ ch = getHex (4, out surrogate, out error);
+ }
+
+ if (error)
+ Report.Error (1009, Location, "Unrecognized escape sequence");
+
+ return ch;
+ }
+
int get_char ()
{
int x;
if (putback_char != -1) {
x = putback_char;
putback_char = -1;
- } else
+ } else {
x = reader.Read ();
- if (x == '\n') {
- line++;
- ref_line++;
- previous_col = col;
- col = 0;
}
- else
+
+ if (x == '\r') {
+ if (peek_char () == '\n') {
+ putback_char = -1;
+ }
+
+ x = '\n';
+ advance_line ();
+ } else if (x == '\n') {
+ advance_line ();
+ } else {
col++;
+ }
return x;
}
+ void advance_line ()
+ {
+ line++;
+ ref_line++;
+ previous_col = col;
+ col = 0;
+ }
+
int peek_char ()
{
- if (putback_char != -1)
- return putback_char;
- putback_char = reader.Read ();
+ if (putback_char == -1)
+ putback_char = reader.Read ();
return putback_char;
}
public bool advance ()
{
- return peek_char () != -1;
+ return peek_char () != -1 || CompleteOnEOF;
}
public Object Value {
return val;
}
- static bool IsCastToken (int token)
+ public int token ()
{
- switch (token) {
- case Token.BANG:
- case Token.TILDE:
- case Token.IDENTIFIER:
- case Token.LITERAL_INTEGER:
- case Token.LITERAL_FLOAT:
- case Token.LITERAL_DOUBLE:
- case Token.LITERAL_DECIMAL:
- case Token.LITERAL_CHARACTER:
- case Token.LITERAL_STRING:
- case Token.BASE:
- case Token.CHECKED:
- case Token.DELEGATE:
- case Token.FALSE:
- case Token.FIXED:
- case Token.NEW:
- case Token.NULL:
- case Token.SIZEOF:
- case Token.THIS:
- case Token.THROW:
- case Token.TRUE:
- case Token.TYPEOF:
- case Token.UNCHECKED:
- case Token.UNSAFE:
-#if GMCS_SOURCE
- case Token.DEFAULT:
-#endif
-
- //
- // These can be part of a member access
- //
- case Token.INT:
- case Token.UINT:
- case Token.SHORT:
- case Token.USHORT:
- case Token.LONG:
- case Token.ULONG:
- case Token.DOUBLE:
- case Token.FLOAT:
- case Token.CHAR:
- return true;
-
- default:
- return false;
- }
+ current_token = xtoken ();
+ return current_token;
}
- public int token ()
+ int TokenizePreprocessorIdentifier (out int c)
{
- current_token = xtoken ();
+ // skip over white space
+ do {
+ c = get_char ();
+ } while (c == ' ' || c == '\t');
+
-#if GMCS_SOURCE
- if (current_token != Token.DEFAULT)
- return current_token;
+ int pos = 0;
+ while (c != -1 && c >= 'a' && c <= 'z') {
+ id_builder[pos++] = (char) c;
+ c = get_char ();
+ if (c == '\\') {
+ int peek = peek_char ();
+ if (peek == 'U' || peek == 'u') {
+ int surrogate;
+ c = EscapeUnicode (c, out surrogate);
+ if (surrogate != 0) {
+ if (is_identifier_part_character ((char) c)) {
+ id_builder[pos++] = (char) c;
+ }
+ c = surrogate;
+ }
+ }
+ }
+ }
- PushPosition();
- int c = xtoken();
- if (c == -1)
- current_token = Token.ERROR;
- else if (c == Token.OPEN_PARENS)
- current_token = Token.DEFAULT_OPEN_PARENS;
- else if (c == Token.COLON)
- current_token = Token.DEFAULT_COLON;
- else
- PopPosition();
-#endif
- return current_token;
+ return pos;
}
- static StringBuilder static_cmd_arg = new System.Text.StringBuilder ();
-
- void get_cmd_arg (out string cmd, out string arg)
+ PreprocessorDirective get_cmd_arg (out string arg)
{
- int c;
-
+ int c;
+
tokens_seen = false;
arg = "";
- static_cmd_arg.Length = 0;
+
+ var cmd = GetPreprocessorDirective (id_builder, TokenizePreprocessorIdentifier (out c));
+
+ if ((cmd & PreprocessorDirective.CustomArgumentsParsing) != 0)
+ return cmd;
// skip over white space
- while ((c = get_char ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))
- ;
-
- while ((c != -1) && (c != '\n') && (c != ' ') && (c != '\t') && (c != '\r')){
- if (is_identifier_part_character ((char) c)){
- static_cmd_arg.Append ((char) c);
- c = get_char ();
- } else {
- putback (c);
+ while (c == ' ' || c == '\t')
+ c = get_char ();
+
+ int has_identifier_argument = (int)(cmd & PreprocessorDirective.RequiresArgument);
+ int pos = 0;
+
+ while (c != -1 && c != '\n') {
+ if (c == '\\' && has_identifier_argument >= 0) {
+ if (has_identifier_argument != 0) {
+ has_identifier_argument = 1;
+
+ int peek = peek_char ();
+ if (peek == 'U' || peek == 'u') {
+ int surrogate;
+ c = EscapeUnicode (c, out surrogate);
+ if (surrogate != 0) {
+ if (is_identifier_part_character ((char) c)) {
+ if (pos == value_builder.Length)
+ Array.Resize (ref value_builder, pos * 2);
+
+ value_builder[pos++] = (char) c;
+ }
+ c = surrogate;
+ }
+ }
+ } else {
+ has_identifier_argument = -1;
+ }
+ } else if (c == '/' && peek_char () == '/') {
+ //
+ // Eat single-line comments
+ //
+ get_char ();
+ do {
+ c = get_char ();
+ } while (c != -1 && c != '\n');
+
break;
}
- }
- cmd = static_cmd_arg.ToString ();
+ if (pos == value_builder.Length)
+ Array.Resize (ref value_builder, pos * 2);
- if (c == '\n' || c == '\r'){
- return;
+ value_builder[pos++] = (char) c;
+ c = get_char ();
}
- // skip over white space
- while ((c = get_char ()) != -1 && (c != '\n') && ((c == '\r') || (c == ' ') || (c == '\t')))
- ;
+ if (pos != 0) {
+ if (pos > max_id_size)
+ arg = new string (value_builder, 0, pos);
+ else
+ arg = InternIdentifier (value_builder, pos);
- if (c == '\n'){
- return;
- } else if (c == '\r'){
- return;
- } else if (c == -1){
- arg = "";
- return;
- }
-
- static_cmd_arg.Length = 0;
- static_cmd_arg.Append ((char) c);
-
- while ((c = get_char ()) != -1 && (c != '\n') && (c != '\r')){
- static_cmd_arg.Append ((char) c);
+ // Eat any trailing whitespace
+ arg = arg.Trim (simple_whitespaces);
}
- arg = static_cmd_arg.ToString ();
+ return cmd;
}
//
if (arg == "default"){
ref_line = line;
ref_name = file_name;
- Location.Push (ref_name);
+ hidden = false;
+ Location.Push (file_name, ref_name);
return true;
} else if (arg == "hidden"){
- //
- // We ignore #line hidden
- //
+ hidden = true;
return true;
}
char [] quotes = { '\"' };
string name = arg.Substring (pos). Trim (quotes);
- ref_name = Location.LookupFile (name);
- file_name.HasLineDirective = true;
- ref_name.HasLineDirective = true;
- Location.Push (ref_name);
+ ref_name = context.LookupFile (file_name, name);
+ file_name.AddIncludeFile (ref_name);
+ hidden = false;
+ Location.Push (file_name, ref_name);
} else {
ref_line = System.Int32.Parse (arg);
+ hidden = false;
}
} catch {
return false;
//
// Handles #define and #undef
//
- void PreProcessDefinition (bool is_define, string arg, bool caller_is_taking)
+ void PreProcessDefinition (bool is_define, string ident, bool caller_is_taking)
{
- if (arg.Length == 0 || arg == "true" || arg == "false"){
- Report.Error (1001, Location, "Missing identifer to pre-processor directive");
+ if (ident.Length == 0 || ident == "true" || ident == "false"){
+ Report.Error (1001, Location, "Missing identifier to pre-processor directive");
return;
}
- if (arg.IndexOfAny (simple_whitespaces) != -1){
+ if (ident.IndexOfAny (simple_whitespaces) != -1){
Error_EndLineExpected ();
return;
}
- if (!is_identifier_start_character (arg [0]))
- Report.Error (1001, Location, "Identifier expected: " + arg);
+ if (!is_identifier_start_character (ident [0]))
+ Report.Error (1001, Location, "Identifier expected: {0}", ident);
- foreach (char c in arg.Substring (1)){
+ foreach (char c in ident.Substring (1)){
if (!is_identifier_part_character (c)){
- Report.Error (1001, Location, "Identifier expected: " + arg);
+ Report.Error (1001, Location, "Identifier expected: {0}", ident);
return;
}
}
if (!caller_is_taking)
return;
- if (is_define){
- if (defines == null)
- defines = new Hashtable ();
- define (arg);
- } else {
- if (defines == null)
+ if (is_define) {
+ //
+ // #define ident
+ //
+ if (context.Settings.IsConditionalSymbolDefined (ident))
return;
- if (defines.Contains (arg))
- defines.Remove (arg);
+
+ file_name.AddDefine (ident);
+ } else {
+ //
+ // #undef ident
+ //
+ file_name.AddUndefine (ident);
}
}
- /// <summary>
- /// Handles #pragma directive
- /// </summary>
- void PreProcessPragma (string arg)
+ byte read_hex (out bool error)
{
- const string warning = "warning";
- const string w_disable = "warning disable";
- const string w_restore = "warning restore";
+ int total;
+ int c = get_char ();
- if (arg == w_disable) {
- Report.RegisterWarningRegion (Location).WarningDisable (line);
- return;
+ if ((c >= '0') && (c <= '9'))
+ total = (int) c - (int) '0';
+ else if ((c >= 'A') && (c <= 'F'))
+ total = (int) c - (int) 'A' + 10;
+ else if ((c >= 'a') && (c <= 'f'))
+ total = (int) c - (int) 'a' + 10;
+ else {
+ error = true;
+ return 0;
}
- if (arg == w_restore) {
- Report.RegisterWarningRegion (Location).WarningEnable (line);
- return;
+ total *= 16;
+ c = get_char ();
+
+ if ((c >= '0') && (c <= '9'))
+ total += (int) c - (int) '0';
+ else if ((c >= 'A') && (c <= 'F'))
+ total += (int) c - (int) 'A' + 10;
+ else if ((c >= 'a') && (c <= 'f'))
+ total += (int) c - (int) 'a' + 10;
+ else {
+ error = true;
+ return 0;
}
- if (arg.StartsWith (w_disable)) {
- int[] codes = ParseNumbers (arg.Substring (w_disable.Length));
- foreach (int code in codes) {
- if (code != 0)
- Report.RegisterWarningRegion (Location).WarningDisable (Location, code);
+ error = false;
+ return (byte) total;
+ }
+
+ //
+ // Parses #pragma checksum
+ //
+ bool ParsePragmaChecksum ()
+ {
+ //
+ // The syntax is ` "foo.txt" "{guid}" "hash"'
+ //
+ int c = get_char ();
+
+ if (c != '"')
+ return false;
+
+ string_builder.Length = 0;
+ while (c != -1 && c != '\n') {
+ c = get_char ();
+ if (c == '"') {
+ c = get_char ();
+ break;
}
- return;
+
+ string_builder.Append ((char) c);
}
- if (arg.StartsWith (w_restore)) {
- int[] codes = ParseNumbers (arg.Substring (w_restore.Length));
- Hashtable w_table = Report.warning_ignore_table;
- foreach (int code in codes) {
- if (w_table != null && w_table.Contains (code))
- Report.Warning (1635, 1, Location, String.Format ("Cannot restore warning `CS{0:0000}' because it was disabled globally", code));
- Report.RegisterWarningRegion (Location).WarningEnable (Location, code);
- }
- return;
+ if (string_builder.Length == 0) {
+ Report.Warning (1709, 1, Location, "Filename specified for preprocessor directive is empty");
}
- if (arg.StartsWith (warning)) {
- Report.Warning (1634, 1, Location, "Expected disable or restore");
- return;
+ // TODO: Accept any amount of whitespace here, not just a single space
+ if (c != ' ')
+ return false;
+
+ SourceFile file = context.LookupFile (file_name, string_builder.ToString ());
+
+ if (get_char () != '"' || get_char () != '{')
+ return false;
+
+ bool error;
+ byte[] guid_bytes = new byte [16];
+ int i = 0;
+
+ for (; i < 4; i++) {
+ guid_bytes [i] = read_hex (out error);
+ if (error)
+ return false;
}
- Report.Warning (1633, 1, Location, "Unrecognized #pragma directive");
+ if (get_char () != '-')
+ return false;
+
+ for (; i < 10; i++) {
+ guid_bytes [i] = read_hex (out error);
+ if (error)
+ return false;
+
+ guid_bytes [i++] = read_hex (out error);
+ if (error)
+ return false;
+
+ if (get_char () != '-')
+ return false;
+ }
+
+ for (; i < 16; i++) {
+ guid_bytes [i] = read_hex (out error);
+ if (error)
+ return false;
+ }
+
+ if (get_char () != '}' || get_char () != '"')
+ return false;
+
+ // TODO: Accept any amount of whitespace here, not just a single space
+ c = get_char ();
+ if (c != ' ')
+ return false;
+
+ if (get_char () != '"')
+ return false;
+
+ // Any length of checksum
+ List<byte> checksum_bytes = new List<byte> (16);
+
+ c = peek_char ();
+ while (c != '"' && c != -1) {
+ checksum_bytes.Add (read_hex (out error));
+ if (error)
+ return false;
+
+ c = peek_char ();
+ }
+
+ if (c == '/') {
+ ReadSingleLineComment ();
+ } else if (get_char () != '"') {
+ return false;
+ }
+
+ file.SetChecksum (guid_bytes, checksum_bytes.ToArray ());
+ ref_name.AutoGenerated = true;
+ return true;
}
- int[] ParseNumbers (string text)
+ bool IsTokenIdentifierEqual (char[] identifier)
{
- string[] string_array = text.Split (',');
- int[] values = new int [string_array.Length];
- int index = 0;
- foreach (string string_code in string_array) {
+ for (int i = 0; i < identifier.Length; ++i) {
+ if (identifier[i] != id_builder[i])
+ return false;
+ }
+
+ return true;
+ }
+
+ int TokenizePragmaNumber (ref int c)
+ {
+ number_pos = 0;
+
+ int number;
+
+ if (c >= '0' && c <= '9') {
+ decimal_digits (c);
+ uint ui = (uint) (number_builder[0] - '0');
+
try {
- values[index++] = int.Parse (string_code, System.Globalization.CultureInfo.InvariantCulture);
+ for (int i = 1; i < number_pos; i++) {
+ ui = checked ((ui * 10) + ((uint) (number_builder[i] - '0')));
+ }
+
+ number = (int) ui;
+ } catch (OverflowException) {
+ Error_NumericConstantTooLong ();
+ number = -1;
}
- catch (FormatException) {
+
+
+ c = get_char ();
+
+ // skip over white space
+ while (c == ' ' || c == '\t')
+ c = get_char ();
+
+ if (c == ',') {
+ c = get_char ();
+ }
+
+ // skip over white space
+ while (c == ' ' || c == '\t')
+ c = get_char ();
+ } else {
+ number = -1;
+ if (c == '/') {
+ ReadSingleLineComment ();
+ } else {
Report.Warning (1692, 1, Location, "Invalid number");
+
+ // Read everything till the end of the line or file
+ do {
+ c = get_char ();
+ } while (c != -1 && c != '\n');
+ }
+ }
+
+ return number;
+ }
+
+ void ReadSingleLineComment ()
+ {
+ if (peek_char () != '/')
+ Report.Warning (1696, 1, Location, "Single-line comment or end-of-line expected");
+
+ // Read everything till the end of the line or file
+ int c;
+ do {
+ c = get_char ();
+ } while (c != -1 && c != '\n');
+ }
+
+ /// <summary>
+ /// Handles #pragma directive
+ /// </summary>
+ void ParsePragmaDirective (string arg)
+ {
+ int c;
+ int length = TokenizePreprocessorIdentifier (out c);
+ if (length == pragma_warning.Length && IsTokenIdentifierEqual (pragma_warning)) {
+ length = TokenizePreprocessorIdentifier (out c);
+
+ //
+ // #pragma warning disable
+ // #pragma warning restore
+ //
+ if (length == pragma_warning_disable.Length) {
+ bool disable = IsTokenIdentifierEqual (pragma_warning_disable);
+ if (disable || IsTokenIdentifierEqual (pragma_warning_restore)) {
+ // skip over white space
+ while (c == ' ' || c == '\t')
+ c = get_char ();
+
+ var loc = Location;
+
+ if (c == '\n' || c == '/') {
+ if (c == '/')
+ ReadSingleLineComment ();
+
+ //
+ // Disable/Restore all warnings
+ //
+ if (disable) {
+ Report.RegisterWarningRegion (loc).WarningDisable (loc.Row);
+ } else {
+ Report.RegisterWarningRegion (loc).WarningEnable (loc.Row);
+ }
+ } else {
+ //
+ // Disable/Restore a warning or group of warnings
+ //
+ int code;
+ do {
+ code = TokenizePragmaNumber (ref c);
+ if (code > 0) {
+ if (disable) {
+ Report.RegisterWarningRegion (loc).WarningDisable (loc, code, Report);
+ } else {
+ Report.RegisterWarningRegion (loc).WarningEnable (loc, code, Report);
+ }
+ }
+ } while (code >= 0 && c != '\n' && c != -1);
+ }
+
+ return;
+ }
+ }
+
+ Report.Warning (1634, 1, Location, "Expected disable or restore");
+ return;
+ }
+
+ //
+ // #pragma checksum
+ //
+ if (length == pragma_checksum.Length && IsTokenIdentifierEqual (pragma_checksum)) {
+ if (c != ' ' || !ParsePragmaChecksum ()) {
+ Report.Warning (1695, 1, Location,
+ "Invalid #pragma checksum syntax. Expected \"filename\" \"{XXXXXXXX-XXXX-XXXX-XXXX-XXXXXXXXXXXX}\" \"XXXX...\"");
}
+
+ return;
}
- return values;
+
+ Report.Warning (1633, 1, Location, "Unrecognized #pragma directive");
}
bool eval_val (string s)
return true;
if (s == "false")
return false;
-
- if (defines == null)
- return false;
- if (defines.Contains (s))
- return true;
- return false;
+ return file_name.IsConditionalDefined (context, s);
}
bool pp_primary (ref string s)
void Error_NumericConstantTooLong ()
{
- Report.Error (1021, Location, "Numeric constant too long");
+ Report.Error (1021, Location, "Integral constant is too large");
}
void Error_InvalidDirective ()
{
Report.Error (
1028, Location,
- "Unexpected processor directive (" + extra + ")");
- }
-
- void Error_TokenExpected (string token)
- {
- Report.Error (1026, Location, "Expecting `{0}'", token);
+ "Unexpected processor directive ({0})", extra);
}
void Error_TokensSeen ()
{
Report.Error (1025, Location, "Single-line comment or end-of-line expected");
}
+
+		//
+		// Reports warning 1587 at `loc' for a documentation comment that
+		// was found where it cannot be attached to a language element.
+		// doc_state is switched to Error first, so the warning is skipped
+		// whenever doc_state is already Error.
+		//
+		void WarningMisplacedComment (Location loc)
+		{
+			if (doc_state == XmlCommentState.Error)
+				return;
+
+			doc_state = XmlCommentState.Error;
+			Report.Warning (1587, 2, loc, "XML comment is not placed on a valid language element");
+		}
//
// if true, then the code continues processing the code
// reached.
// When caller_is_taking is false we ignore all directives except the ones
// which can help us to identify where the #if block ends
- bool handle_preprocessing_directive (bool caller_is_taking)
+ bool ParsePreprocessingDirective (bool caller_is_taking)
{
- string cmd, arg;
+ string arg;
bool region_directive = false;
- get_cmd_arg (out cmd, out arg);
-
- // Eat any trailing whitespaces and single-line comments
- if (arg.IndexOf ("//") != -1)
- arg = arg.Substring (0, arg.IndexOf ("//"));
- arg = arg.Trim (simple_whitespaces);
+ var directive = get_cmd_arg (out arg);
//
// The first group of pre-processing instructions is always processed
//
- switch (cmd){
- case "region":
+ switch (directive) {
+ case PreprocessorDirective.Region:
region_directive = true;
arg = "true";
- goto case "if";
+ goto case PreprocessorDirective.If;
- case "endregion":
+ case PreprocessorDirective.Endregion:
if (ifstack == null || ifstack.Count == 0){
Error_UnexpectedDirective ("no #region for this #endregion");
return true;
}
- int pop = (int) ifstack.Pop ();
+ int pop = ifstack.Pop ();
if ((pop & REGION) == 0)
Report.Error (1027, Location, "Expected `#endif' directive");
return caller_is_taking;
- case "if":
+ case PreprocessorDirective.If:
if (ifstack == null)
- ifstack = new Stack (2);
+ ifstack = new Stack<int> (2);
int flags = region_directive ? REGION : 0;
if (ifstack.Count == 0){
flags |= PARENT_TAKING;
} else {
- int state = (int) ifstack.Peek ();
+ int state = ifstack.Peek ();
if ((state & TAKING) != 0) {
flags |= PARENT_TAKING;
}
}
- if (caller_is_taking && eval (arg)) {
+ if (eval (arg) && caller_is_taking) {
ifstack.Push (flags | TAKING);
return true;
}
ifstack.Push (flags);
return false;
-
- case "endif":
+
+ case PreprocessorDirective.Endif:
if (ifstack == null || ifstack.Count == 0){
Error_UnexpectedDirective ("no #if for this #endif");
return true;
} else {
- pop = (int) ifstack.Pop ();
+ pop = ifstack.Pop ();
if ((pop & REGION) != 0)
Report.Error (1038, Location, "#endregion directive expected");
if (ifstack.Count == 0)
return true;
- int state = (int) ifstack.Peek ();
+ int state = ifstack.Peek ();
return (state & TAKING) != 0;
}
- case "elif":
+ case PreprocessorDirective.Elif:
if (ifstack == null || ifstack.Count == 0){
Error_UnexpectedDirective ("no #if for this #elif");
return true;
} else {
- int state = (int) ifstack.Pop ();
+ int state = ifstack.Pop ();
if ((state & REGION) != 0) {
Report.Error (1038, Location, "#endregion directive expected");
return false;
}
- case "else":
+ case PreprocessorDirective.Else:
if (ifstack == null || ifstack.Count == 0){
Error_UnexpectedDirective ("no #if for this #else");
return true;
} else {
- int state = (int) ifstack.Peek ();
+ int state = ifstack.Peek ();
if ((state & REGION) != 0) {
Report.Error (1038, Location, "#endregion directive expected");
return ret;
}
- case "define":
- if (any_token_seen){
- Error_TokensSeen ();
- return caller_is_taking;
- }
- PreProcessDefinition (true, arg, caller_is_taking);
+ case PreprocessorDirective.Define:
+ if (any_token_seen){
+ Error_TokensSeen ();
return caller_is_taking;
+ }
+ PreProcessDefinition (true, arg, caller_is_taking);
+ return caller_is_taking;
- case "undef":
- if (any_token_seen){
- Error_TokensSeen ();
- return caller_is_taking;
- }
- PreProcessDefinition (false, arg, caller_is_taking);
+ case PreprocessorDirective.Undef:
+ if (any_token_seen){
+ Error_TokensSeen ();
return caller_is_taking;
+ }
+ PreProcessDefinition (false, arg, caller_is_taking);
+ return caller_is_taking;
+
+ case PreprocessorDirective.Invalid:
+ Report.Error (1024, Location, "Wrong preprocessor directive");
+ return true;
}
//
if (!caller_is_taking)
return false;
- switch (cmd){
- case "error":
- Report.Error (1029, Location, "#error: '" + arg + "'");
+ switch (directive){
+ case PreprocessorDirective.Error:
+ Report.Error (1029, Location, "#error: '{0}'", arg);
return true;
- case "warning":
+ case PreprocessorDirective.Warning:
Report.Warning (1030, 1, Location, "#warning: `{0}'", arg);
return true;
- case "pragma":
- if (RootContext.Version == LanguageVersion.ISO_1) {
- Report.FeatureIsNotISO1 (Location, "#pragma");
- return true;
+ case PreprocessorDirective.Pragma:
+ if (context.Settings.Version == LanguageVersion.ISO_1) {
+ Report.FeatureIsNotAvailable (context, Location, "#pragma");
}
- PreProcessPragma (arg);
+ ParsePragmaDirective (arg);
return true;
- case "line":
+ case PreprocessorDirective.Line:
if (!PreProcessLine (arg))
Report.Error (
1576, Location,
return caller_is_taking;
}
- Report.Error (1024, Location, "Wrong preprocessor directive");
- return true;
-
+ throw new NotImplementedException (directive.ToString ());
}
private int consume_string (bool quoted)
{
int c;
- string_builder.Length = 0;
-
- while ((c = get_char ()) != -1){
- if (c == '"'){
- if (quoted && peek_char () == '"'){
- string_builder.Append ((char) c);
+ int pos = 0; // number of chars written to value_builder so far
+ Location start_location = Location;
+ if (quoted)
+ start_location = start_location - 1; // NOTE(review): presumably steps back over the leading @ - confirm
+
+#if FULL_AST
+ int reader_pos = reader.Position;
+#endif
+
+ while (true){
+ c = get_char ();
+ if (c == '"') {
+ if (quoted && peek_char () == '"') {
+ if (pos == value_builder.Length)
+ Array.Resize (ref value_builder, pos * 2); // buffer is full, double it
+
+ value_builder[pos++] = (char) c; // a doubled quote in a quoted string stores one quote char
get_char ();
continue;
- } else {
- val = string_builder.ToString ();
- return Token.LITERAL_STRING;
}
- }
- if (c == '\n'){
- if (!quoted)
- Report.Error (1010, Location, "Newline in constant");
+ string s;
+ if (pos == 0)
+ s = string.Empty;
+ else if (pos <= 4) // short strings are taken from the identifier cache
+ s = InternIdentifier (value_builder, pos);
+ else
+ s = new string (value_builder, 0, pos);
+
+ ILiteralConstant res = new StringLiteral (context.BuiltinTypes, s, start_location);
+ val = res;
+#if FULL_AST
+ res.ParsedValue = quoted ?
+ reader.ReadChars (reader_pos - 2, reader.Position - 1) :
+ reader.ReadChars (reader_pos - 1, reader.Position);
+#endif
+
+ return Token.LITERAL;
}
- if (!quoted){
- c = escape (c);
+ if (c == '\n') {
+ if (!quoted) {
+ Report.Error (1010, Location, "Newline in constant");
+ val = new StringLiteral (context.BuiltinTypes, new string (value_builder, 0, pos), start_location);
+ return Token.LITERAL;
+ }
+ } else if (c == '\\' && !quoted) {
+ int surrogate;
+ c = escape (c, out surrogate); // escapes are decoded only when not quoted
if (c == -1)
return Token.ERROR;
+ if (surrogate != 0) {
+ if (pos == value_builder.Length)
+ Array.Resize (ref value_builder, pos * 2);
+
+ value_builder[pos++] = (char) c;
+ c = surrogate; // second char is appended by the common code below
+ }
+ } else if (c == -1) {
+ Report.Error (1039, Location, "Unterminated string literal");
+ return Token.EOF; // input ended before the closing quote
}
- string_builder.Append ((char) c);
- }
- Report.Error (1039, Location, "Unterminated string literal");
- return Token.EOF;
+ if (pos == value_builder.Length)
+ Array.Resize (ref value_builder, pos * 2);
+
+ value_builder[pos++] = (char) c;
+ }
}
private int consume_identifier (int s)
if (doc_state == XmlCommentState.Allowed)
doc_state = XmlCommentState.NotAllowed;
- switch (res) {
- case Token.USING:
- case Token.NAMESPACE:
- check_incorrect_doc_comment ();
- break;
- }
-
- if (res == Token.PARTIAL) {
- if (parsing_block > 0) {
- val = new LocatedToken (Location, "partial");
- return Token.IDENTIFIER;
- }
-
- // Save current position and parse next token.
- PushPosition ();
- int next_token = token ();
- bool ok = (next_token == Token.CLASS) ||
- (next_token == Token.STRUCT) ||
- (next_token == Token.INTERFACE);
+ return res;
+ }
- PopPosition ();
+ int consume_identifier (int c, bool quoted)
+ {
+ //
+ // This method is very performance sensitive. It accounts
+ // for approximately 25% of all parser time
+ //
- if (ok) {
- if (RootContext.Version == LanguageVersion.ISO_1)
- Report.FeatureIsNotISO1 (Location, "partial types");
+ int pos = 0; // number of chars stored in id_builder so far
+ int column = col;
+ if (quoted)
+ --column; // NOTE(review): presumably covers the leading @ of a quoted identifier - confirm
- return res;
+ if (c == '\\') {
+ int surrogate;
+ c = escape (c, out surrogate);
+ if (surrogate != 0) {
+ id_builder [pos++] = (char) c;
+ c = surrogate;
}
+ }
- if (next_token < Token.LAST_KEYWORD)
- Report.Error (267, Location, "The `partial' modifier can be used only immediately before keyword `class', `struct', or `interface'");
+ id_builder [pos++] = (char) c;
- val = new LocatedToken (Location, "partial");
- return Token.IDENTIFIER;
- }
+ try {
+ while (true) {
+ c = reader.Read (); // reads straight from reader; col is adjusted once after the loop
- return res;
- }
+ if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '_' || (c >= '0' && c <= '9')) {
+ id_builder [pos++] = (char) c;
+ continue;
+ }
- private int consume_identifier (int s, bool quoted)
- {
- int pos = 1;
- int c = -1;
-
- id_builder [0] = (char) s;
+ if (c < 0x80) {
+ if (c == '\\') {
+ int surrogate;
+ c = escape (c, out surrogate);
+ if (is_identifier_part_character ((char) c))
+ id_builder[pos++] = (char) c;
- current_location = new Location (ref_line, Col);
+ if (surrogate != 0) {
+ c = surrogate; // NOTE(review): c is reassigned by reader.Read () right after the continue, so this value is never stored - confirm intended
+ }
- while ((c = get_char ()) != -1) {
- loop:
- if (is_identifier_part_character ((char) c)){
- if (pos == max_id_size){
- Report.Error (645, Location, "Identifier too long (limit is 512 chars)");
- return Token.ERROR;
+ continue;
+ }
+ } else if (Char.IsLetter ((char) c) || Char.GetUnicodeCategory ((char) c) == UnicodeCategory.ConnectorPunctuation) {
+ id_builder [pos++] = (char) c;
+ continue;
}
-
- id_builder [pos++] = (char) c;
-// putback_char = -1;
- } else if (c == '\\') {
- c = escape (c);
- goto loop;
- } else {
-// putback_char = c;
- putback (c);
+
+ putback_char = c; // the first char that does not continue the identifier is handed back
break;
}
+ } catch (IndexOutOfRangeException) { // a write past the end of id_builder is treated as an over-long identifier
+ Report.Error (645, Location, "Identifier too long (limit is 512 chars)");
+ --pos;
+ col += pos;
}
+ col += pos - 1;
+
//
// Optimization: avoids doing the keyword lookup
- // on uppercase letters and _
+ // on uppercase letters
//
- if (!quoted && (s >= 'a' || s == '_')){
+ if (id_builder [0] >= '_' && !quoted) {
int keyword = GetKeyword (id_builder, pos);
if (keyword != -1) {
- val = Location;
+ val = LocatedToken.Create (keyword == Token.AWAIT ? "await" : null, ref_line, column);
return keyword;
}
}
+ string s = InternIdentifier (id_builder, pos);
+ val = LocatedToken.Create (s, ref_line, column);
+ if (quoted && parsing_attribute_section)
+ AddEscapedIdentifier (((LocatedToken) val).Location);
+
+ return Token.IDENTIFIER;
+ }
+
+ static string InternIdentifier (char[] charBuffer, int length)
+ {
//
// Keep identifiers in an array of hashtables to avoid needless
// allocations
//
-
- if (identifiers [pos] != null) {
- val = identifiers [pos][id_builder];
- if (val != null) {
- val = new LocatedToken (Location, (string) val);
- if (quoted)
- escaped_identifiers.Add (val);
- return Token.IDENTIFIER;
- }
- }
- else
- identifiers [pos] = new CharArrayHashtable (pos);
-
- val = new String (id_builder, 0, pos);
- if (RootContext.Version == LanguageVersion.ISO_1) {
- for (int i = 1; i < id_builder.Length; i += 3) {
- if (id_builder [i] == '_' && (id_builder [i - 1] == '_' || id_builder [i + 1] == '_')) {
- Report.Error (1638, Location,
- "`{0}': Any identifier with double underscores cannot be used when ISO language version mode is specified", val.ToString ());
- break;
- }
+ var identifiers_group = identifiers[length]; // caches are bucketed by identifier length
+ string s;
+ if (identifiers_group != null) {
+ if (identifiers_group.TryGetValue (charBuffer, out s)) {
+ return s;
}
+ } else {
+ // TODO: this should depend on the number of files
+ // corlib compilation peaks at 1000 and System.Core at 150
+ int capacity = length > 20 ? 10 : 100;
+ identifiers_group = new Dictionary<char[], string> (capacity, new IdentifiersComparer (length)); // comparer inspects only the first length chars of a key
+ identifiers[length] = identifiers_group;
}
- char [] chars = new char [pos];
- Array.Copy (id_builder, chars, pos);
-
- identifiers [pos] [chars] = val;
+ char[] chars = new char[length]; // the key is a private copy, charBuffer itself is not stored
+ Array.Copy (charBuffer, chars, length);
- val = new LocatedToken (Location, (string) val);
- if (quoted)
- escaped_identifiers.Add (val);
- return Token.IDENTIFIER;
+ s = new string (charBuffer, 0, length);
+ identifiers_group.Add (chars, s);
+ return s;
}
public int xtoken ()
{
- int t;
- bool doread = false;
- int c;
+ int d, c;
// Whether we have seen comments on the current line
bool comments_seen = false;
- val = null;
- for (;(c = get_char ()) != -1;) {
- if (c == '\t'){
- col = ((col + 8) / 8) * 8;
+ while ((c = get_char ()) != -1) {
+ switch (c) {
+ case '\t':
+ col = ((col - 1 + tab_size) / tab_size) * tab_size;
continue;
- }
-
- if (c == ' ' || c == '\f' || c == '\v' || c == 0xa0 || c == 0)
+
+ case ' ':
+ case '\f':
+ case '\v':
+ case 0xa0:
+ case 0:
+ case 0xFEFF: // Ignore BOM anywhere in the file
continue;
- if (c == '\r') {
- if (peek_char () == '\n')
+/* This is required for compatibility with .NET
+ case 0xEF:
+ if (peek_char () == 0xBB) {
+ PushPosition ();
get_char ();
+ if (get_char () == 0xBF)
+ continue;
+ PopPosition ();
+ }
+ break;
+*/
+ case '\\':
+ tokens_seen = true;
+ return consume_identifier (c);
- any_token_seen |= tokens_seen;
- tokens_seen = false;
- comments_seen = false;
- continue;
- }
+ case '{':
+ val = LocatedToken.Create (ref_line, col);
+ return Token.OPEN_BRACE;
+ case '}':
+ val = LocatedToken.Create (ref_line, col);
+ return Token.CLOSE_BRACE;
+ case '[':
+ // To block doccomment inside attribute declaration.
+ if (doc_state == XmlCommentState.Allowed)
+ doc_state = XmlCommentState.NotAllowed;
+
+ val = LocatedToken.Create (ref_line, col);
+
+ if (parsing_block == 0 || lambda_arguments_parsing)
+ return Token.OPEN_BRACKET;
+
+ int next = peek_char ();
+ switch (next) {
+ case ']':
+ case ',':
+ return Token.OPEN_BRACKET;
+
+ case ' ':
+ case '\f':
+ case '\v':
+ case '\r':
+ case '\n':
+ case '/':
+ next = peek_token ();
+ if (next == Token.COMMA || next == Token.CLOSE_BRACKET)
+ return Token.OPEN_BRACKET;
+
+ return Token.OPEN_BRACKET_EXPR;
+ default:
+ return Token.OPEN_BRACKET_EXPR;
+ }
+ case ']':
+ LocatedToken.CreateOptional (ref_line, col, ref val);
+ return Token.CLOSE_BRACKET;
+ case '(':
+ val = LocatedToken.Create (ref_line, col);
+ //
+ // The expression form of parens can appear in block context only
+ //
+ if (parsing_block != 0 && !lambda_arguments_parsing) {
+
+ //
+ // Optimize the most common case where we know that the parens
+ // are not special
+ //
+ switch (current_token) {
+ case Token.IDENTIFIER:
+ case Token.IF:
+ case Token.FOR:
+ case Token.FOREACH:
+ case Token.TYPEOF:
+ case Token.WHILE:
+ case Token.USING:
+ case Token.DEFAULT:
+ case Token.DELEGATE:
+ case Token.OP_GENERICS_GT:
+ return Token.OPEN_PARENS;
+ }
- // Handle double-slash comments.
- if (c == '/'){
- int d = peek_char ();
-
- if (d == '/'){
+ // Optimize using peek
+ int xx = peek_char ();
+ switch (xx) {
+ case '(':
+ case '\'':
+ case '"':
+ case '0':
+ case '1':
+ return Token.OPEN_PARENS;
+ }
+
+ lambda_arguments_parsing = true;
+ PushPosition ();
+ d = TokenizeOpenParens ();
+ PopPosition ();
+ lambda_arguments_parsing = false;
+ return d;
+ }
+
+ return Token.OPEN_PARENS;
+ case ')':
+ LocatedToken.CreateOptional (ref_line, col, ref val);
+ return Token.CLOSE_PARENS;
+ case ',':
+ LocatedToken.CreateOptional (ref_line, col, ref val);
+ return Token.COMMA;
+ case ';':
+ LocatedToken.CreateOptional (ref_line, col, ref val);
+ return Token.SEMICOLON;
+ case '~':
+ val = LocatedToken.Create (ref_line, col);
+ return Token.TILDE;
+ case '?':
+ val = LocatedToken.Create (ref_line, col);
+ return TokenizePossibleNullableType ();
+ case '<':
+ val = LocatedToken.Create (ref_line, col);
+ if (parsing_generic_less_than++ > 0)
+ return Token.OP_GENERICS_LT;
+
+ return TokenizeLessThan ();
+
+ case '>':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+
+ if (d == '='){
get_char ();
- if (RootContext.Documentation != null && peek_char () == '/') {
+ return Token.OP_GE;
+ }
+
+ if (parsing_generic_less_than > 1 || (parsing_generic_less_than == 1 && d != '>')) {
+ parsing_generic_less_than--;
+ return Token.OP_GENERICS_GT;
+ }
+
+ if (d == '>') {
+ get_char ();
+ d = peek_char ();
+
+ if (d == '=') {
get_char ();
- // Don't allow ////.
- if ((d = peek_char ()) != '/') {
- update_comment_location ();
- if (doc_state == XmlCommentState.Allowed)
- handle_one_line_xml_comment ();
- else if (doc_state == XmlCommentState.NotAllowed)
- warn_incorrect_doc_comment ();
- }
+ return Token.OP_SHIFT_RIGHT_ASSIGN;
}
- while ((d = get_char ()) != -1 && (d != '\n') && d != '\r')
- if (d == '\n'){
+ return Token.OP_SHIFT_RIGHT;
+ }
+
+ return Token.OP_GT;
+
+ case '+':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+ if (d == '+') {
+ d = Token.OP_INC;
+ } else if (d == '=') {
+ d = Token.OP_ADD_ASSIGN;
+ } else {
+ return Token.PLUS;
+ }
+ get_char ();
+ return d;
+
+ case '-':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+ if (d == '-') {
+ d = Token.OP_DEC;
+ } else if (d == '=')
+ d = Token.OP_SUB_ASSIGN;
+ else if (d == '>')
+ d = Token.OP_PTR;
+ else {
+ return Token.MINUS;
+ }
+ get_char ();
+ return d;
+
+ case '!':
+ val = LocatedToken.Create (ref_line, col);
+ if (peek_char () == '='){
+ get_char ();
+ return Token.OP_NE;
+ }
+ return Token.BANG;
+
+ case '=':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+ if (d == '='){
+ get_char ();
+ return Token.OP_EQ;
+ }
+ if (d == '>'){
+ get_char ();
+ return Token.ARROW;
+ }
+
+ return Token.ASSIGN;
+
+ case '&':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+ if (d == '&'){
+ get_char ();
+ return Token.OP_AND;
+ }
+ if (d == '='){
+ get_char ();
+ return Token.OP_AND_ASSIGN;
+ }
+ return Token.BITWISE_AND;
+
+ case '|':
+ val = LocatedToken.Create (ref_line, col);
+ d = peek_char ();
+ if (d == '|'){
+ get_char ();
+ return Token.OP_OR;
+ }
+ if (d == '='){
+ get_char ();
+ return Token.OP_OR_ASSIGN;
+ }
+ return Token.BITWISE_OR;
+
+ case '*':
+ val = LocatedToken.Create (ref_line, col);
+ if (peek_char () == '='){
+ get_char ();
+ return Token.OP_MULT_ASSIGN;
+ }
+ return Token.STAR;
+
+ case '/':
+ d = peek_char ();
+ if (d == '='){
+ val = LocatedToken.Create (ref_line, col);
+ get_char ();
+ return Token.OP_DIV_ASSIGN;
+ }
+
+ // Handle double-slash comments.
+ if (d == '/'){
+ get_char ();
+ if (doc_processing) {
+ if (peek_char () == '/') {
+ get_char ();
+ // Don't allow ////.
+ if ((d = peek_char ()) != '/') {
+ if (doc_state == XmlCommentState.Allowed)
+ handle_one_line_xml_comment ();
+ else if (doc_state == XmlCommentState.NotAllowed)
+ WarningMisplacedComment (Location - 3);
+ }
+ } else {
+ if (xml_comment_buffer.Length > 0)
+ doc_state = XmlCommentState.NotAllowed;
}
+ }
+
+ while ((d = get_char ()) != -1 && d != '\n');
+
any_token_seen |= tokens_seen;
tokens_seen = false;
comments_seen = false;
} else if (d == '*'){
get_char ();
bool docAppend = false;
- if (RootContext.Documentation != null && peek_char () == '*') {
+ if (doc_processing && peek_char () == '*') {
get_char ();
- update_comment_location ();
// But when it is /**/, just do nothing.
if (peek_char () == '/') {
get_char ();
}
if (doc_state == XmlCommentState.Allowed)
docAppend = true;
- else if (doc_state == XmlCommentState.NotAllowed)
- warn_incorrect_doc_comment ();
+ else if (doc_state == XmlCommentState.NotAllowed) {
+ WarningMisplacedComment (Location - 2);
+ }
}
int current_comment_start = 0;
xml_comment_buffer.Append (Environment.NewLine);
}
- Location start_location = Location;
-
while ((d = get_char ()) != -1){
if (d == '*' && peek_char () == '/'){
get_char ();
}
}
if (!comments_seen)
- Report.Error (1035, start_location, "End-of-file found, '*/' expected");
+ Report.Error (1035, Location, "End-of-file found, '*/' expected");
if (docAppend)
update_formatted_doc_comment (current_comment_start);
continue;
}
- goto is_punct_label;
- }
+ val = LocatedToken.Create (ref_line, col);
+ return Token.DIV;
-
- if (c == '\\' || is_identifier_start_character ((char)c)){
- tokens_seen = true;
- return consume_identifier (c);
- }
+ case '%':
+ val = LocatedToken.Create (ref_line, col);
+ if (peek_char () == '='){
+ get_char ();
+ return Token.OP_MOD_ASSIGN;
+ }
+ return Token.PERCENT;
- is_punct_label:
- current_location = new Location (ref_line, Col);
- if ((t = is_punct ((char)c, ref doread)) != Token.ERROR){
- tokens_seen = true;
- if (doread){
+ case '^':
+ val = LocatedToken.Create (ref_line, col);
+ if (peek_char () == '='){
get_char ();
+ return Token.OP_XOR_ASSIGN;
}
- return t;
- }
+ return Token.CARRET;
+
+ case ':':
+ val = LocatedToken.Create (ref_line, col);
+ if (peek_char () == ':') {
+ get_char ();
+ return Token.DOUBLE_COLON;
+ }
+ return Token.COLON;
+
+ case '0': case '1': case '2': case '3': case '4':
+ case '5': case '6': case '7': case '8': case '9':
+ tokens_seen = true;
+ return is_number (c);
- // white space
- if (c == '\n'){
+ case '\n': // white space
any_token_seen |= tokens_seen;
tokens_seen = false;
comments_seen = false;
continue;
- }
-
- if (c >= '0' && c <= '9'){
- tokens_seen = true;
- return is_number (c);
- }
- if (c == '.'){
+ case '.':
tokens_seen = true;
- int peek = peek_char ();
- if (peek >= '0' && peek <= '9')
+ d = peek_char ();
+ if (d >= '0' && d <= '9')
return is_number (c);
+
+ LocatedToken.CreateOptional (ref_line, col, ref val);
return Token.DOT;
- }
- if (c == '#') {
+ case '#':
if (tokens_seen || comments_seen) {
Eror_WrongPreprocessorLocation ();
return Token.ERROR;
}
- if (handle_preprocessing_directive (true))
+ if (ParsePreprocessingDirective (true))
continue;
bool directive_expected = false;
continue;
}
- if (c == ' ' || c == '\t' || c == '\r' || c == '\n' || c == '\f' || c == '\v' )
+ if (c == ' ' || c == '\t' || c == '\n' || c == '\f' || c == '\v' )
continue;
if (c == '#') {
- if (handle_preprocessing_directive (false))
+ if (ParsePreprocessingDirective (false))
break;
}
directive_expected = false;
}
return Token.EOF;
- }
- if (c == '"')
+ case '"':
return consume_string (false);
- if (c == '\''){
- c = get_char ();
- tokens_seen = true;
- if (c == '\''){
- error_details = "Empty character literal";
- Report.Error (1011, Location, error_details);
- return Token.ERROR;
- }
- if (c == '\r' || c == '\n') {
- Report.Error (1010, Location, "Newline in constant");
- return Token.ERROR;
- }
- c = escape (c);
- if (c == -1)
- return Token.ERROR;
- val = new System.Char ();
- val = (char) c;
- c = get_char ();
-
- if (c != '\''){
- error_details = "Too many characters in character literal";
- Report.Error (1012, Location, error_details);
-
- // Try to recover, read until newline or next "'"
- while ((c = get_char ()) != -1){
- if (c == '\n'){
- break;
- }
- else if (c == '\'')
- break;
- }
- return Token.ERROR;
- }
- return Token.LITERAL_CHARACTER;
- }
+ case '\'':
+ return TokenizeBackslash ();
- if (c == '@') {
+ case '@':
c = get_char ();
if (c == '"') {
tokens_seen = true;
return consume_string (true);
- } else if (is_identifier_start_character ((char) c)){
+ }
+
+ if (is_identifier_start_character (c)){
return consume_identifier (c, true);
- } else {
- Report.Error (1646, Location, "Keyword, identifier, or string expected after verbatim specifier: @");
}
+
+ Report.Error (1646, Location, "Keyword, identifier, or string expected after verbatim specifier: @");
+ return Token.ERROR;
+
+ case EvalStatementParserCharacter:
+ return Token.EVAL_STATEMENT_PARSER;
+ case EvalCompilationUnitParserCharacter:
+ return Token.EVAL_COMPILATION_UNIT_PARSER;
+ case EvalUsingDeclarationsParserCharacter:
+ return Token.EVAL_USING_DECLARATIONS_UNIT_PARSER;
+ case DocumentationXref:
+ return Token.DOC_SEE;
+ }
+
+ if (is_identifier_start_character (c)) {
+ tokens_seen = true;
+ return consume_identifier (c);
}
- error_details = ((char)c).ToString ();
+ if (char.IsWhiteSpace ((char) c))
+ continue;
+
+ Report.Error (1056, Location, "Unexpected character `{0}'", ((char) c).ToString ());
+ }
+
+ if (CompleteOnEOF){
+ if (generated)
+ return Token.COMPLETE_COMPLETION;
- return Token.ERROR;
+ generated = true;
+ return Token.GENERATE_COMPLETION;
}
+
return Token.EOF;
}
+		//
+		// Tokenizes a character literal. Despite its name, this is the
+		// handler xtoken invokes for the opening single quote, which has
+		// already been consumed when this method runs.
+		//
+		// Returns Token.LITERAL with `val' set to a CharLiteral, or
+		// Token.ERROR when the literal contains a newline or the escape
+		// sequence could not be decoded. Errors reported here:
+		//   1011 - empty literal
+		//   1010 - newline inside the literal
+		//   1012 - more than one UTF-16 char before the closing quote; this
+		//          includes an escape which expands to a surrogate pair
+		//
+		int TokenizeBackslash ()
+		{
+#if FULL_AST
+			int read_start = reader.Position;
+#endif
+			Location start_location = Location;
+			int c = get_char ();
+			tokens_seen = true;
+			if (c == '\'') {
+				val = new CharLiteral (context.BuiltinTypes, (char) c, start_location);
+				Report.Error (1011, start_location, "Empty character literal");
+				return Token.LITERAL;
+			}
+
+			if (c == '\n') {
+				Report.Error (1010, start_location, "Newline in constant");
+				return Token.ERROR;
+			}
+
+			int surrogate;
+			c = escape (c, out surrogate);
+			if (c == -1)
+				return Token.ERROR;
+
+			ILiteralConstant res = new CharLiteral (context.BuiltinTypes, (char) c, start_location);
+			val = res;
+			c = get_char ();
+
+			//
+			// A char holds a single UTF-16 code unit, so an escape which
+			// produced a second (surrogate) char is reported like any other
+			// over-long literal instead of aborting the compiler
+			//
+			if (surrogate != 0 || c != '\'') {
+				Report.Error (1012, start_location, "Too many characters in character literal");
+
+				if (c != '\'') {
+					// Try to recover, read until newline or next "'"
+					while ((c = get_char ()) != -1) {
+						if (c == '\n' || c == '\'')
+							break;
+					}
+				}
+			}
+
+#if FULL_AST
+			res.ParsedValue = reader.ReadChars (read_start - 1, reader.Position);
+#endif
+
+			return Token.LITERAL;
+		}
+
+		//
+		// Decides which token a `<' stands for. The opening `<' itself has
+		// been consumed by the caller. Tried in this order:
+		//   - a generic dimension (only while handle_typeof is set)
+		//   - the start of a generic type argument / parameter list
+		//   - the operators <<=, <<, <= and <
+		//
+		int TokenizeLessThan ()
+		{
+			if (handle_typeof) {
+				int dimension;
+				PushPosition ();
+				if (parse_generic_dimension (out dimension)) {
+					val = dimension;
+					DiscardPosition ();
+					return Token.GENERIC_DIMENSION;
+				}
+				PopPosition ();
+			}
+
+			// Look ahead from a saved position; it is restored on every path below
+			PushPosition ();
+			bool is_generic_list = parse_less_than ();
+			if (is_generic_list) {
+				// token () has to run before the position is restored
+				bool is_declaration = parsing_generic_declaration &&
+					(parsing_generic_declaration_doc || token () != Token.DOT);
+				PopPosition ();
+				return is_declaration ? Token.OP_GENERICS_LT_DECL : Token.OP_GENERICS_LT;
+			}
+
+			PopPosition ();
+			parsing_generic_less_than = 0;
+
+			switch (peek_char ()) {
+			case '<':
+				get_char ();
+				if (peek_char () != '=')
+					return Token.OP_SHIFT_LEFT;
+
+				get_char ();
+				return Token.OP_SHIFT_LEFT_ASSIGN;
+
+			case '=':
+				get_char ();
+				return Token.OP_LE;
+
+			default:
+				return Token.OP_LT;
+			}
+		}
+
//
// Handles one line xml comment
//
xml_comment_buffer.Insert (current_comment_start, String.Join (Environment.NewLine, lines));
}
- //
- // Updates current comment location.
- //
- private void update_comment_location ()
- {
- if (current_comment_location.IsNull) {
- // "-2" is for heading "//" or "/*"
- current_comment_location =
- new Location (ref_line, col - 2);
- }
- }
-
//
// Checks if there was incorrect doc comments and raise
// warnings.
public void check_incorrect_doc_comment ()
{
if (xml_comment_buffer.Length > 0)
- warn_incorrect_doc_comment ();
- }
-
- //
- // Raises a warning when tokenizer found incorrect doccomment
- // markup.
- //
- private void warn_incorrect_doc_comment ()
- {
- if (doc_state != XmlCommentState.Error) {
- doc_state = XmlCommentState.Error;
- // in csc, it is 'XML comment is not placed on
- // a valid language element'. But that does not
- // make sense.
- Report.Warning (1587, 2, Location, "XML comment is not placed on a valid language element");
- }
+ WarningMisplacedComment (Location); // buffered doc comment text exists: warn at the current Location
}
//
return null;
}
+ Report Report { // convenience accessor for context.Report
+ get { return context.Report; }
+ }
+
void reset_doc_comment ()
{
xml_comment_buffer.Length = 0;
- current_comment_location = Location.Null;
}
public void cleanup ()
{
if (ifstack != null && ifstack.Count >= 1) {
- current_location = new Location (ref_line, Col);
- int state = (int) ifstack.Pop ();
+ int state = ifstack.Pop ();
if ((state & REGION) != 0)
Report.Error (1038, Location, "#endregion directive expected");
else