projects/dil: trunk/src/dil/Lexer.d comparison

comparison trunk/src/dil/Lexer.d @ 499:52447db67938

Implemented global table of identifiers.

author	Aziz Köksal <aziz.koeksal@gmail.com>
date	Sun, 09 Dec 2007 22:37:47 +0100
parents	49c201b5c465
children	4e14cd1b24da

comparison

equal deleted inserted replaced

-:49c201b5c465
+:52447db67938
 public import dil.LexerFuncs;
 /// U+FFFD = �. Used to replace invalid Unicode characters.
 const dchar REPLACEMENT_CHAR = '\uFFFD';
+/// Global table of identifiers. Access must be synchronized.
+private Identifier*[string] idTable; // Associative array: identifier string -> pointer to its Identifier.
+static this() // Module constructor: fills idTable from `keywords` (declared elsewhere).
+{
+foreach(ref k; keywords) // Iterate by reference so that &k is the address of the element itself, not of a loop-local copy.
+idTable[k.str] = &k; // Key each entry by its string.
+}
+Identifier* idTableLookup(string idString) // Returns the idTable entry for idString, adding a new entry when none exists yet.
+out(id)
+{ assert(id !is null); } // Postcondition: the returned pointer is never null.
+body
+{
+synchronized // Every read and write of idTable in this function happens inside this block.
+{
+Identifier** id = idString in idTable; // `in` yields a pointer to the stored value, or null when the key is absent.
+if (id)
+return *id; // Key already present: hand back the stored pointer.
+auto newID = Identifier(TOK.Identifier, idString); // NOTE(review): this must yield an Identifier* for the next two lines to type-check — confirm against Identifier's opCall.
+idTable[idString] = newID; // Register the new entry so later lookups of the same string return it.
+return newID;
+}
+}
+/++
+The Lexer analyzes the characters of a source text and
+produces a doubly-linked list of tokens.
++/
 class Lexer
 {
 Token* head;      /// The head of the doubly linked token list.
 Token* tail;      /// The tail of the linked list. Set in scan().
 Token* token;     /// Points to the current token in the token list.
 uint lineNum = 1;   /// Current, actual source text line number.
 uint lineNum_hline; /// Line number set by #line.
 uint inTokenString; /// > 0 if inside q{ }
 char[] errorPath;   /// The path displayed in error messages.
-Identifier[string] idtable;
 /++
 Construct a Lexer object.
 Params:
 text     = the UTF-8 source code.
 filePath = the path to the source code; used for error messages.
 }
 this.p = this.text.ptr;
 this.end = this.p + this.text.length;
 this.lineBegin = this.p;
-loadKeywords(this.idtable);
 this.head = new Token;
 this.head.type = TOK.HEAD;
 this.head.start = this.head.end = this.p;
 this.token = this.head;
 { c = *++p; }
 while (isident(c) || !isascii(c) && isUniAlpha(decodeUTF8()))
 t.end = p;
-string str = t.srcText;
+auto id = idTableLookup(t.srcText);
-Identifier* id = str in idtable;
-if (!id)
-{
-idtable[str] = Identifier(TOK.Identifier, str);
-id = str in idtable;
-}
-assert(id);
 t.type = id.type;
 if (t.type == TOK.Identifier || t.isKeyword)
 return;
 else if (t.isSpecialToken)
 finalizeSpecialToken(t);
 else if (t.type == TOK.EOF)
 { c = *++p; }
 while (isident(c) || !isascii(c) && isUniAlpha(decodeUTF8()))
 t.end = p;
-string str = t.srcText;
+auto id = idTableLookup(t.srcText);
-Identifier* id = str in idtable;
-if (!id)
-{
-idtable[str] = Identifier(TOK.Identifier, str);
-id = str in idtable;
-}
-assert(id);
 t.type = id.type;
 if (t.type == TOK.Identifier || t.isKeyword)
 return;
 else if (t.isSpecialToken)
 finalizeSpecialToken(t);
 else if (t.type == TOK.EOF)
 if (ident.length == 0)
 return false;
 static Identifier[string] reserved_ids_table;
 if (reserved_ids_table is null)
-loadKeywords(reserved_ids_table);
+Lexer.loadKeywords(reserved_ids_table);
 size_t idx = 1; // Index to the 2nd character in ident.
 dchar isFirstCharUniAlpha()
 {
 idx = 0;

Mercurial > projects > dil

comparison trunk/src/dil/Lexer.d @ 499:52447db67938