projects/ldc: dmd/lexer.c comparison

comparison dmd/lexer.c @ 1614:dbf7b54f542f

Merge DMD r292: bugzilla 3455 Some Unicode characters not allowed in identifiers. --- dmd/lexer.c | 34 ++++++++++++++++++++++------------ 1 files changed, 22 insertions(+), 12 deletions(-)

author	Leandro Lucarella <llucax@gmail.com>
date	Wed, 06 Jan 2010 15:18:21 -0300
parents	eae495e6ae8d
children

comparison

equal deleted inserted replaced

-:8f50a13d09a0
+:dbf7b54f542f
 	    case 'U':  	case 'V':   case 'W':   case 'X':   case 'Y':
 	    case 'Z':
 	    case '_':
 	    case_ident:
 	    {   unsigned char c;
-		StringValue *sv;
-		Identifier *id;
+		while (1)
-		do
 		{
 		    c = *++p;
-		} while (isidchar(c) || (c & 0x80 && isUniAlpha(decodeUTF())));
+		    if (isidchar(c))
-		sv = stringtable.update((char *)t->ptr, p - t->ptr);
+			continue;
-		id = (Identifier *) sv->ptrvalue;
+		    else if (c & 0x80)
+		    {	unsigned char *s = p;
+			unsigned u = decodeUTF();
+			if (isUniAlpha(u))
+			    continue;
+			error("char 0x%04x not allowed in identifier", u);
+			p = s;
+		    }
+		    break;
+		}
+		StringValue *sv = stringtable.update((char *)t->ptr, p - t->ptr);
+		Identifier *id = (Identifier *) sv->ptrvalue;
 		if (!id)
 		{   id = new Identifier(sv->lstring.string,TOKidentifier);
 		    sv->ptrvalue = id;
 		}
 		t->ident = id;
 		p++;
 		pragma();
 		continue;
 	    default:
-	    {	unsigned char c = *p;
+	    {	unsigned c = *p;
 		if (c & 0x80)
-		{   unsigned u = decodeUTF();
+		{   c = decodeUTF();
 		    // Check for start of unicode identifier
-		    if (isUniAlpha(u))
+		    if (isUniAlpha(c))
 			goto case_ident;
-		    if (u == PS || u == LS)
+		    if (c == PS || c == LS)
 		    {
 			loc.linnum++;
 			p++;
 			continue;
 		    }
 		}
-		if (isprint(c))
+		if (c < 0x80 && isprint(c))
 		    error("unsupported char '%c'", c);
 		else
 		    error("unsupported char 0x%02x", c);
 		p++;
 		continue;
 		    unsigned u = decodeUTF();
 		    p++;
 		    if (u == PS || u == LS)
 			loc.linnum++;
 		    else
-			error("non-hex character \\u%x", u);
+			error("non-hex character \\u%04x", u);
 		}
 		else
 		    error("non-hex character '%c'", c);
 		if (n & 1)
 		{   v = (v << 4) | c;

Mercurial > projects > ldc

comparison dmd/lexer.c @ 1614:dbf7b54f542f