2 see copyright notice in squirrel.h
\r
4 #include "sqpcheader.h"
\r
8 #include "sqstring.h"
\r
9 #include "sqcompiler.h"
\r
10 #include "sqlexer.h"
\r
// Helper macros for the SQLexer member functions in this file. They expand in
// place and reference lexer state by unqualified name (_currdata, _prevtoken,
// _curtoken, _currentcolumn, _longstr, _keywords).
// NOTE(review): the statement-like macros are bare { ... } blocks, not
// do { ... } while(0), so a trailing ';' after them inside if/else needs care.
// The character the lexer is currently looking at.
12 #define CUR_CHAR (_currdata)
\r
// Moves _curtoken into _prevtoken, stores t as the current token and returns t
// from the enclosing function. t is expanded twice, so it must have no side effects.
13 #define RETURN_TOKEN(t) { _prevtoken = _curtoken; _curtoken = t; return t;}
\r
// True when the current character is at or below the end-of-buffer marker.
14 #define IS_EOB() (CUR_CHAR <= SQUIRREL_EOB)
\r
// Advances to the next character via Next() and bumps the column counter.
15 #define NEXT() {Next();_currentcolumn++;}
\r
// Empties the scratch buffer used to accumulate the text of the current token.
16 #define INIT_TEMP_STRING() { _longstr.resize(0);}
\r
// Appends one character to the scratch buffer.
17 #define APPEND_CHAR(c) { _longstr.push_back(c);}
\r
// Appends the terminating NUL so the scratch buffer can be used as a C string.
18 #define TERMINATE_BUFFER() {_longstr.push_back(_SC('\0'));}
\r
// Inserts the stringized keyword into _keywords with its token id as the value.
// Requires a variable named `ss` to be in scope at the expansion site.
19 #define ADD_KEYWORD(key,id) _keywords->NewSlot( SQString::Create(ss, _SC(#key)) ,SQInteger(id))
\r
21 SQLexer::SQLexer(){}
\r
24 _keywords->Release();
\r
// Prepares the lexer for a new input stream.
//   ss       - shared state; used below to create the keyword table and its key strings.
//   rg, up   - presumably the reader callback and its user pointer that Next()
//              invokes as _readf(_up) - TODO confirm, not referenced in the lines below.
//   efunc,ed - presumably the error callback and its target that Error() invokes
//              as _errfunc(_errtarget, ...) - TODO confirm, not referenced in the lines below.
27 void SQLexer::Init(SQSharedState *ss, SQLEXREADFUNC rg, SQUserPointer up,CompilerErrorFunc efunc,void *ed)
\r
// Keyword table: maps each reserved word's spelling to its token id.
// NOTE(review): 26 is presumably an initial size hint; 38 keywords are inserted
// below - confirm the table grows as needed.
32 _keywords = SQTable::Create(ss, 26);
\r
33 ADD_KEYWORD(while, TK_WHILE);
\r
34 ADD_KEYWORD(do, TK_DO);
\r
35 ADD_KEYWORD(if, TK_IF);
\r
36 ADD_KEYWORD(else, TK_ELSE);
\r
37 ADD_KEYWORD(break, TK_BREAK);
\r
38 ADD_KEYWORD(continue, TK_CONTINUE);
\r
39 ADD_KEYWORD(return, TK_RETURN);
\r
40 ADD_KEYWORD(null, TK_NULL);
\r
41 ADD_KEYWORD(function, TK_FUNCTION);
\r
42 ADD_KEYWORD(local, TK_LOCAL);
\r
43 ADD_KEYWORD(for, TK_FOR);
\r
44 ADD_KEYWORD(foreach, TK_FOREACH);
\r
45 ADD_KEYWORD(in, TK_IN);
\r
46 ADD_KEYWORD(typeof, TK_TYPEOF);
\r
47 ADD_KEYWORD(delegate, TK_DELEGATE);
\r
48 ADD_KEYWORD(delete, TK_DELETE);
\r
49 ADD_KEYWORD(try, TK_TRY);
\r
50 ADD_KEYWORD(catch, TK_CATCH);
\r
51 ADD_KEYWORD(throw, TK_THROW);
\r
52 ADD_KEYWORD(clone, TK_CLONE);
\r
53 ADD_KEYWORD(yield, TK_YIELD);
\r
54 ADD_KEYWORD(resume, TK_RESUME);
\r
55 ADD_KEYWORD(switch, TK_SWITCH);
\r
56 ADD_KEYWORD(case, TK_CASE);
\r
57 ADD_KEYWORD(default, TK_DEFAULT);
\r
58 ADD_KEYWORD(this, TK_THIS);
\r
59 ADD_KEYWORD(parent,TK_PARENT);
\r
60 ADD_KEYWORD(class,TK_CLASS);
\r
61 ADD_KEYWORD(extends,TK_EXTENDS);
\r
62 ADD_KEYWORD(constructor,TK_CONSTRUCTOR);
\r
63 ADD_KEYWORD(instanceof,TK_INSTANCEOF);
\r
64 ADD_KEYWORD(vargc,TK_VARGC);
\r
65 ADD_KEYWORD(vargv,TK_VARGV);
\r
66 ADD_KEYWORD(true,TK_TRUE);
\r
67 ADD_KEYWORD(false,TK_FALSE);
\r
68 ADD_KEYWORD(static,TK_STATIC);
\r
69 ADD_KEYWORD(enum,TK_ENUM);
\r
70 ADD_KEYWORD(const,TK_CONST);
\r
// Line numbering starts at 1 for both the current line and the last token's line.
74 _lasttokenline = _currentline = 1;
\r
// Reports a lexing error by passing the message, together with the stored
// target pointer, to the error callback.
// NOTE(review): callers below keep executing statements after Error(...) only
// if the callback returns - presumably it does not; confirm.
80 void SQLexer::Error(const SQChar *err)
\r
82 _errfunc(_errtarget,err);
\r
// Fetches the next character from the reader callback into _currdata.
85 void SQLexer::Next()
\r
// Ask the reader for one unit of input.
87 SQInteger t = _readf(_up);
\r
// Values above MAX_CHAR cannot be represented and are rejected.
88 if(t > MAX_CHAR) Error(_SC("Invalid character"));
\r
90 _currdata = (LexChar)t;
\r
// End-of-buffer marker; presumably stored only when the reader signals end of
// input - the controlling condition is not visible here, confirm.
93 _currdata = SQUIRREL_EOB;
\r
// Reverse keyword lookup: walks the keyword table and returns the spelling of
// the keyword whose token id equals tok.
// NOTE(review): the result for a token that is not a keyword is not visible here.
96 const SQChar *SQLexer::Tok2Str(SQInteger tok)
\r
98 SQObjectPtr itr, key, val;
\r
// Next() yields -1 once the table is exhausted; otherwise its result becomes
// the iterator position for the following call.
100 while((nitr = _keywords->Next(false,itr, key, val)) != -1) {
\r
101 itr = (SQInteger)nitr;
\r
102 if(((SQInteger)_integer(val)) == tok)
\r
103 return _stringval(key);
\r
// Consumes the body of a block comment up to and including its terminator.
108 void SQLexer::LexBlockComment()
\r
// A '*' immediately followed by '/' ends the comment.
113 case _SC('*'): { NEXT(); if(CUR_CHAR == _SC('/')) { done = true; NEXT(); }}; continue;
\r
// Newlines inside the comment still advance the line counter.
114 case _SC('\n'): _currentline++; NEXT(); continue;
\r
// Input ended before the terminator was seen.
115 case SQUIRREL_EOB: Error(_SC("missing \"*/\" in comment"));
\r
// Scans and returns the next token. Single-character tokens are returned as
// their own character code; multi-character operators, literals and keywords
// are returned as TK_* ids (via RETURN_TOKEN, which also updates
// _prevtoken/_curtoken).
121 SQInteger SQLexer::Lex()
\r
// Remember the line on which this token starts.
123 _lasttokenline = _currentline;
\r
124 while(CUR_CHAR != SQUIRREL_EOB) {
\r
// Horizontal whitespace and carriage returns are skipped.
126 case _SC('\t'): case _SC('\r'): case _SC(' '): NEXT(); continue;
\r
// A newline is recorded as the current token (presumably in the '\n' case,
// whose label is not visible here).
129 _prevtoken=_curtoken;
\r
130 _curtoken=_SC('\n');
\r
// Skip the remainder of the line (presumably a line comment - confirm).
142 do { NEXT(); } while (CUR_CHAR != _SC('\n') && (!IS_EOB()));
\r
146 RETURN_TOKEN(TK_DIVEQ);
\r
150 RETURN_TOKEN(TK_ATTR_CLOSE);
\r
// '=' alone versus '=='.
157 if (CUR_CHAR != _SC('=')){ RETURN_TOKEN('=') }
\r
158 else { NEXT(); RETURN_TOKEN(TK_EQ); }
\r
// Tokens starting with '<': '<=', '<-', '<<', '</' or plain '<'.
161 if ( CUR_CHAR == _SC('=') ) { NEXT(); RETURN_TOKEN(TK_LE) }
\r
162 else if ( CUR_CHAR == _SC('-') ) { NEXT(); RETURN_TOKEN(TK_NEWSLOT); }
\r
163 else if ( CUR_CHAR == _SC('<') ) { NEXT(); RETURN_TOKEN(TK_SHIFTL); }
\r
164 else if ( CUR_CHAR == _SC('/') ) { NEXT(); RETURN_TOKEN(TK_ATTR_OPEN); }
\r
165 //else if ( CUR_CHAR == _SC('[') ) { NEXT(); ReadMultilineString(); RETURN_TOKEN(TK_STRING_LITERAL); }
\r
166 else { RETURN_TOKEN('<') }
\r
// Tokens starting with '>': '>=', '>>', '>>>' or plain '>'.
169 if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_GE);}
\r
170 else if(CUR_CHAR == _SC('>')){
\r
172 if(CUR_CHAR == _SC('>')){
\r
174 RETURN_TOKEN(TK_USHIFTR);
\r
176 RETURN_TOKEN(TK_SHIFTR);
\r
178 else { RETURN_TOKEN('>') }
\r
// '!' alone versus '!='.
181 if (CUR_CHAR != _SC('=')){ RETURN_TOKEN('!')}
\r
182 else { NEXT(); RETURN_TOKEN(TK_NE); }
\r
// Verbatim string: a '"' must follow, then the literal is read in verbatim mode.
186 if(CUR_CHAR != _SC('"'))
\r
187 Error(_SC("string expected"));
\r
188 if((stype=ReadString('"',true))!=-1) {
\r
189 RETURN_TOKEN(stype);
\r
191 Error(_SC("error parsing the string"));
\r
// Regular literal: the current character is used as the closing delimiter.
196 if((stype=ReadString(CUR_CHAR,false))!=-1){
\r
197 RETURN_TOKEN(stype);
\r
199 Error(_SC("error parsing the string"));
\r
// Punctuation that is always a single-character token.
201 case _SC('{'): case _SC('}'): case _SC('('): case _SC(')'): case _SC('['): case _SC(']'):
\r
202 case _SC(';'): case _SC(','): case _SC('?'): case _SC('^'): case _SC('~'):
\r
203 {SQInteger ret = CUR_CHAR;
\r
204 NEXT(); RETURN_TOKEN(ret); }
\r
// '.' alone, or the variadic-parameters token; two dots only is an error.
207 if (CUR_CHAR != _SC('.')){ RETURN_TOKEN('.') }
\r
209 if (CUR_CHAR != _SC('.')){ Error(_SC("invalid token '..'")); }
\r
211 RETURN_TOKEN(TK_VARPARAMS);
\r
// '&' versus '&&'.
214 if (CUR_CHAR != _SC('&')){ RETURN_TOKEN('&') }
\r
215 else { NEXT(); RETURN_TOKEN(TK_AND); }
\r
// '|' versus '||'.
218 if (CUR_CHAR != _SC('|')){ RETURN_TOKEN('|') }
\r
219 else { NEXT(); RETURN_TOKEN(TK_OR); }
\r
// ':' versus '::'.
222 if (CUR_CHAR != _SC(':')){ RETURN_TOKEN(':') }
\r
223 else { NEXT(); RETURN_TOKEN(TK_DOUBLE_COLON); }
\r
// '*=' versus '*'.
226 if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MULEQ);}
\r
227 else RETURN_TOKEN('*');
\r
// '%=' versus '%'.
230 if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MODEQ);}
\r
231 else RETURN_TOKEN('%');
\r
// '-=', '--' or '-'.
234 if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MINUSEQ);}
\r
235 else if (CUR_CHAR == _SC('-')){ NEXT(); RETURN_TOKEN(TK_MINUSMINUS);}
\r
236 else RETURN_TOKEN('-');
\r
// '+=', '++' or '+'.
239 if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_PLUSEQ);}
\r
240 else if (CUR_CHAR == _SC('+')){ NEXT(); RETURN_TOKEN(TK_PLUSPLUS);}
\r
241 else RETURN_TOKEN('+');
\r
// Anything else: a digit starts a number, a letter or '_' starts an
// identifier/keyword, and control characters are rejected.
245 if (scisdigit(CUR_CHAR)) {
\r
246 SQInteger ret = ReadNumber();
\r
249 else if (scisalpha(CUR_CHAR) || CUR_CHAR == _SC('_')) {
\r
250 SQInteger t = ReadID();
\r
254 SQInteger c = CUR_CHAR;
\r
255 if (sciscntrl((int)c)) Error(_SC("unexpected character(control)"));
\r
// Classifies an identifier: returns the keyword's token id when s is in the
// keyword table, otherwise TK_IDENTIFIER.
266 SQInteger SQLexer::GetIDType(SQChar *s)
\r
// The lookup key is a string object created from s on every call.
269 if(_keywords->Get(SQString::Create(_sharedstate, s), t)) {
\r
270 return SQInteger(_integer(t));
\r
272 return TK_IDENTIFIER;
\r
// Reads a quoted literal into the scratch buffer.
//   ndelim   - the closing delimiter character.
//   verbatim - when true, newlines are allowed inside the literal.
// Returns -1 if the input is already at end-of-buffer, TK_STRING_LITERAL for a
// string; the return value for a single-quoted constant is not visible here.
276 SQInteger SQLexer::ReadString(SQInteger ndelim,bool verbatim)
\r
278 INIT_TEMP_STRING();
\r
280 if(IS_EOB()) return -1;
\r
282 while(CUR_CHAR != ndelim) {
\r
285 Error(_SC("unfinished string"));
\r
// A raw newline is only legal in verbatim mode; it is kept in the literal.
288 if(!verbatim) Error(_SC("newline in a constant"));
\r
289 APPEND_CHAR(CUR_CHAR); NEXT();
\r
// Presumably the verbatim-mode handling of a backslash, kept literally - confirm.
294 APPEND_CHAR('\\'); NEXT();
\r
// \x escape: between one and maxdigits hex digits, converted to one character.
// NOTE(review): plain isxdigit is called on the lexer character here while
// LexHexadecimal uses scisxdigit - confirm this is safe for wide-character input.
299 case _SC('x'): NEXT(); {
\r
300 if(!isxdigit(CUR_CHAR)) Error(_SC("hexadecimal number expected"));
\r
301 const SQInteger maxdigits = 4;
\r
// One extra slot for the terminating NUL.
302 SQChar temp[maxdigits+1];
\r
304 while(isxdigit(CUR_CHAR) && n < maxdigits) {
\r
305 temp[n] = CUR_CHAR;
\r
311 APPEND_CHAR((SQChar)scstrtoul(temp,&sTemp,16));
\r
// Single-character escapes map to the corresponding control character.
314 case _SC('t'): APPEND_CHAR(_SC('\t')); NEXT(); break;
\r
315 case _SC('a'): APPEND_CHAR(_SC('\a')); NEXT(); break;
\r
316 case _SC('b'): APPEND_CHAR(_SC('\b')); NEXT(); break;
\r
317 case _SC('n'): APPEND_CHAR(_SC('\n')); NEXT(); break;
\r
318 case _SC('r'): APPEND_CHAR(_SC('\r')); NEXT(); break;
\r
319 case _SC('v'): APPEND_CHAR(_SC('\v')); NEXT(); break;
\r
320 case _SC('f'): APPEND_CHAR(_SC('\f')); NEXT(); break;
\r
321 case _SC('0'): APPEND_CHAR(_SC('\0')); NEXT(); break;
\r
322 case _SC('\\'): APPEND_CHAR(_SC('\\')); NEXT(); break;
\r
323 case _SC('"'): APPEND_CHAR(_SC('"')); NEXT(); break;
\r
324 case _SC('\''): APPEND_CHAR(_SC('\'')); NEXT(); break;
\r
326 Error(_SC("unrecognised escaper char"));
\r
332 APPEND_CHAR(CUR_CHAR);
\r
337 if(verbatim && CUR_CHAR == '"') { //double quotation
\r
338 APPEND_CHAR(CUR_CHAR);
\r
345 TERMINATE_BUFFER();
\r
// Length of the literal, excluding the terminator just appended.
346 SQInteger len = _longstr.size()-1;
\r
// Single-quoted literal: a character constant that must hold exactly one
// character; its code is stored in _nvalue.
347 if(ndelim == _SC('\'')) {
\r
348 if(len == 0) Error(_SC("empty constant"));
\r
349 if(len > 1) Error(_SC("constant too long"));
\r
350 _nvalue = _longstr[0];
\r
// _svalue points into the scratch buffer, which the other Read* functions
// reset with INIT_TEMP_STRING(), so it is only valid until the next such call.
353 _svalue = &_longstr[0];
\r
354 return TK_STRING_LITERAL;
\r
// Converts a string of hexadecimal digits to an unsigned integer, accumulating
// into *res one digit at a time.
// NOTE(review): no overflow check is visible here; ReadNumber limits the digit
// count with MAX_HEX_DIGITS before calling.
357 void LexHexadecimal(const SQChar *s,SQUnsignedInteger *res)
\r
// Decimal digit: value is the offset from '0'.
362 if(scisdigit(*s)) *res = (*res)*16+((*s++)-'0');
\r
// Letter digit: upper-cased, then the offset from 'A' plus 10.
363 else if(scisxdigit(*s)) *res = (*res)*16+(toupper(*s++)-'A'+10);
\r
// Any other character is a caller error.
364 else { assert(0); }
\r
// Converts a string of decimal digits to an unsigned integer, accumulating
// into *res.
// NOTE(review): no digit validation or overflow check is visible in this listing.
368 void LexInteger(const SQChar *s,SQUnsignedInteger *res)
\r
373 *res = (*res)*10+((*s++)-'0');
\r
377 SQInteger scisodigit(SQInteger c) { return c >= _SC('0') && c <= _SC('7'); }
\r
// Converts a string of octal digits to an unsigned integer, accumulating into *res.
379 void LexOctal(const SQChar *s,SQUnsignedInteger *res)
\r
384 if(scisodigit(*s)) *res = (*res)*8+((*s++)-'0');
\r
// A non-octal character is a caller error.
385 else { assert(0); }
\r
389 SQInteger isexponent(SQInteger c) { return c == 'e' || c=='E'; }
\r
// Two hex digits per byte of SQInteger: the longest hex literal that fits.
392 #define MAX_HEX_DIGITS (sizeof(SQInteger)*2)
\r
// Reads a numeric literal (decimal, octal, hexadecimal, float or scientific)
// into the scratch buffer and converts it into _nvalue or _fvalue.
393 SQInteger SQLexer::ReadNumber()
\r
398 #define TSCIENTIFIC 4
\r
400 SQInteger type = TINT, firstchar = CUR_CHAR;
\r
402 INIT_TEMP_STRING();
\r
// A leading '0' followed by 'x'/'X' or an octal digit selects hex or octal.
404 if(firstchar == _SC('0') && (toupper(CUR_CHAR) == _SC('X') || scisodigit(CUR_CHAR)) ) {
\r
405 if(scisodigit(CUR_CHAR)) {
\r
407 while(scisodigit(CUR_CHAR)) {
\r
408 APPEND_CHAR(CUR_CHAR);
\r
// A decimal digit left over after the octal digits can only be 8 or 9.
411 if(scisdigit(CUR_CHAR)) Error(_SC("invalid octal number"));
\r
// NOTE(review): plain isxdigit on the lexer character - see LexHexadecimal,
// which uses scisxdigit; confirm for wide-character input.
416 while(isxdigit(CUR_CHAR)) {
\r
417 APPEND_CHAR(CUR_CHAR);
\r
// Reject literals with more digits than an SQInteger can hold.
420 if(_longstr.size() > MAX_HEX_DIGITS) Error(_SC("too many digits for an Hex number"));
\r
// Decimal / floating-point path: the first digit was consumed above.
424 APPEND_CHAR((int)firstchar);
\r
425 while (CUR_CHAR == _SC('.') || scisdigit(CUR_CHAR) || isexponent(CUR_CHAR)) {
\r
426 if(CUR_CHAR == _SC('.') || isexponent(CUR_CHAR)) type = TFLOAT;
\r
427 if(isexponent(CUR_CHAR)) {
\r
// NOTE(review): the line above has just set type to TFLOAT whenever the
// current character is an exponent marker, so this check looks unreachable
// (e.g. a second exponent would not be rejected here) - confirm.
428 if(type != TFLOAT) Error(_SC("invalid numeric format"));
\r
429 type = TSCIENTIFIC;
\r
430 APPEND_CHAR(CUR_CHAR);
\r
// Optional sign after the exponent marker, then at least one digit.
432 if(CUR_CHAR == '+' || CUR_CHAR == '-'){
\r
433 APPEND_CHAR(CUR_CHAR);
\r
436 if(!scisdigit(CUR_CHAR)) Error(_SC("exponent expected"));
\r
439 APPEND_CHAR(CUR_CHAR);
\r
443 TERMINATE_BUFFER();
\r
// Floating-point text is converted with scstrtod into _fvalue.
447 _fvalue = (SQFloat)scstrtod(&_longstr[0],&sTemp);
\r
// Integer forms are converted by the helpers above, which write into _nvalue
// through an unsigned pointer.
450 LexInteger(&_longstr[0],(SQUnsignedInteger *)&_nvalue);
\r
453 LexHexadecimal(&_longstr[0],(SQUnsignedInteger *)&_nvalue);
\r
456 LexOctal(&_longstr[0],(SQUnsignedInteger *)&_nvalue);
\r
462 SQInteger SQLexer::ReadID()
\r
465 INIT_TEMP_STRING();
\r
467 APPEND_CHAR(CUR_CHAR);
\r
469 } while(scisalnum(CUR_CHAR) || CUR_CHAR == _SC('_'));
\r
470 TERMINATE_BUFFER();
\r
471 res = GetIDType(&_longstr[0]);
\r
472 if(res == TK_IDENTIFIER || res == TK_CONSTRUCTOR) {
\r
473 _svalue = &_longstr[0];
\r