sqlexer.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647
  1. /*
  2. see copyright notice in squirrel.h
  3. */
  4. #include "sqpcheader.h"
  5. #include <ctype.h>
  6. #include <stdlib.h>
  7. #include <limits.h>
  8. #include "sqtable.h"
  9. #include "sqstring.h"
  10. #include "sqcompiler.h"
  11. #include "sqlexer.h"
  12. #define CUR_CHAR (_currdata)
  13. #define RETURN_TOKEN(t) { _prevtoken = _curtoken; _curtoken = t; return t;}
  14. #define IS_EOB() (CUR_CHAR <= SQUIRREL_EOB)
  15. #define NEXT() {Next();_currentcolumn++;}
  16. #define INIT_TEMP_STRING() { _longstr.resize(0);}
  17. #define APPEND_CHAR(c) { _longstr.push_back(c);}
  18. #define TERMINATE_BUFFER() {_longstr.push_back(_SC('\0'));}
  19. #define ADD_KEYWORD(key,id) tbl->NewSlot( SQString::Create(_sharedstate, _SC(#key)) ,SQInteger(id))
  20. SQLexer::SQLexer(){_keywords=0;}
  21. SQLexer::~SQLexer()
  22. {
  23. _keywords->Release();
  24. }
  25. void SQLexer::Init(SQSharedState *ss, SQLEXREADFUNC rg, SQUserPointer up,CompilerErrorFunc efunc,void *ed)
  26. {
  27. _errfunc = efunc;
  28. _errtarget = ed;
  29. _sharedstate = ss;
  30. if(_keywords) _keywords->Release();
  31. _keywords = GetKeywords();
  32. _readf = rg;
  33. _up = up;
  34. _lasttokenline = _currentline = 1;
  35. _currentcolumn = 0;
  36. _prevtoken = -1;
  37. _reached_eof = SQFalse;
  38. Next();
  39. }
  40. SQTable * SQLexer::GetKeywords()
  41. {
  42. SQTable *tbl = SQTable::Create(_sharedstate, (TK_LAST_ENUM_TOKEN - TK_FIRST_ENUM_TOKEN - 1) /*26*/);
  43. ADD_KEYWORD(while, TK_WHILE);
  44. ADD_KEYWORD(do, TK_DO);
  45. ADD_KEYWORD(if, TK_IF);
  46. ADD_KEYWORD(else, TK_ELSE);
  47. ADD_KEYWORD(break, TK_BREAK);
  48. ADD_KEYWORD(continue, TK_CONTINUE);
  49. ADD_KEYWORD(return, TK_RETURN);
  50. ADD_KEYWORD(null, TK_NULL);
  51. ADD_KEYWORD(NULL, TK_NULL);
  52. ADD_KEYWORD(function, TK_FUNCTION);
  53. ADD_KEYWORD(local, TK_LOCAL);
  54. ADD_KEYWORD(var, TK_LOCAL);
  55. ADD_KEYWORD(auto, TK_LOCAL);
  56. ADD_KEYWORD(let, TK_LOCAL);
  57. ADD_KEYWORD(char_t, TK_LOCAL_CHAR_T);
  58. ADD_KEYWORD(wchar_t, TK_LOCAL_WCHAR_T);
  59. ADD_KEYWORD(bool_t, TK_LOCAL_BOOL_T);
  60. ADD_KEYWORD(table_t, TK_LOCAL_TABLE_T);
  61. ADD_KEYWORD(array_t, TK_LOCAL_ARRAY_T);
  62. ADD_KEYWORD(int8_t, TK_LOCAL_INT8_T);
  63. ADD_KEYWORD(int16_t, TK_LOCAL_INT16_T);
  64. ADD_KEYWORD(int32_t, TK_LOCAL_INT32_T);
  65. ADD_KEYWORD(int64_t, TK_LOCAL_INT64_T);
  66. ADD_KEYWORD(int_t, TK_LOCAL_INT_T);
  67. ADD_KEYWORD(uint8_t, TK_LOCAL_UINT8_T);
  68. ADD_KEYWORD(uint16_t, TK_LOCAL_UINT16_T);
  69. ADD_KEYWORD(uint32_t, TK_LOCAL_UINT32_T);
  70. ADD_KEYWORD(uint64_t, TK_LOCAL_UINT64_T);
  71. ADD_KEYWORD(uint_t, TK_LOCAL_UINT_T);
  72. ADD_KEYWORD(float_t, TK_LOCAL_FLOAT_T);
  73. ADD_KEYWORD(double_t, TK_LOCAL_DOUBLE_T);
  74. ADD_KEYWORD(long_double_t, TK_LOCAL_LONG_DOUBLE_T);
  75. ADD_KEYWORD(for, TK_FOR);
  76. ADD_KEYWORD(foreach, TK_FOREACH);
  77. ADD_KEYWORD(in, TK_IN);
  78. ADD_KEYWORD(typeof, TK_TYPEOF);
  79. ADD_KEYWORD(base, TK_BASE);
  80. ADD_KEYWORD(delete, TK_DELETE);
  81. ADD_KEYWORD(try, TK_TRY);
  82. ADD_KEYWORD(catch, TK_CATCH);
  83. ADD_KEYWORD(throw, TK_THROW);
  84. ADD_KEYWORD(clone, TK_CLONE);
  85. ADD_KEYWORD(yield, TK_YIELD);
  86. ADD_KEYWORD(resume, TK_RESUME);
  87. ADD_KEYWORD(switch, TK_SWITCH);
  88. ADD_KEYWORD(case, TK_CASE);
  89. ADD_KEYWORD(default, TK_DEFAULT);
  90. ADD_KEYWORD(this, TK_THIS);
  91. ADD_KEYWORD(class,TK_CLASS);
  92. ADD_KEYWORD(extends,TK_EXTENDS);
  93. ADD_KEYWORD(constructor,TK_CONSTRUCTOR);
  94. ADD_KEYWORD(destructor,TK_DESTRUCTOR);
  95. ADD_KEYWORD(instanceof,TK_INSTANCEOF);
  96. ADD_KEYWORD(true,TK_TRUE);
  97. ADD_KEYWORD(false,TK_FALSE);
  98. ADD_KEYWORD(static,TK_STATIC);
  99. ADD_KEYWORD(enum,TK_ENUM);
  100. ADD_KEYWORD(const,TK_CONST);
  101. ADD_KEYWORD(__LINE__,TK___LINE__);
  102. ADD_KEYWORD(__FUNCTION__,TK___FUNCTION__);
  103. ADD_KEYWORD(__FILE__,TK___FILE__);
  104. ADD_KEYWORD(private,TK_PRIVATE);
  105. ADD_KEYWORD(public,TK_PUBLIC);
  106. ADD_KEYWORD(new,TK_IGNORE);
  107. return tbl;
  108. }
  109. void SQLexer::Error(const SQChar *fmt, ...)
  110. {
  111. static SQChar temp[256];
  112. va_list vl;
  113. va_start(vl, fmt);
  114. scvsprintf(temp, fmt, vl);
  115. va_end(vl);
  116. _errfunc(_errtarget,temp);
  117. }
  118. void SQLexer::Next()
  119. {
  120. SQInteger t = _readf(_up);
  121. if(t > MAX_CHAR) Error(_SC("Invalid character"));
  122. if(t != 0) {
  123. _currdata = (LexChar)t;
  124. return;
  125. }
  126. _currdata = SQUIRREL_EOB;
  127. _reached_eof = SQTrue;
  128. }
  129. const SQChar *SQLexer::Tok2Str(SQInteger tok)
  130. {
  131. SQObjectPtr itr, key, val;
  132. SQInteger nitr;
  133. while((nitr = _keywords->Next(false,itr, key, val)) != -1) {
  134. itr = (SQInteger)nitr;
  135. if(((SQInteger)_integer(val)) == tok)
  136. return _stringval(key);
  137. }
  138. return NULL;
  139. }
  140. void SQLexer::LexBlockComment()
  141. {
  142. /*
  143. if(CUR_CHAR == _SC('*'))
  144. {
  145. NEXT();
  146. if(CUR_CHAR != _SC('*')){ //document comment
  147. printf("Doument comment found at line %d\n", _currentline);
  148. }
  149. }
  150. */
  151. bool done = false;
  152. while(!done) {
  153. switch(CUR_CHAR) {
  154. case _SC('*'): { NEXT(); if(CUR_CHAR == _SC('/')) { done = true; NEXT(); }}; continue;
  155. case _SC('\n'): _currentline++; NEXT(); continue;
  156. case SQUIRREL_EOB: Error(_SC("missing \"*/\" in comment"));
  157. default: NEXT();
  158. }
  159. }
  160. }
  161. void SQLexer::LexLineComment()
  162. {
  163. do { NEXT(); } while (CUR_CHAR != _SC('\n') && (!IS_EOB()));
  164. }
  165. SQInteger SQLexer::Lex()
  166. {
  167. _lasttokenline = _currentline;
  168. while(CUR_CHAR != SQUIRREL_EOB) {
  169. switch(CUR_CHAR){
  170. case _SC('\t'): case _SC('\r'): case _SC(' '): NEXT(); continue;
  171. case _SC('\n'):
  172. _currentline++;
  173. _prevtoken=_curtoken;
  174. _curtoken=_SC('\n');
  175. NEXT();
  176. _currentcolumn=1;
  177. continue;
  178. case _SC('#'): LexLineComment(); continue;
  179. case _SC('/'):
  180. NEXT();
  181. switch(CUR_CHAR){
  182. case _SC('*'):
  183. NEXT();
  184. LexBlockComment();
  185. continue;
  186. case _SC('/'):
  187. LexLineComment();
  188. continue;
  189. case _SC('='):
  190. NEXT();
  191. RETURN_TOKEN(TK_DIVEQ);
  192. continue;
  193. case _SC('>'):
  194. NEXT();
  195. RETURN_TOKEN(TK_ATTR_CLOSE);
  196. continue;
  197. default:
  198. RETURN_TOKEN('/');
  199. }
  200. case _SC('='):
  201. NEXT();
  202. if (CUR_CHAR != _SC('=')){ RETURN_TOKEN('=') }
  203. else {
  204. NEXT();
  205. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_EQ_IDENTITY) }
  206. else { RETURN_TOKEN(TK_EQ); }
  207. }
  208. case _SC('<'):
  209. NEXT();
  210. switch(CUR_CHAR) {
  211. case _SC('='):
  212. NEXT();
  213. if(CUR_CHAR == _SC('>')) {
  214. NEXT();
  215. RETURN_TOKEN(TK_3WAYSCMP);
  216. }
  217. RETURN_TOKEN(TK_LE)
  218. break;
  219. case _SC('-'): NEXT(); RETURN_TOKEN(TK_NEWSLOT); break;
  220. case _SC('<'): NEXT(); RETURN_TOKEN(TK_SHIFTL); break;
  221. case _SC('/'): NEXT(); RETURN_TOKEN(TK_ATTR_OPEN); break;
  222. }
  223. RETURN_TOKEN('<');
  224. case _SC('>'):
  225. NEXT();
  226. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_GE);}
  227. else if(CUR_CHAR == _SC('>')){
  228. NEXT();
  229. if(CUR_CHAR == _SC('>')){
  230. NEXT();
  231. RETURN_TOKEN(TK_USHIFTR);
  232. }
  233. RETURN_TOKEN(TK_SHIFTR);
  234. }
  235. else { RETURN_TOKEN('>') }
  236. case _SC('!'):
  237. NEXT();
  238. if (CUR_CHAR != _SC('=')){ RETURN_TOKEN('!')}
  239. else {
  240. NEXT();
  241. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_NE_IDENTITY)}
  242. else { RETURN_TOKEN(TK_NE); }
  243. }
  244. case _SC('@'): {
  245. SQInteger stype;
  246. NEXT();
  247. if(CUR_CHAR != _SC('"')) {
  248. RETURN_TOKEN('@');
  249. }
  250. if((stype=ReadString('"',true))!=-1) {
  251. RETURN_TOKEN(stype);
  252. }
  253. Error(_SC("error parsing the string"));
  254. }
  255. case _SC('"'):
  256. case _SC('\''): {
  257. SQInteger stype;
  258. if((stype=ReadString(CUR_CHAR,false))!=-1){
  259. RETURN_TOKEN(stype);
  260. }
  261. Error(_SC("error parsing the string"));
  262. }
  263. case _SC('{'): case _SC('}'): case _SC('('): case _SC(')'): case _SC('['): case _SC(']'):
  264. case _SC(';'): case _SC(','): case _SC('?'): case _SC('~'):
  265. {
  266. SQInteger ret = CUR_CHAR;
  267. NEXT();
  268. if((ret == _SC('[') || ret == _SC('{') || ret == _SC('(')) && CUR_CHAR == _SC('=')){
  269. //lets try lua literal delimiters
  270. SQInteger stype;
  271. if((stype=ReadString(ret,true))!=-1){
  272. RETURN_TOKEN(stype);
  273. }
  274. Error(_SC("error parsing the string"));
  275. }
  276. else RETURN_TOKEN(ret);
  277. }
  278. case _SC('.'):
  279. NEXT();
  280. if (CUR_CHAR != _SC('.')){ RETURN_TOKEN('.') }
  281. NEXT();
  282. if (CUR_CHAR != _SC('.')){ Error(_SC("invalid token '..'")); }
  283. NEXT();
  284. RETURN_TOKEN(TK_VARPARAMS);
  285. case _SC('^'):
  286. NEXT();
  287. //if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_BIT_XOR_EQ);}
  288. RETURN_TOKEN('^');
  289. case _SC('&'):
  290. NEXT();
  291. //if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_BIT_AND_EQ);}
  292. if (CUR_CHAR != _SC('&')){ RETURN_TOKEN('&') }
  293. else { NEXT(); RETURN_TOKEN(TK_AND); }
  294. case _SC('|'):
  295. NEXT();
  296. //if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_BIT_OR_EQ);}
  297. if (CUR_CHAR != _SC('|')){ RETURN_TOKEN('|') }
  298. else { NEXT(); RETURN_TOKEN(TK_OR); }
  299. case _SC(':'):
  300. NEXT();
  301. if (CUR_CHAR != _SC(':')){ RETURN_TOKEN(':') }
  302. else { NEXT(); RETURN_TOKEN(TK_DOUBLE_COLON); }
  303. case _SC('*'):
  304. NEXT();
  305. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MULEQ);}
  306. else RETURN_TOKEN('*');
  307. case _SC('%'):
  308. NEXT();
  309. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MODEQ);}
  310. else RETURN_TOKEN('%');
  311. case _SC('-'):
  312. NEXT();
  313. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_MINUSEQ);}
  314. else if (CUR_CHAR == _SC('-')){ NEXT(); RETURN_TOKEN(TK_MINUSMINUS);}
  315. else if (CUR_CHAR == _SC('>')){ NEXT(); RETURN_TOKEN('.');} //accept C/C++ like pointers
  316. else RETURN_TOKEN('-');
  317. case _SC('+'):
  318. NEXT();
  319. if (CUR_CHAR == _SC('=')){ NEXT(); RETURN_TOKEN(TK_PLUSEQ);}
  320. else if (CUR_CHAR == _SC('+')){ NEXT(); RETURN_TOKEN(TK_PLUSPLUS);}
  321. else RETURN_TOKEN('+');
  322. case SQUIRREL_EOB:
  323. return 0;
  324. default:{
  325. if (scisdigit(CUR_CHAR)) {
  326. SQInteger ret = ReadNumber();
  327. RETURN_TOKEN(ret);
  328. }
  329. else if (scisalpha(CUR_CHAR) || CUR_CHAR == _SC('_')) {
  330. SQInteger t = ReadID();
  331. RETURN_TOKEN(t);
  332. }
  333. else {
  334. SQInteger c = CUR_CHAR;
  335. if (sciscntrl((int)c)) Error(_SC("unexpected character(control)"));
  336. NEXT();
  337. RETURN_TOKEN(c);
  338. }
  339. RETURN_TOKEN(0);
  340. }
  341. }
  342. }
  343. return 0;
  344. }
  345. SQInteger SQLexer::GetIDType(const SQChar *s,SQInteger len)
  346. {
  347. SQObjectPtr t;
  348. if(_keywords->GetStr(s,len, t)) {
  349. return SQInteger(_integer(t));
  350. }
  351. return TK_IDENTIFIER;
  352. }
  353. SQInteger SQLexer::ReadString(SQInteger ndelim,bool verbatim)
  354. {
  355. INIT_TEMP_STRING();
  356. SQInteger start_equals = 0;
  357. SQChar cdelim1, cdelim2;
  358. if(ndelim == _SC('{')){
  359. cdelim1 = _SC('{');
  360. cdelim2 = _SC('}');
  361. }
  362. else if(ndelim == _SC('(')){
  363. cdelim1 = _SC('(');
  364. cdelim2 = _SC(')');
  365. }
  366. else {
  367. cdelim1 = _SC('[');
  368. cdelim2 = _SC(']');
  369. }
  370. if(CUR_CHAR == _SC('=')){
  371. //lua like literal
  372. while(!IS_EOB() && CUR_CHAR == _SC('=')) {
  373. ++start_equals;
  374. NEXT();
  375. }
  376. if(CUR_CHAR != cdelim1){
  377. //it's not a lua literal delimiter
  378. Error(_SC("expect '%c' on literal delimiter"), cdelim1);
  379. return -1;
  380. }
  381. ndelim = cdelim2;
  382. }
  383. NEXT();
  384. if(IS_EOB()) return -1;
  385. if(start_equals) {
  386. int cr_nl = CUR_CHAR == _SC('\r');
  387. if(cr_nl) NEXT();
  388. cr_nl = CUR_CHAR == _SC('\n');
  389. if(cr_nl) NEXT();
  390. if(cr_nl) {//if a new line follows the start of delimiter drop it
  391. ++_currentline;
  392. if(IS_EOB())
  393. {
  394. Error(_SC("unfinished string"));
  395. return -1;
  396. }
  397. }
  398. }
  399. for(;;) {
  400. while(CUR_CHAR != ndelim) {
  401. switch(CUR_CHAR) {
  402. case SQUIRREL_EOB:
  403. Error(_SC("unfinished string"));
  404. return -1;
  405. case _SC('\n'):
  406. if(!verbatim) Error(_SC("newline in a constant"));
  407. APPEND_CHAR(CUR_CHAR); NEXT();
  408. _currentline++;
  409. break;
  410. case _SC('\\'):
  411. if(verbatim) {
  412. APPEND_CHAR('\\'); NEXT();
  413. }
  414. else {
  415. NEXT();
  416. switch(CUR_CHAR) {
  417. case _SC('x'): NEXT(); {
  418. if(!isxdigit(CUR_CHAR)) Error(_SC("hexadecimal number expected"));
  419. const SQInteger maxdigits = 4;
  420. SQChar temp[maxdigits+1];
  421. SQInteger n = 0;
  422. while(isxdigit(CUR_CHAR) && n < maxdigits) {
  423. temp[n] = CUR_CHAR;
  424. n++;
  425. NEXT();
  426. }
  427. temp[n] = 0;
  428. SQChar *sTemp;
  429. APPEND_CHAR((SQChar)scstrtoul(temp,&sTemp,16));
  430. }
  431. break;
  432. case _SC('t'): APPEND_CHAR(_SC('\t')); NEXT(); break;
  433. case _SC('a'): APPEND_CHAR(_SC('\a')); NEXT(); break;
  434. case _SC('b'): APPEND_CHAR(_SC('\b')); NEXT(); break;
  435. case _SC('n'): APPEND_CHAR(_SC('\n')); NEXT(); break;
  436. case _SC('r'): APPEND_CHAR(_SC('\r')); NEXT(); break;
  437. case _SC('v'): APPEND_CHAR(_SC('\v')); NEXT(); break;
  438. case _SC('f'): APPEND_CHAR(_SC('\f')); NEXT(); break;
  439. case _SC('0'): APPEND_CHAR(_SC('\0')); NEXT(); break;
  440. case _SC('\\'): APPEND_CHAR(_SC('\\')); NEXT(); break;
  441. case _SC('"'): APPEND_CHAR(_SC('"')); NEXT(); break;
  442. case _SC('\''): APPEND_CHAR(_SC('\'')); NEXT(); break;
  443. case _SC('u'): NEXT(); break; //unicode escape leave as is
  444. default:
  445. Error(_SC("unrecognised escaper char"));
  446. break;
  447. }
  448. }
  449. break;
  450. default:
  451. APPEND_CHAR(CUR_CHAR);
  452. NEXT();
  453. }
  454. }
  455. NEXT();
  456. if(start_equals){
  457. bool lastBraceAdded = false;
  458. if(CUR_CHAR == _SC('=')){
  459. SQInteger end_equals = start_equals;
  460. NEXT();
  461. if(CUR_CHAR == _SC('=') || CUR_CHAR == cdelim2){
  462. --end_equals;
  463. while(!IS_EOB() && CUR_CHAR == _SC('=')) {
  464. --end_equals;
  465. NEXT();
  466. }
  467. if(end_equals) Error(_SC("expect same number of '=' on literal delimiter"));
  468. if(CUR_CHAR != cdelim2) Error(_SC("expect '%c' to close literal delimiter"), cdelim2);
  469. NEXT();
  470. break;
  471. }
  472. APPEND_CHAR(cdelim2); //the first NEXT() after break the while loop
  473. APPEND_CHAR(_SC('='));
  474. lastBraceAdded = true;
  475. }
  476. if(!lastBraceAdded) APPEND_CHAR(cdelim2); //the first NEXT() after break the while loop
  477. APPEND_CHAR(CUR_CHAR);
  478. NEXT();
  479. }
  480. else if(verbatim && CUR_CHAR == '"') { //double quotation
  481. APPEND_CHAR(CUR_CHAR);
  482. NEXT();
  483. }
  484. else {
  485. break;
  486. }
  487. }
  488. TERMINATE_BUFFER();
  489. SQInteger len = _longstr.size()-1;
  490. if(ndelim == _SC('\'')) {
  491. if(len == 0) Error(_SC("empty constant"));
  492. if(len > 1) Error(_SC("constant too long"));
  493. _nvalue = _longstr[0];
  494. return TK_INTEGER;
  495. }
  496. _svalue = &_longstr[0];
  497. return TK_STRING_LITERAL;
  498. }
  499. void LexHexadecimal(const SQChar *s,SQUnsignedInteger *res)
  500. {
  501. *res = 0;
  502. while(*s != 0)
  503. {
  504. if(scisdigit(*s)) *res = (*res)*16+((*s++)-'0');
  505. else if(scisxdigit(*s)) *res = (*res)*16+(toupper(*s++)-'A'+10);
  506. else { assert(0); }
  507. }
  508. }
  509. void LexInteger(const SQChar *s,SQUnsignedInteger *res)
  510. {
  511. *res = 0;
  512. while(*s != 0)
  513. {
  514. *res = (*res)*10+((*s++)-'0');
  515. }
  516. }
  517. SQInteger scisodigit(SQInteger c) { return c >= _SC('0') && c <= _SC('7'); }
  518. void LexOctal(const SQChar *s,SQUnsignedInteger *res)
  519. {
  520. *res = 0;
  521. while(*s != 0)
  522. {
  523. if(scisodigit(*s)) *res = (*res)*8+((*s++)-'0');
  524. else { assert(0); }
  525. }
  526. }
  527. SQInteger isexponent(SQInteger c) { return c == 'e' || c=='E'; }
  528. #define MAX_HEX_DIGITS (sizeof(SQInteger)*2)
  529. SQInteger SQLexer::ReadNumber()
  530. {
  531. #define TINT 1
  532. #define TFLOAT 2
  533. #define THEX 3
  534. #define TSCIENTIFIC 4
  535. #define TOCTAL 5
  536. SQInteger type = TINT, firstchar = CUR_CHAR;
  537. SQUnsignedInteger itmp;
  538. SQChar *sTemp;
  539. INIT_TEMP_STRING();
  540. NEXT();
  541. if(firstchar == _SC('0') && (toupper(CUR_CHAR) == _SC('X') || scisodigit(CUR_CHAR)) ) {
  542. if(scisodigit(CUR_CHAR)) {
  543. type = TOCTAL;
  544. while(scisodigit(CUR_CHAR)) {
  545. APPEND_CHAR(CUR_CHAR);
  546. NEXT();
  547. }
  548. if(scisdigit(CUR_CHAR)) Error(_SC("invalid octal number"));
  549. }
  550. else {
  551. NEXT();
  552. type = THEX;
  553. while(isxdigit(CUR_CHAR)) {
  554. APPEND_CHAR(CUR_CHAR);
  555. NEXT();
  556. }
  557. if(_longstr.size() > MAX_HEX_DIGITS) Error(_SC("too many digits for an Hex number"));
  558. }
  559. }
  560. else {
  561. APPEND_CHAR((int)firstchar);
  562. while (CUR_CHAR == _SC('.') || scisdigit(CUR_CHAR) || isexponent(CUR_CHAR)) {
  563. if(CUR_CHAR == _SC('.') || isexponent(CUR_CHAR)) type = TFLOAT;
  564. if(isexponent(CUR_CHAR)) {
  565. if(type != TFLOAT) Error(_SC("invalid numeric format"));
  566. type = TSCIENTIFIC;
  567. APPEND_CHAR(CUR_CHAR);
  568. NEXT();
  569. if(CUR_CHAR == '+' || CUR_CHAR == '-'){
  570. APPEND_CHAR(CUR_CHAR);
  571. NEXT();
  572. }
  573. if(!scisdigit(CUR_CHAR)) Error(_SC("exponent expected"));
  574. }
  575. APPEND_CHAR(CUR_CHAR);
  576. NEXT();
  577. }
  578. }
  579. TERMINATE_BUFFER();
  580. switch(type) {
  581. case TSCIENTIFIC:
  582. case TFLOAT:
  583. _fvalue = (SQFloat)scstrtod(&_longstr[0],&sTemp);
  584. return TK_FLOAT;
  585. case TINT:
  586. LexInteger(&_longstr[0],&itmp);
  587. break;
  588. case THEX:
  589. LexHexadecimal(&_longstr[0],&itmp);
  590. break;
  591. case TOCTAL:
  592. LexOctal(&_longstr[0],&itmp);
  593. break;
  594. }
  595. switch(type) {
  596. case TINT:
  597. case THEX:
  598. case TOCTAL:
  599. //to allow 64 bits integers comment bellow
  600. //if(itmp > INT_MAX) Error(_SC("integer overflow %ulld %d"));
  601. _nvalue = (SQInteger) itmp;
  602. return TK_INTEGER;
  603. }
  604. return 0;
  605. }
  606. SQInteger SQLexer::ReadID()
  607. {
  608. SQInteger res;
  609. INIT_TEMP_STRING();
  610. do {
  611. APPEND_CHAR(CUR_CHAR);
  612. NEXT();
  613. } while(scisalnum(CUR_CHAR) || CUR_CHAR == _SC('_'));
  614. TERMINATE_BUFFER();
  615. res = GetIDType(&_longstr[0],_longstr.size() - 1);
  616. if(res == TK_IDENTIFIER || res == TK_CONSTRUCTOR || res == TK_DESTRUCTOR) {
  617. _svalue = &_longstr[0];
  618. }
  619. return res;
  620. }