| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362 | /*************************************************************************//*  gd_tokenizer.cpp                                                     *//*************************************************************************//*                       This file is part of:                           *//*                           GODOT ENGINE                                *//*                    http://www.godotengine.org                         *//*************************************************************************//* Copyright (c) 2007-2014 Juan Linietsky, Ariel Manzur.                 *//*                                                                       *//* Permission is hereby granted, free of charge, to any person obtaining *//* a copy of this software and associated documentation files (the       *//* "Software"), to deal in the Software without restriction, including   *//* without limitation the rights to use, copy, modify, merge, publish,   *//* distribute, sublicense, and/or sell copies of the Software, and to    *//* permit persons to whom the Software is furnished to do so, subject to *//* the following conditions:                                             *//*                                                                       *//* The above copyright notice and this permission notice shall be        *//* included in all copies or substantial portions of the Software.       *//*                                                                       *//* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,       *//* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF    *//* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*//* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY  *//* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,  *//* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE     *//* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.                *//*************************************************************************/#include "gd_tokenizer.h"#include "print_string.h"#include "gd_functions.h"#include "io/marshalls.h"#include "map.h"const char* GDTokenizer::token_names[TK_MAX]={"Empty","Identifier","Constant","Self","Built-In Type","Built-In Func","In","'=='","'!='","'<'","'<='","'>'","'>='","'and'","'or'","'not'","'+'","'-'","'*'","'/'","'%'","'<<'","'>>'","'='","'+='","'-='","'*='","'/='","'%='","'<<='","'>>='","'&='","'|='","'^='","'&'","'|'","'^'","'~'",//"Plus Plus",//"Minus Minus","if","elif","else","for","do","while","switch","case","break","continue","pass","return","func","class","extends","tool","static","export","const","var","preload","assert","'['","']'","'{'","'}'","'('","')'","','","';'","'.'","'?'","':'","'\\n'","Error","EOF"};const char *GDTokenizer::get_token_name(Token p_token) {	ERR_FAIL_INDEX_V(p_token,TK_MAX,"<error>");	return token_names[p_token];}static bool _is_text_char(CharType c) {	return (c>='a' && c<='z') || (c>='A' && c<='Z') || (c>='0' && c<='9') || c=='_';}static bool _is_number(CharType c) {	return (c>='0' && c<='9');}static bool _is_hex(CharType c) {	return (c>='0' && c<='9') || (c>='a' && c<='f') || (c>='A' && c<='F');}void GDTokenizerText::_make_token(Token p_type)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=p_type;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_identifier(const StringName& p_identifier)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_IDENTIFIER;	tk.identifier=p_identifier;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_built_in_func(GDFunctions::Function p_func)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_BUILT_IN_FUNC;	tk.func=p_func;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_constant(const Variant& p_constant)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_CONSTANT;	tk.constant=p_constant;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_type(const Variant::Type& p_type) {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_BUILT_IN_TYPE;	tk.vtype=p_type;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_error(const String& p_error) {	error_flag=true;	last_error=p_error;	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_ERROR;	tk.constant=p_error;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_newline(int p_spaces) {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_NEWLINE;	tk.constant=p_spaces;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_advance() {	if (error_flag) {		//parser broke		_make_error(last_error);		return;	}	if (code_pos>=len) {		_make_token(TK_EOF);		return;	}#define GETCHAR(m_ofs) ((m_ofs+code_pos)>=len?0:_code[m_ofs+code_pos])#define INCPOS(m_amount) { code_pos+=m_amount; column+=m_amount; }	while (true) {		bool is_node_path=false;		switch(GETCHAR(0)) {			case 0:				_make_token(TK_EOF);				break;			case '\\':				INCPOS(1);				if (GETCHAR(0)=='\r') {					INCPOS(1);				}				if (GETCHAR(0)!='\n') {					_make_error("Expected newline after '\\'.");					return;				}				INCPOS(1);				while(GETCHAR(0)==' ' || GETCHAR(0)=='\t') {					INCPOS(1);				}				continue;			case '\t':			case '\r':			case ' ':				INCPOS(1);				continue;			case '\n': {				line++;				INCPOS(1);				column=0;				int i=0;				while(GETCHAR(i)==' ' || GETCHAR(i)=='\t') {					i++;				}				_make_newline(i);				return;			}#if 1 //py style tokenizer			case '#': { // line comment skip				while(GETCHAR(0)!='\n') {					code_pos++;					if (GETCHAR(0)==0) { //end of file						_make_error("Unterminated Comment");						return;					}				}				INCPOS(1);				column=0;				line++;				int i=0;				while(GETCHAR(i)==' ' || GETCHAR(i)=='\t') {					i++;				}				_make_newline(i);				return;			} break;#endif			case '/': {				switch(GETCHAR(1)) {#if 0 // c style tokenizer					case '*': { // block comment						int pos = code_pos+2;						int new_line=line;						int new_col=column+2;						while(true) {							if (_code[pos]=='0') {								_make_error("Unterminated Comment");								code_pos=pos;								return;							}							if (_code[pos]=='*' && _code[pos+1]=='/') {								new_col+=2;								pos+=2; //compensate								break;							} else if (_code[pos]=='\n') {								new_line++;								new_col=0;							} else {								new_col++;							}							pos++;						}						column=new_col;						line=new_line;						code_pos=pos;						continue;					} break;					case '/': { // line comment skip						while(GETCHAR(0)!='\n') {							code_pos++;							if (GETCHAR(0)==0) { //end of file								_make_error("Unterminated Comment");								return;							}						}						INCPOS(1);						column=0;						line++;						continue;					} break;#endif					case '=': { // diveq						_make_token(TK_OP_ASSIGN_DIV);						INCPOS(1);					} break;					default:						_make_token(TK_OP_DIV);				}			} break;			case '=': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_EQUAL);					INCPOS(1);				} else					_make_token(TK_OP_ASSIGN);			} break;			case '<': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_LESS_EQUAL);					INCPOS(1);				} else if (GETCHAR(1)=='<') {					if (GETCHAR(2)=='=') {						_make_token(TK_OP_ASSIGN_SHIFT_LEFT);						INCPOS(1);					} else {						_make_token(TK_OP_SHIFT_LEFT);					}					INCPOS(1);				} else					_make_token(TK_OP_LESS);			} break;			case '>': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_GREATER_EQUAL);					INCPOS(1);				} else if (GETCHAR(1)=='>') {					if (GETCHAR(2)=='=') {						_make_token(TK_OP_ASSIGN_SHIFT_RIGHT);						INCPOS(1);					} else {						_make_token(TK_OP_SHIFT_RIGHT);					}					INCPOS(1);				} else {					_make_token(TK_OP_GREATER);				}			} break;			case '!': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_NOT_EQUAL);					INCPOS(1);				} else {					_make_token(TK_OP_NOT);				}			} break;			//case '"' //string - no strings in shader			//case '\'' //string - no strings in shader			case '{':				_make_token(TK_CURLY_BRACKET_OPEN);				break;			case '}':				_make_token(TK_CURLY_BRACKET_CLOSE);				break;			case '[':				_make_token(TK_BRACKET_OPEN);				break;			case ']':				_make_token(TK_BRACKET_CLOSE);				break;			case '(':				_make_token(TK_PARENTHESIS_OPEN);				break;			case ')':				_make_token(TK_PARENTHESIS_CLOSE);				break;			case ',':				_make_token(TK_COMMA);				break;			case ';':				_make_token(TK_SEMICOLON);				break;			case '?':				_make_token(TK_QUESTION_MARK);				break;			case ':':				_make_token(TK_COLON); //for methods maybe but now useless.				break;			case '^': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_XOR);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_XOR);				}			} break;			case '~':				_make_token(TK_OP_BIT_INVERT);				break;			case '&': {				if (GETCHAR(1)=='&') {					_make_token(TK_OP_AND);					INCPOS(1);				} else if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_AND);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_AND);				}			} break;			case '|': {				if (GETCHAR(1)=='|') {					_make_token(TK_OP_OR);					INCPOS(1);				} else if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_OR);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_OR);				}			} break;			case '*': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_MUL);					INCPOS(1);				} else {					_make_token(TK_OP_MUL);				}			} break;			case '+': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_ADD);					INCPOS(1);				//}  else if (GETCHAR(1)=='+') {				//	_make_token(TK_OP_PLUS_PLUS);				//	INCPOS(1);				} else {					_make_token(TK_OP_ADD);				}			} break;			case '-': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_SUB);					INCPOS(1);				//}  else if (GETCHAR(1)=='-') {				//	_make_token(TK_OP_MINUS_MINUS);				//	INCPOS(1);				} else {					_make_token(TK_OP_SUB);				}			} break;			case '%': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_MOD);					INCPOS(1);				} else {					_make_token(TK_OP_MOD);				}			} break;			case '@':				if (CharType(GETCHAR(1))!='"') {					_make_error("Unexpected '@'");					return;				}				INCPOS(1);				is_node_path=true;			case '"': {				int i=1;				String str;				while(true) {					if (CharType(GETCHAR(i)==0)) {						_make_error("Unterminated String");						return;					} else if (CharType(GETCHAR(i)=='"')) {						break;					} else if (CharType(GETCHAR(i)=='\\')) {						//escaped characters...						i++;						CharType next = GETCHAR(i);						if (next==0) {							_make_error("Unterminated String");							return;						}						CharType res=0;						switch(next) {							case 'a': res=7; break;							case 'b': res=8; break;							case 't': res=9; break;							case 'n': res=10; break;							case 'v': res=11; break;							case 'f': res=12; break;							case 'r': res=13; break;							case '\'': res='\''; break;							case '\"': res='\"'; break;							case '\\': res='\\'; break;							case 'x': {								//hexnumbarh - oct is deprecated								int read=0;								for(int j=0;j<4;j++) {									CharType c = GETCHAR(i+j);									if (c==0) {										_make_error("Unterminated String");										return;									}									if (!_is_hex(c)) {										if (j==0 || !(j&1)) {											_make_error("Malformed hex constant in string");											return;										} else											break;									}									CharType v;									if (c>='0' && c<='9') {										v=c-'0';									} else if (c>='a' && c<='f') {										v=c-'a';										v+=10;									} else if (c>='A' && c<='F') {										v=c-'A';										v+=10;									} else {										ERR_PRINT("BUG");										v=0;									}									res<<=4;									res|=v;									read++;								}								i+=read-1;							} break;							default: {								_make_error("Invalid escape sequence");								return;							} break;						}						str+=res;					} else {						str+=CharType(GETCHAR(i));					}					i++;				}				INCPOS(i);				if (is_node_path) {					_make_constant(NodePath(str));				} else {					_make_constant(str);				}			} break;			default: {				if (_is_number(GETCHAR(0)) || (GETCHAR(0)=='.' && _is_number(GETCHAR(1)))) {					// parse number					bool period_found=false;					bool exponent_found=false;					bool hexa_found=false;					bool sign_found=false;					String str;					int i=0;					while(true) {						if (GETCHAR(i)=='.') {							if (period_found || exponent_found) {                                _make_error("Invalid numeric constant at '.'");								return;							}							period_found=true;						} else if (GETCHAR(i)=='x') {                            if (hexa_found || str.length()!=1 || !( (i==1 && str[0]=='0') || (i==2 && str[1]=='0' && str[0]=='-') ) ) {                                _make_error("Invalid numeric constant at 'x'");								return;							}							hexa_found=true;                        } else if (!hexa_found && GETCHAR(i)=='e') {							if (hexa_found || exponent_found) {                                _make_error("Invalid numeric constant at 'e'");								return;							}							exponent_found=true;						} else if (_is_number(GETCHAR(i))) {							//all ok						} else if (hexa_found && _is_hex(GETCHAR(i))) {						} else if ((GETCHAR(i)=='-' || GETCHAR(i)=='+') && exponent_found) {							if (sign_found) {                                _make_error("Invalid numeric constant at '-'");								return;							}							sign_found=true;						} else							break;						str+=CharType(GETCHAR(i));						i++;					}                    if (!( _is_number(str[str.length()-1]) || (hexa_found && _is_hex(str[str.length()-1])))) {                        _make_error("Invalid numeric constant: "+str);						return;					}					INCPOS(str.length());                    if (hexa_found) {                        int val = str.hex_to_int();                        _make_constant(val);                    } else if (period_found) {						real_t val = str.to_double();						//print_line("*%*%*%*% to convert: "+str+" result: "+rtos(val));						_make_constant(val);                    } else {						int val = str.to_int();						_make_constant(val);					}					return;				}				if (GETCHAR(0)=='.') {					//parse period					_make_token(TK_PERIOD);					break;				}				if (_is_text_char(GETCHAR(0))) {					// parse identifier					String str;					str+=CharType(GETCHAR(0));					int i=1;					while(_is_text_char(GETCHAR(i))) {						str+=CharType(GETCHAR(i));						i++;					}					bool identifier=false;					if (str=="null") {						_make_constant(Variant());					} else if (str=="true") {						_make_constant(true);					} else if (str=="false") {						_make_constant(false);					} else {						bool found=false;						struct _bit { Variant::Type type; const char *text;};						//built in types						static const  _bit type_list[]={							//types							{Variant::BOOL,"bool"},							{Variant::INT,"int"},							{Variant::REAL,"float"},							{Variant::STRING,"String"},							{Variant::VECTOR2,"vec2"},							{Variant::VECTOR2,"Vector2"},							{Variant::RECT2,"Rect2"},							{Variant::MATRIX32,"Matrix32"},							{Variant::MATRIX32,"mat32"},							{Variant::VECTOR3,"vec3"},							{Variant::VECTOR3,"Vector3"},							{Variant::_AABB,"AABB"},							{Variant::_AABB,"Rect3"},							{Variant::PLANE,"Plane"},							{Variant::QUAT,"Quat"},							{Variant::MATRIX3,"mat3"},							{Variant::MATRIX3,"Matrix3"},							{Variant::TRANSFORM,"trn"},							{Variant::TRANSFORM,"Transform"},							{Variant::COLOR,"Color"},							{Variant::IMAGE,"Image"},							{Variant::_RID,"RID"},							{Variant::OBJECT,"Object"},							{Variant::INPUT_EVENT,"InputEvent"},							{Variant::DICTIONARY,"dict"},							{Variant::DICTIONARY,"Dictionary"},							{Variant::ARRAY,"Array"},							{Variant::RAW_ARRAY,"RawArray"},							{Variant::INT_ARRAY,"IntArray"},							{Variant::REAL_ARRAY,"FloatArray"},							{Variant::STRING_ARRAY,"StringArray"},							{Variant::VECTOR2_ARRAY,"Vector2Array"},							{Variant::VECTOR3_ARRAY,"Vector3Array"},							{Variant::COLOR_ARRAY,"ColorArray"},							{Variant::VARIANT_MAX,NULL},						};						{							int idx=0;							while(type_list[idx].text) {								if (str==type_list[idx].text) {									_make_type(type_list[idx].type);									found=true;									break;								}								idx++;							}						}						if (!found) {							//built in func?							for(int i=0;i<GDFunctions::FUNC_MAX;i++) {								if (str==GDFunctions::get_func_name(GDFunctions::Function(i))) {									_make_built_in_func(GDFunctions::Function(i));									found=true;									 break;								}							}							//keywor						}						if (!found) {							struct _kws { Token token; const char *text;};							static const  _kws keyword_list[]={								//ops								{TK_OP_IN,"in"},								{TK_OP_NOT,"not"},								{TK_OP_OR,"or"},								{TK_OP_AND,"and"},								//func								{TK_PR_FUNCTION,"func"},								{TK_PR_FUNCTION,"function"},								{TK_PR_CLASS,"class"},								{TK_PR_EXTENDS,"extends"},								{TK_PR_TOOL,"tool"},								{TK_PR_STATIC,"static"},								{TK_PR_EXPORT,"export"},								{TK_PR_VAR,"var"},								{TK_PR_PRELOAD,"preload"},								{TK_PR_ASSERT,"assert"},								{TK_PR_CONST,"const"},								//controlflow								{TK_CF_IF,"if"},								{TK_CF_ELIF,"elif"},								{TK_CF_ELSE,"else"},								{TK_CF_FOR,"for"},								{TK_CF_WHILE,"while"},								{TK_CF_DO,"do"},								{TK_CF_SWITCH,"switch"},								{TK_CF_BREAK,"break"},								{TK_CF_CONTINUE,"continue"},								{TK_CF_RETURN,"return"},								{TK_CF_PASS,"pass"},								{TK_SELF,"self"},								{TK_ERROR,NULL}							};							int idx=0;							found=false;							while(keyword_list[idx].text) {								if (str==keyword_list[idx].text) {									_make_token(keyword_list[idx].token);									found=true;									break;								}								idx++;							}						}						if (!found)							identifier=true;					}					if (identifier) {						_make_identifier(str);					}					INCPOS(str.length());					return;				}				_make_error("Unknown character");				return;			} break;		}		INCPOS(1);		break;	}}void GDTokenizerText::set_code(const String& p_code) {	code=p_code;	len = p_code.length();	if (len) {		_code=&code[0];	} else {		_code=NULL;	}	code_pos=0;	line=1; //it is stand-ar-ized that lines begin in 1 in code..	column=0;	tk_rb_pos=0;	error_flag=false;	last_error="";	for(int i=0;i<MAX_LOOKAHEAD+1;i++)		_advance();}GDTokenizerText::Token GDTokenizerText::get_token(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, TK_ERROR);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, TK_ERROR);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].type;}int GDTokenizerText::get_token_line(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, -1);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, -1);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].line;}int GDTokenizerText::get_token_column(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, -1);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, -1);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].col;}const Variant& GDTokenizerText::get_token_constant(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, tk_rb[0].constant);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, tk_rb[0].constant);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_CONSTANT,tk_rb[0].constant);	return tk_rb[ofs].constant;}StringName GDTokenizerText::get_token_identifier(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, StringName());	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, StringName());	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_IDENTIFIER,StringName());	return tk_rb[ofs].identifier;}GDFunctions::Function GDTokenizerText::get_token_built_in_func(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, GDFunctions::FUNC_MAX);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, GDFunctions::FUNC_MAX);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_BUILT_IN_FUNC,GDFunctions::FUNC_MAX);	return tk_rb[ofs].func;}Variant::Type GDTokenizerText::get_token_type(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, Variant::NIL);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, Variant::NIL);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_BUILT_IN_TYPE,Variant::NIL);	return tk_rb[ofs].vtype;}int GDTokenizerText::get_token_line_indent(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, 0);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, 0);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_NEWLINE,0);	return tk_rb[ofs].constant;}String GDTokenizerText::get_token_error(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, String());	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, String());	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_ERROR,String());	return tk_rb[ofs].constant;}void GDTokenizerText::advance(int p_amount) {	ERR_FAIL_COND( p_amount <=0 );	for(int i=0;i<p_amount;i++)		_advance();}//////////////////////////////////////////////////////////////////////////////////////////////////////#define BYTECODE_VERSION 1Error GDTokenizerBuffer::set_code_buffer(const Vector<uint8_t> & p_buffer) {	const uint8_t *buf=p_buffer.ptr();	int total_len=p_buffer.size();	ERR_FAIL_COND_V( p_buffer.size()<24 || p_buffer[0]!='G' || p_buffer[1]!='D' || p_buffer[2]!='S' || p_buffer[3]!='C',ERR_INVALID_DATA);		int version = decode_uint32(&buf[4]);	if (version>1) {		ERR_EXPLAIN("Bytecode is too New!");		ERR_FAIL_COND_V(version>BYTECODE_VERSION,ERR_INVALID_DATA);	}	int identifier_count = decode_uint32(&buf[8]);	int constant_count = decode_uint32(&buf[12]);	int line_count = decode_uint32(&buf[16]);	int token_count = decode_uint32(&buf[20]);	const uint8_t *b=buf;		b=&buf[24];	total_len-=24;		identifiers.resize(identifier_count);	for(int i=0;i<identifier_count;i++) {				int len = decode_uint32(b);		ERR_FAIL_COND_V(len>total_len,ERR_INVALID_DATA);		b+=4;		Vector<uint8_t> cs;		cs.resize(len);		for(int j=0;j<len;j++) {			cs[j]=b[j]^0xb6;		}		cs[cs.size()-1]=0;		String s;		s.parse_utf8((const char*)cs.ptr());		b+=len;		total_len-=len+4;		identifiers[i]=s;	}		constants.resize(constant_count);	for(int i=0;i<constant_count;i++) {		Variant v;		int len;		Error err = decode_variant(v,b,total_len,&len);		if (err)			return err;		b+=len;		total_len-=len;		constants[i]=v;	}	ERR_FAIL_COND_V(line_count*8>total_len,ERR_INVALID_DATA);	for(int i=0;i<line_count;i++) {		uint32_t token=decode_uint32(b);		b+=4;		uint32_t linecol=decode_uint32(b);		b+=4;		lines.insert(token,linecol);		total_len-=8;	}	tokens.resize(token_count);	for(int i=0;i<token_count;i++) {		ERR_FAIL_COND_V( total_len < 1, ERR_INVALID_DATA);		if ((*b)&TOKEN_BYTE_MASK) { //little endian always			ERR_FAIL_COND_V( total_len < 4, ERR_INVALID_DATA);			tokens[i]=decode_uint32(b)&~TOKEN_BYTE_MASK;			b+=4;		} else {			tokens[i]=*b;			b+=1;			total_len--;		}	}	token=0;	return OK;}Vector<uint8_t> GDTokenizerBuffer::parse_code_string(const String& p_code) {	Vector<uint8_t> buf;	Map<StringName,int> identifier_map;	HashMap<Variant,int,VariantHasher> constant_map;	Map<uint32_t,int> line_map;	Vector<uint32_t> token_array;	GDTokenizerText tt;	tt.set_code(p_code);	int line=-1;	int col=0;	while(true) {		if (tt.get_token_line()!=line) {			line=tt.get_token_line();			line_map[line]=token_array.size();		}		uint32_t token=tt.get_token();		switch(tt.get_token()) {			case TK_IDENTIFIER: {				StringName id = tt.get_token_identifier();				if (!identifier_map.has(id)) {					int idx = identifier_map.size();					identifier_map[id]=idx;				}				token|=identifier_map[id]<<TOKEN_BITS;			} break;			case TK_CONSTANT: {				Variant c = tt.get_token_constant();				if (!constant_map.has(c)) {					int idx = constant_map.size();					constant_map[c]=idx;				}				token|=constant_map[c]<<TOKEN_BITS;			} break;			case TK_BUILT_IN_TYPE: {				token|=tt.get_token_type()<<TOKEN_BITS;			} break;			case TK_BUILT_IN_FUNC: {				token|=tt.get_token_built_in_func()<<TOKEN_BITS;			} break;			case TK_NEWLINE: {				token|=tt.get_token_line_indent()<<TOKEN_BITS;			} break;			case TK_ERROR: {				ERR_FAIL_V(Vector<uint8_t>());			} break;			default: {}		};		token_array.push_back(token);		if (tt.get_token()==TK_EOF)			break;		tt.advance();	}	//reverse maps	Map<int,StringName> rev_identifier_map;	for(Map<StringName,int>::Element *E=identifier_map.front();E;E=E->next()) {		rev_identifier_map[E->get()]=E->key();	}	Map<int,Variant> rev_constant_map;	const Variant *K =NULL;	while((K=constant_map.next(K))) {		rev_constant_map[constant_map[*K]]=*K;	}	Map<int,uint32_t> rev_line_map;	for(Map<uint32_t,int>::Element *E=line_map.front();E;E=E->next()) {		rev_line_map[E->get()]=E->key();	}	//save header	buf.resize(24);	buf[0]='G';	buf[1]='D';	buf[2]='S';	buf[3]='C';	encode_uint32(BYTECODE_VERSION,&buf[4]);	encode_uint32(identifier_map.size(),&buf[8]);	encode_uint32(constant_map.size(),&buf[12]);	encode_uint32(line_map.size(),&buf[16]);	encode_uint32(token_array.size(),&buf[20]);	//save identifiers	for(Map<int,StringName>::Element *E=rev_identifier_map.front();E;E=E->next()) {		CharString cs = String(E->get()).utf8();		int len = cs.length()+1;		int extra = 4-(len%4);		if (extra==4)			extra=0;		uint8_t ibuf[4];		encode_uint32(len+extra,ibuf);		for(int i=0;i<4;i++) {			buf.push_back(ibuf[i]);		}		for(int i=0;i<len;i++) {			buf.push_back(cs[i]^0xb6);		}		for(int i=0;i<extra;i++) {			buf.push_back(0^0xb6);		}	}	for(Map<int,Variant>::Element *E=rev_constant_map.front();E;E=E->next()) {		int len;		Error err = encode_variant(E->get(),NULL,len);		ERR_FAIL_COND_V(err!=OK,Vector<uint8_t>());		int pos=buf.size();		buf.resize(pos+len);		encode_variant(E->get(),&buf[pos],len);	}	for(Map<int,uint32_t>::Element *E=rev_line_map.front();E;E=E->next()) {		uint8_t ibuf[8];		encode_uint32(E->key(),&ibuf[0]);		encode_uint32(E->get(),&ibuf[4]);		for(int i=0;i<8;i++)			buf.push_back(ibuf[i]);	}	for(int i=0;i<token_array.size();i++) {		uint32_t token = token_array[i];		if (token&~TOKEN_MASK) {			uint8_t buf4[4];			encode_uint32(token_array[i]|TOKEN_BYTE_MASK,&buf4[0]);			for(int j=0;j<4;j++) {				buf.push_back(buf4[j]);			}		} else {			buf.push_back(token);		}	}	return buf;}GDTokenizerBuffer::Token GDTokenizerBuffer::get_token(int p_offset) const {	int offset = token+p_offset;	if (offset<0 || offset>=tokens.size())		return TK_EOF;	return GDTokenizerBuffer::Token(tokens[offset]&TOKEN_MASK);}StringName GDTokenizerBuffer::get_token_identifier(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),StringName());	uint32_t identifier = tokens[offset]>>TOKEN_BITS;	ERR_FAIL_INDEX_V(identifier,identifiers.size(),StringName());	return identifiers[identifier];}GDFunctions::Function GDTokenizerBuffer::get_token_built_in_func(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),GDFunctions::FUNC_MAX);	return GDFunctions::Function(tokens[offset]>>TOKEN_BITS);}Variant::Type GDTokenizerBuffer::get_token_type(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),Variant::NIL);	return Variant::Type(tokens[offset]>>TOKEN_BITS);}int GDTokenizerBuffer::get_token_line(int p_offset) const{	int offset = token+p_offset;	int pos = lines.find_nearest(offset);	if (pos<0)		return -1;	if (pos>=lines.size())		pos=lines.size()-1;	uint32_t l = lines.getv(pos);	return l&TOKEN_LINE_MASK;}int GDTokenizerBuffer::get_token_column(int p_offset) const{	int offset = token+p_offset;	int pos = lines.find_nearest(offset);	if (pos<0)		return -1;	if (pos>=lines.size())		pos=lines.size()-1;	uint32_t l = lines.getv(pos);	return l>>TOKEN_LINE_BITS;}int GDTokenizerBuffer::get_token_line_indent(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),0);	return tokens[offset]>>TOKEN_BITS;}const Variant& GDTokenizerBuffer::get_token_constant(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),nil);	uint32_t constant = tokens[offset]>>TOKEN_BITS;	ERR_FAIL_INDEX_V(constant,constants.size(),nil);	return constants[constant];}String GDTokenizerBuffer::get_token_error(int p_offset) const{	ERR_FAIL_V(String());}void GDTokenizerBuffer::advance(int p_amount){	ERR_FAIL_INDEX(p_amount+token,tokens.size());	token+=p_amount;}GDTokenizerBuffer::GDTokenizerBuffer(){	token=0;}
 |