| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394 | /*************************************************************************//*  gd_tokenizer.cpp                                                     *//*************************************************************************//*                       This file is part of:                           *//*                           GODOT ENGINE                                *//*                    http://www.godotengine.org                         *//*************************************************************************//* Copyright (c) 2007-2015 Juan Linietsky, Ariel Manzur.                 *//*                                                                       *//* Permission is hereby granted, free of charge, to any person obtaining *//* a copy of this software and associated documentation files (the       *//* "Software"), to deal in the Software without restriction, including   *//* without limitation the rights to use, copy, modify, merge, publish,   *//* distribute, sublicense, and/or sell copies of the Software, and to    *//* permit persons to whom the Software is furnished to do so, subject to *//* the following conditions:                                             *//*                                                                       *//* The above copyright notice and this permission notice shall be        *//* included in all copies or substantial portions of the Software.       *//*                                                                       *//* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,       *//* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF    *//* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*//* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY  *//* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,  *//* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE     *//* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.                *//*************************************************************************/#include "gd_tokenizer.h"#include "print_string.h"#include "gd_functions.h"#include "io/marshalls.h"#include "map.h"const char* GDTokenizer::token_names[TK_MAX]={"Empty","Identifier","Constant","Self","Built-In Type","Built-In Func","In","'=='","'!='","'<'","'<='","'>'","'>='","'and'","'or'","'not'","'+'","'-'","'*'","'/'","'%'","'<<'","'>>'","'='","'+='","'-='","'*='","'/='","'%='","'<<='","'>>='","'&='","'|='","'^='","'&'","'|'","'^'","'~'",//"Plus Plus",//"Minus Minus","if","elif","else","for","do","while","switch","case","break","continue","pass","return","func","class","extends","tool","static","export","setget","const","var","preload","assert","yield","'['","']'","'{'","'}'","'('","')'","','","';'","'.'","'?'","':'","'\\n'","Error","EOF","Cursor"};const char *GDTokenizer::get_token_name(Token p_token) {	ERR_FAIL_INDEX_V(p_token,TK_MAX,"<error>");	return token_names[p_token];}static bool _is_text_char(CharType c) {	return (c>='a' && c<='z') || (c>='A' && c<='Z') || (c>='0' && c<='9') || c=='_';}static bool _is_number(CharType c) {	return (c>='0' && c<='9');}static bool _is_hex(CharType c) {	return (c>='0' && c<='9') || (c>='a' && c<='f') || (c>='A' && c<='F');}void GDTokenizerText::_make_token(Token p_type)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=p_type;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_identifier(const StringName& p_identifier)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_IDENTIFIER;	tk.identifier=p_identifier;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_built_in_func(GDFunctions::Function p_func)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_BUILT_IN_FUNC;	tk.func=p_func;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_constant(const Variant& p_constant)  {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_CONSTANT;	tk.constant=p_constant;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_type(const Variant::Type& p_type) {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_BUILT_IN_TYPE;	tk.vtype=p_type;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_error(const String& p_error) {	error_flag=true;	last_error=p_error;	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_ERROR;	tk.constant=p_error;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_make_newline(int p_spaces) {	TokenData &tk=tk_rb[tk_rb_pos];	tk.type=TK_NEWLINE;	tk.constant=p_spaces;	tk.line=line;	tk.col=column;	tk_rb_pos=(tk_rb_pos+1)%TK_RB_SIZE;}void GDTokenizerText::_advance() {	if (error_flag) {		//parser broke		_make_error(last_error);		return;	}	if (code_pos>=len) {		_make_token(TK_EOF);		return;	}#define GETCHAR(m_ofs) ((m_ofs+code_pos)>=len?0:_code[m_ofs+code_pos])#define INCPOS(m_amount) { code_pos+=m_amount; column+=m_amount; }	while (true) {		bool is_node_path  = false;		StringMode string_mode=STRING_DOUBLE_QUOTE;		switch(GETCHAR(0)) {			case 0:				_make_token(TK_EOF);				break;			case '\\':				INCPOS(1);				if (GETCHAR(0)=='\r') {					INCPOS(1);				}				if (GETCHAR(0)!='\n') {					_make_error("Expected newline after '\\'.");					return;				}				INCPOS(1);				while(GETCHAR(0)==' ' || GETCHAR(0)=='\t') {					INCPOS(1);				}				continue;			case '\t':			case '\r':			case ' ':				INCPOS(1);				continue;			case '\n': {				line++;				INCPOS(1);				column=0;				int i=0;				while(GETCHAR(i)==' ' || GETCHAR(i)=='\t') {					i++;				}				_make_newline(i);				return;			}#if 1 //py style tokenizer			case '#': { // line comment skip				while(GETCHAR(0)!='\n') {					code_pos++;					if (GETCHAR(0)==0) { //end of file						//_make_error("Unterminated Comment");						_make_token(TK_EOF);						return;					}				}				INCPOS(1);				column=0;				line++;				int i=0;				while(GETCHAR(i)==' ' || GETCHAR(i)=='\t') {					i++;				}				_make_newline(i);				return;			} break;#endif			case '/': {				switch(GETCHAR(1)) {#if 0 // c style tokenizer					case '*': { // block comment						int pos = code_pos+2;						int new_line=line;						int new_col=column+2;						while(true) {							if (_code[pos]=='0') {								_make_error("Unterminated Comment");								code_pos=pos;								return;							}							if (_code[pos]=='*' && _code[pos+1]=='/') {								new_col+=2;								pos+=2; //compensate								break;							} else if (_code[pos]=='\n') {								new_line++;								new_col=0;							} else {								new_col++;							}							pos++;						}						column=new_col;						line=new_line;						code_pos=pos;						continue;					} break;					case '/': { // line comment skip						while(GETCHAR(0)!='\n') {							code_pos++;							if (GETCHAR(0)==0) { //end of file								_make_error("Unterminated Comment");								return;							}						}						INCPOS(1);						column=0;						line++;						continue;					} break;#endif					case '=': { // diveq						_make_token(TK_OP_ASSIGN_DIV);						INCPOS(1);					} break;					default:						_make_token(TK_OP_DIV);				}			} break;			case '=': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_EQUAL);					INCPOS(1);				} else					_make_token(TK_OP_ASSIGN);			} break;			case '<': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_LESS_EQUAL);					INCPOS(1);				} else if (GETCHAR(1)=='<') {					if (GETCHAR(2)=='=') {						_make_token(TK_OP_ASSIGN_SHIFT_LEFT);						INCPOS(1);					} else {						_make_token(TK_OP_SHIFT_LEFT);					}					INCPOS(1);				} else					_make_token(TK_OP_LESS);			} break;			case '>': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_GREATER_EQUAL);					INCPOS(1);				} else if (GETCHAR(1)=='>') {					if (GETCHAR(2)=='=') {						_make_token(TK_OP_ASSIGN_SHIFT_RIGHT);						INCPOS(1);					} else {						_make_token(TK_OP_SHIFT_RIGHT);					}					INCPOS(1);				} else {					_make_token(TK_OP_GREATER);				}			} break;			case '!': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_NOT_EQUAL);					INCPOS(1);				} else {					_make_token(TK_OP_NOT);				}			} break;			//case '"' //string - no strings in shader			//case '\'' //string - no strings in shader			case '{':				_make_token(TK_CURLY_BRACKET_OPEN);				break;			case '}':				_make_token(TK_CURLY_BRACKET_CLOSE);				break;			case '[':				_make_token(TK_BRACKET_OPEN);				break;			case ']':				_make_token(TK_BRACKET_CLOSE);				break;			case '(':				_make_token(TK_PARENTHESIS_OPEN);				break;			case ')':				_make_token(TK_PARENTHESIS_CLOSE);				break;			case ',':				_make_token(TK_COMMA);				break;			case ';':				_make_token(TK_SEMICOLON);				break;			case '?':				_make_token(TK_QUESTION_MARK);				break;			case ':':				_make_token(TK_COLON); //for methods maybe but now useless.				break;			case '^': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_XOR);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_XOR);				}			} break;			case '~':				_make_token(TK_OP_BIT_INVERT);				break;			case '&': {				if (GETCHAR(1)=='&') {					_make_token(TK_OP_AND);					INCPOS(1);				} else if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_AND);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_AND);				}			} break;			case '|': {				if (GETCHAR(1)=='|') {					_make_token(TK_OP_OR);					INCPOS(1);				} else if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_BIT_OR);					INCPOS(1);				} else {					_make_token(TK_OP_BIT_OR);				}			} break;			case '*': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_MUL);					INCPOS(1);				} else {					_make_token(TK_OP_MUL);				}			} break;			case '+': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_ADD);					INCPOS(1);				//}  else if (GETCHAR(1)=='+') {				//	_make_token(TK_OP_PLUS_PLUS);				//	INCPOS(1);				} else {					_make_token(TK_OP_ADD);				}			} break;			case '-': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_SUB);					INCPOS(1);				//}  else if (GETCHAR(1)=='-') {				//	_make_token(TK_OP_MINUS_MINUS);				//	INCPOS(1);				} else {					_make_token(TK_OP_SUB);				}			} break;			case '%': {				if (GETCHAR(1)=='=') {					_make_token(TK_OP_ASSIGN_MOD);					INCPOS(1);				} else {					_make_token(TK_OP_MOD);				}			} break;			case '@':				if( CharType(GETCHAR(1))!='"' && CharType(GETCHAR(1))!='\'' ) {					_make_error("Unexpected '@'");					return;				}				INCPOS(1);				is_node_path=true;							case '\'':			case '"': {					if (GETCHAR(0)=='\'')					string_mode=STRING_SINGLE_QUOTE;																																						int i=1;				if (string_mode==STRING_DOUBLE_QUOTE && GETCHAR(i)=='"' && GETCHAR(i+1)=='"') {					i+=2;					string_mode=STRING_MULTILINE;				}				String str;				while(true) {					if (CharType(GETCHAR(i))==0) {						_make_error("Unterminated String");						return;					} else if( string_mode==STRING_DOUBLE_QUOTE && CharType(GETCHAR(i))=='"' ) {						break;					} else if( string_mode==STRING_SINGLE_QUOTE && CharType(GETCHAR(i))=='\'' ) {						break;					} else if( string_mode==STRING_MULTILINE && CharType(GETCHAR(i))=='\"' &&  CharType(GETCHAR(i+1))=='\"' && CharType(GETCHAR(i+2))=='\"') {						i+=2;						break;					} else if( string_mode!=STRING_MULTILINE && CharType(GETCHAR(i))=='\n') {						_make_error("Unexpected EOL at String.");						return;					} else if (CharType(GETCHAR(i))=='\\') {						//escaped characters...						i++;						CharType next = GETCHAR(i);						if (next==0) {							_make_error("Unterminated String");							return;						}						CharType res=0;						switch(next) {							case 'a': res=7; break;							case 'b': res=8; break;							case 't': res=9; break;							case 'n': res=10; break;							case 'v': res=11; break;							case 'f': res=12; break;							case 'r': res=13; break;							case '\'': res='\''; break;							case '\"': res='\"'; break;							case '\\': res='\\'; break;							case '/': res='/'; break; //wtf							case 'u': {								//hexnumbarh - oct is deprecated								i+=1;								for(int j=0;j<4;j++) {									CharType c = GETCHAR(i+j);									if (c==0) {										_make_error("Unterminated String");										return;									}									if (!((c>='0' && c<='9') || (c>='a' && c<='f') || (c>='A' && c<='F'))) {										_make_error("Malformed hex constant in string");										return;									}									CharType v;									if (c>='0' && c<='9') {										v=c-'0';									} else if (c>='a' && c<='f') {										v=c-'a';										v+=10;									} else if (c>='A' && c<='F') {										v=c-'A';										v+=10;									} else {										ERR_PRINT("BUG");										v=0;									}									res<<=4;									res|=v;								}								i+=3;							} break;							default: {								_make_error("Invalid escape sequence");								return;							} break;						}						str+=res;					} else {						str+=CharType(GETCHAR(i));					}					i++;				}				INCPOS(i);				if (is_node_path) {					_make_constant(NodePath(str));				} else {					_make_constant(str);				}			} break;			case 0xFFFF: {				_make_token(TK_CURSOR);			} break;			default: {				if (_is_number(GETCHAR(0)) || (GETCHAR(0)=='.' && _is_number(GETCHAR(1)))) {					// parse number					bool period_found=false;					bool exponent_found=false;					bool hexa_found=false;					bool sign_found=false;					String str;					int i=0;					while(true) {						if (GETCHAR(i)=='.') {							if (period_found || exponent_found) {                                _make_error("Invalid numeric constant at '.'");								return;							}							period_found=true;						} else if (GETCHAR(i)=='x') {                            if (hexa_found || str.length()!=1 || !( (i==1 && str[0]=='0') || (i==2 && str[1]=='0' && str[0]=='-') ) ) {                                _make_error("Invalid numeric constant at 'x'");								return;							}							hexa_found=true;                        } else if (!hexa_found && GETCHAR(i)=='e') {							if (hexa_found || exponent_found) {                                _make_error("Invalid numeric constant at 'e'");								return;							}							exponent_found=true;						} else if (_is_number(GETCHAR(i))) {							//all ok						} else if (hexa_found && _is_hex(GETCHAR(i))) {						} else if ((GETCHAR(i)=='-' || GETCHAR(i)=='+') && exponent_found) {							if (sign_found) {                                _make_error("Invalid numeric constant at '-'");								return;							}							sign_found=true;						} else							break;						str+=CharType(GETCHAR(i));						i++;					}                    if (!( _is_number(str[str.length()-1]) || (hexa_found && _is_hex(str[str.length()-1])))) {                        _make_error("Invalid numeric constant: "+str);						return;					}					INCPOS(str.length());                    if (hexa_found) {                        int val = str.hex_to_int();                        _make_constant(val);                    } else if (period_found) {						real_t val = str.to_double();						//print_line("*%*%*%*% to convert: "+str+" result: "+rtos(val));						_make_constant(val);                    } else {						int val = str.to_int();						_make_constant(val);					}					return;				}				if (GETCHAR(0)=='.') {					//parse period					_make_token(TK_PERIOD);					break;				}				if (_is_text_char(GETCHAR(0))) {					// parse identifier					String str;					str+=CharType(GETCHAR(0));					int i=1;					while(_is_text_char(GETCHAR(i))) {						str+=CharType(GETCHAR(i));						i++;					}					bool identifier=false;					if (str=="null") {						_make_constant(Variant());					} else if (str=="true") {						_make_constant(true);					} else if (str=="false") {						_make_constant(false);					} else {						bool found=false;						struct _bit { Variant::Type type; const char *text;};						//built in types						static const  _bit type_list[]={							//types							{Variant::BOOL,"bool"},							{Variant::INT,"int"},							{Variant::REAL,"float"},							{Variant::STRING,"String"},							{Variant::VECTOR2,"vec2"},							{Variant::VECTOR2,"Vector2"},							{Variant::RECT2,"Rect2"},							{Variant::MATRIX32,"Matrix32"},							{Variant::MATRIX32,"mat32"},							{Variant::VECTOR3,"vec3"},							{Variant::VECTOR3,"Vector3"},							{Variant::_AABB,"AABB"},							{Variant::_AABB,"Rect3"},							{Variant::PLANE,"Plane"},							{Variant::QUAT,"Quat"},							{Variant::MATRIX3,"mat3"},							{Variant::MATRIX3,"Matrix3"},							{Variant::TRANSFORM,"trn"},							{Variant::TRANSFORM,"Transform"},							{Variant::COLOR,"Color"},							{Variant::IMAGE,"Image"},							{Variant::_RID,"RID"},							{Variant::OBJECT,"Object"},							{Variant::INPUT_EVENT,"InputEvent"},							{Variant::NODE_PATH,"NodePath"},							{Variant::DICTIONARY,"dict"},							{Variant::DICTIONARY,"Dictionary"},							{Variant::ARRAY,"Array"},							{Variant::RAW_ARRAY,"RawArray"},							{Variant::INT_ARRAY,"IntArray"},							{Variant::REAL_ARRAY,"FloatArray"},							{Variant::STRING_ARRAY,"StringArray"},							{Variant::VECTOR2_ARRAY,"Vector2Array"},							{Variant::VECTOR3_ARRAY,"Vector3Array"},							{Variant::COLOR_ARRAY,"ColorArray"},							{Variant::VARIANT_MAX,NULL},						};						{							int idx=0;							while(type_list[idx].text) {								if (str==type_list[idx].text) {									_make_type(type_list[idx].type);									found=true;									break;								}								idx++;							}						}						if (!found) {							//built in func?							for(int i=0;i<GDFunctions::FUNC_MAX;i++) {								if (str==GDFunctions::get_func_name(GDFunctions::Function(i))) {									_make_built_in_func(GDFunctions::Function(i));									found=true;									 break;								}							}							//keywor						}						if (!found) {							struct _kws { Token token; const char *text;};							static const  _kws keyword_list[]={								//ops								{TK_OP_IN,"in"},								{TK_OP_NOT,"not"},								{TK_OP_OR,"or"},								{TK_OP_AND,"and"},								//func								{TK_PR_FUNCTION,"func"},								{TK_PR_FUNCTION,"function"},								{TK_PR_CLASS,"class"},								{TK_PR_EXTENDS,"extends"},								{TK_PR_TOOL,"tool"},								{TK_PR_STATIC,"static"},								{TK_PR_EXPORT,"export"},								{TK_PR_SETGET,"setget"},								{TK_PR_VAR,"var"},								{TK_PR_PRELOAD,"preload"},								{TK_PR_ASSERT,"assert"},								{TK_PR_YIELD,"yield"},								{TK_PR_SIGNAL,"signal"},								{TK_PR_CONST,"const"},								//controlflow								{TK_CF_IF,"if"},								{TK_CF_ELIF,"elif"},								{TK_CF_ELSE,"else"},								{TK_CF_FOR,"for"},								{TK_CF_WHILE,"while"},								{TK_CF_DO,"do"},								{TK_CF_SWITCH,"switch"},								{TK_CF_BREAK,"break"},								{TK_CF_CONTINUE,"continue"},								{TK_CF_RETURN,"return"},								{TK_CF_PASS,"pass"},								{TK_SELF,"self"},								{TK_ERROR,NULL}							};							int idx=0;							found=false;							while(keyword_list[idx].text) {								if (str==keyword_list[idx].text) {									_make_token(keyword_list[idx].token);									found=true;									break;								}								idx++;							}						}						if (!found)							identifier=true;					}					if (identifier) {						_make_identifier(str);					}					INCPOS(str.length());					return;				}				_make_error("Unknown character");				return;			} break;		}		INCPOS(1);		break;	}}void GDTokenizerText::set_code(const String& p_code) {	code=p_code;	len = p_code.length();	if (len) {		_code=&code[0];	} else {		_code=NULL;	}	code_pos=0;	line=1; //it is stand-ar-ized that lines begin in 1 in code..	column=0;	tk_rb_pos=0;	error_flag=false;	last_error="";	for(int i=0;i<MAX_LOOKAHEAD+1;i++)		_advance();}GDTokenizerText::Token GDTokenizerText::get_token(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, TK_ERROR);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, TK_ERROR);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].type;}int GDTokenizerText::get_token_line(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, -1);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, -1);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].line;}int GDTokenizerText::get_token_column(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, -1);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, -1);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	return tk_rb[ofs].col;}const Variant& GDTokenizerText::get_token_constant(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, tk_rb[0].constant);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, tk_rb[0].constant);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_CONSTANT,tk_rb[0].constant);	return tk_rb[ofs].constant;}StringName GDTokenizerText::get_token_identifier(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, StringName());	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, StringName());	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_IDENTIFIER,StringName());	return tk_rb[ofs].identifier;}GDFunctions::Function GDTokenizerText::get_token_built_in_func(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, GDFunctions::FUNC_MAX);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, GDFunctions::FUNC_MAX);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_BUILT_IN_FUNC,GDFunctions::FUNC_MAX);	return tk_rb[ofs].func;}Variant::Type GDTokenizerText::get_token_type(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, Variant::NIL);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, Variant::NIL);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_BUILT_IN_TYPE,Variant::NIL);	return tk_rb[ofs].vtype;}int GDTokenizerText::get_token_line_indent(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, 0);	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, 0);	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_NEWLINE,0);	return tk_rb[ofs].constant;}String GDTokenizerText::get_token_error(int p_offset) const {	ERR_FAIL_COND_V( p_offset <= -MAX_LOOKAHEAD, String());	ERR_FAIL_COND_V( p_offset >= MAX_LOOKAHEAD, String());	int ofs = (TK_RB_SIZE + tk_rb_pos + p_offset - MAX_LOOKAHEAD -1)%TK_RB_SIZE;	ERR_FAIL_COND_V(tk_rb[ofs].type!=TK_ERROR,String());	return tk_rb[ofs].constant;}void GDTokenizerText::advance(int p_amount) {	ERR_FAIL_COND( p_amount <=0 );	for(int i=0;i<p_amount;i++)		_advance();}//////////////////////////////////////////////////////////////////////////////////////////////////////#define BYTECODE_VERSION 4Error GDTokenizerBuffer::set_code_buffer(const Vector<uint8_t> & p_buffer) {	const uint8_t *buf=p_buffer.ptr();	int total_len=p_buffer.size();	ERR_FAIL_COND_V( p_buffer.size()<24 || p_buffer[0]!='G' || p_buffer[1]!='D' || p_buffer[2]!='S' || p_buffer[3]!='C',ERR_INVALID_DATA);		int version = decode_uint32(&buf[4]);	if (version>BYTECODE_VERSION) {		ERR_EXPLAIN("Bytecode is too New! Please use a newer engine version.");		ERR_FAIL_COND_V(version>BYTECODE_VERSION,ERR_INVALID_DATA);	}	int identifier_count = decode_uint32(&buf[8]);	int constant_count = decode_uint32(&buf[12]);	int line_count = decode_uint32(&buf[16]);	int token_count = decode_uint32(&buf[20]);	const uint8_t *b=buf;		b=&buf[24];	total_len-=24;		identifiers.resize(identifier_count);	for(int i=0;i<identifier_count;i++) {				int len = decode_uint32(b);		ERR_FAIL_COND_V(len>total_len,ERR_INVALID_DATA);		b+=4;		Vector<uint8_t> cs;		cs.resize(len);		for(int j=0;j<len;j++) {			cs[j]=b[j]^0xb6;		}		cs[cs.size()-1]=0;		String s;		s.parse_utf8((const char*)cs.ptr());		b+=len;		total_len-=len+4;		identifiers[i]=s;	}		constants.resize(constant_count);	for(int i=0;i<constant_count;i++) {		Variant v;		int len;		Error err = decode_variant(v,b,total_len,&len);		if (err)			return err;		b+=len;		total_len-=len;		constants[i]=v;	}	ERR_FAIL_COND_V(line_count*8>total_len,ERR_INVALID_DATA);	for(int i=0;i<line_count;i++) {		uint32_t token=decode_uint32(b);		b+=4;		uint32_t linecol=decode_uint32(b);		b+=4;		lines.insert(token,linecol);		total_len-=8;	}	tokens.resize(token_count);	for(int i=0;i<token_count;i++) {		ERR_FAIL_COND_V( total_len < 1, ERR_INVALID_DATA);		if ((*b)&TOKEN_BYTE_MASK) { //little endian always			ERR_FAIL_COND_V( total_len < 4, ERR_INVALID_DATA);			tokens[i]=decode_uint32(b)&~TOKEN_BYTE_MASK;			b+=4;		} else {			tokens[i]=*b;			b+=1;			total_len--;		}	}	token=0;	return OK;}Vector<uint8_t> GDTokenizerBuffer::parse_code_string(const String& p_code) {	Vector<uint8_t> buf;	Map<StringName,int> identifier_map;	HashMap<Variant,int,VariantHasher> constant_map;	Map<uint32_t,int> line_map;	Vector<uint32_t> token_array;	GDTokenizerText tt;	tt.set_code(p_code);	int line=-1;	int col=0;	while(true) {		if (tt.get_token_line()!=line) {			line=tt.get_token_line();			line_map[line]=token_array.size();		}		uint32_t token=tt.get_token();		switch(tt.get_token()) {			case TK_IDENTIFIER: {				StringName id = tt.get_token_identifier();				if (!identifier_map.has(id)) {					int idx = identifier_map.size();					identifier_map[id]=idx;				}				token|=identifier_map[id]<<TOKEN_BITS;			} break;			case TK_CONSTANT: {				Variant c = tt.get_token_constant();				if (!constant_map.has(c)) {					int idx = constant_map.size();					constant_map[c]=idx;				}				token|=constant_map[c]<<TOKEN_BITS;			} break;			case TK_BUILT_IN_TYPE: {				token|=tt.get_token_type()<<TOKEN_BITS;			} break;			case TK_BUILT_IN_FUNC: {				token|=tt.get_token_built_in_func()<<TOKEN_BITS;			} break;			case TK_NEWLINE: {				token|=tt.get_token_line_indent()<<TOKEN_BITS;			} break;			case TK_ERROR: {				ERR_FAIL_V(Vector<uint8_t>());			} break;			default: {}		};		token_array.push_back(token);		if (tt.get_token()==TK_EOF)			break;		tt.advance();	}	//reverse maps	Map<int,StringName> rev_identifier_map;	for(Map<StringName,int>::Element *E=identifier_map.front();E;E=E->next()) {		rev_identifier_map[E->get()]=E->key();	}	Map<int,Variant> rev_constant_map;	const Variant *K =NULL;	while((K=constant_map.next(K))) {		rev_constant_map[constant_map[*K]]=*K;	}	Map<int,uint32_t> rev_line_map;	for(Map<uint32_t,int>::Element *E=line_map.front();E;E=E->next()) {		rev_line_map[E->get()]=E->key();	}	//save header	buf.resize(24);	buf[0]='G';	buf[1]='D';	buf[2]='S';	buf[3]='C';	encode_uint32(BYTECODE_VERSION,&buf[4]);	encode_uint32(identifier_map.size(),&buf[8]);	encode_uint32(constant_map.size(),&buf[12]);	encode_uint32(line_map.size(),&buf[16]);	encode_uint32(token_array.size(),&buf[20]);	//save identifiers	for(Map<int,StringName>::Element *E=rev_identifier_map.front();E;E=E->next()) {		CharString cs = String(E->get()).utf8();		int len = cs.length()+1;		int extra = 4-(len%4);		if (extra==4)			extra=0;		uint8_t ibuf[4];		encode_uint32(len+extra,ibuf);		for(int i=0;i<4;i++) {			buf.push_back(ibuf[i]);		}		for(int i=0;i<len;i++) {			buf.push_back(cs[i]^0xb6);		}		for(int i=0;i<extra;i++) {			buf.push_back(0^0xb6);		}	}	for(Map<int,Variant>::Element *E=rev_constant_map.front();E;E=E->next()) {		int len;		Error err = encode_variant(E->get(),NULL,len);		ERR_FAIL_COND_V(err!=OK,Vector<uint8_t>());		int pos=buf.size();		buf.resize(pos+len);		encode_variant(E->get(),&buf[pos],len);	}	for(Map<int,uint32_t>::Element *E=rev_line_map.front();E;E=E->next()) {		uint8_t ibuf[8];		encode_uint32(E->key(),&ibuf[0]);		encode_uint32(E->get(),&ibuf[4]);		for(int i=0;i<8;i++)			buf.push_back(ibuf[i]);	}	for(int i=0;i<token_array.size();i++) {		uint32_t token = token_array[i];		if (token&~TOKEN_MASK) {			uint8_t buf4[4];			encode_uint32(token_array[i]|TOKEN_BYTE_MASK,&buf4[0]);			for(int j=0;j<4;j++) {				buf.push_back(buf4[j]);			}		} else {			buf.push_back(token);		}	}	return buf;}GDTokenizerBuffer::Token GDTokenizerBuffer::get_token(int p_offset) const {	int offset = token+p_offset;	if (offset<0 || offset>=tokens.size())		return TK_EOF;	return GDTokenizerBuffer::Token(tokens[offset]&TOKEN_MASK);}StringName GDTokenizerBuffer::get_token_identifier(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),StringName());	uint32_t identifier = tokens[offset]>>TOKEN_BITS;	ERR_FAIL_INDEX_V(identifier,identifiers.size(),StringName());	return identifiers[identifier];}GDFunctions::Function GDTokenizerBuffer::get_token_built_in_func(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),GDFunctions::FUNC_MAX);	return GDFunctions::Function(tokens[offset]>>TOKEN_BITS);}Variant::Type GDTokenizerBuffer::get_token_type(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),Variant::NIL);	return Variant::Type(tokens[offset]>>TOKEN_BITS);}int GDTokenizerBuffer::get_token_line(int p_offset) const{	int offset = token+p_offset;	int pos = lines.find_nearest(offset);	if (pos<0)		return -1;	if (pos>=lines.size())		pos=lines.size()-1;	uint32_t l = lines.getv(pos);	return l&TOKEN_LINE_MASK;}int GDTokenizerBuffer::get_token_column(int p_offset) const{	int offset = token+p_offset;	int pos = lines.find_nearest(offset);	if (pos<0)		return -1;	if (pos>=lines.size())		pos=lines.size()-1;	uint32_t l = lines.getv(pos);	return l>>TOKEN_LINE_BITS;}int GDTokenizerBuffer::get_token_line_indent(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),0);	return tokens[offset]>>TOKEN_BITS;}const Variant& GDTokenizerBuffer::get_token_constant(int p_offset) const{	int offset = token+p_offset;	ERR_FAIL_INDEX_V(offset,tokens.size(),nil);	uint32_t constant = tokens[offset]>>TOKEN_BITS;	ERR_FAIL_INDEX_V(constant,constants.size(),nil);	return constants[constant];}String GDTokenizerBuffer::get_token_error(int p_offset) const{	ERR_FAIL_V(String());}void GDTokenizerBuffer::advance(int p_amount){	ERR_FAIL_INDEX(p_amount+token,tokens.size());	token+=p_amount;}GDTokenizerBuffer::GDTokenizerBuffer(){	token=0;}
 |