/**************************************************************************/
/*  gdscript_tokenizer.h                                                  */
/**************************************************************************/
/*                         This file is part of:                          */
/*                             GODOT ENGINE                               */
/*                        https://godotengine.org                         */
/**************************************************************************/
/* Copyright (c) 2014-present Godot Engine contributors (see AUTHORS.md). */
/* Copyright (c) 2007-2014 Juan Linietsky, Ariel Manzur.                  */
/*                                                                        */
/* Permission is hereby granted, free of charge, to any person obtaining  */
/* a copy of this software and associated documentation files (the        */
/* "Software"), to deal in the Software without restriction, including    */
/* without limitation the rights to use, copy, modify, merge, publish,    */
/* distribute, sublicense, and/or sell copies of the Software, and to     */
/* permit persons to whom the Software is furnished to do so, subject to  */
/* the following conditions:                                              */
/*                                                                        */
/* The above copyright notice and this permission notice shall be         */
/* included in all copies or substantial portions of the Software.        */
/*                                                                        */
/* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,        */
/* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF     */
/* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. */
/* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY   */
/* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,   */
/* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE      */
/* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.                 
*//**************************************************************************/#pragma once#include "core/templates/hash_map.h"#include "core/templates/list.h"#include "core/templates/vector.h"#include "core/variant/variant.h"class GDScriptTokenizer {public:	enum CursorPlace {		CURSOR_NONE,		CURSOR_BEGINNING,		CURSOR_MIDDLE,		CURSOR_END,	};	struct Token {		// If this enum changes, please increment the TOKENIZER_VERSION in gdscript_tokenizer_buffer.h		enum Type {			EMPTY,			// Basic			ANNOTATION,			IDENTIFIER,			LITERAL,			// Comparison			LESS,			LESS_EQUAL,			GREATER,			GREATER_EQUAL,			EQUAL_EQUAL,			BANG_EQUAL,			// Logical			AND,			OR,			NOT,			AMPERSAND_AMPERSAND,			PIPE_PIPE,			BANG,			// Bitwise			AMPERSAND,			PIPE,			TILDE,			CARET,			LESS_LESS,			GREATER_GREATER,			// Math			PLUS,			MINUS,			STAR,			STAR_STAR,			SLASH,			PERCENT,			// Assignment			EQUAL,			PLUS_EQUAL,			MINUS_EQUAL,			STAR_EQUAL,			STAR_STAR_EQUAL,			SLASH_EQUAL,			PERCENT_EQUAL,			LESS_LESS_EQUAL,			GREATER_GREATER_EQUAL,			AMPERSAND_EQUAL,			PIPE_EQUAL,			CARET_EQUAL,			// Control flow			IF,			ELIF,			ELSE,			FOR,			WHILE,			BREAK,			CONTINUE,			PASS,			RETURN,			MATCH,			WHEN,			// Keywords			AS,			ASSERT,			AWAIT,			BREAKPOINT,			CLASS,			CLASS_NAME,			TK_CONST, // Conflict with WinAPI.			ENUM,			EXTENDS,			FUNC,			TK_IN, // Conflict with WinAPI.			IS,			NAMESPACE,			PRELOAD,			SELF,			SIGNAL,			STATIC,			SUPER,			TRAIT,			VAR,			TK_VOID, // Conflict with WinAPI.			
YIELD,			// Punctuation			BRACKET_OPEN,			BRACKET_CLOSE,			BRACE_OPEN,			BRACE_CLOSE,			PARENTHESIS_OPEN,			PARENTHESIS_CLOSE,			COMMA,			SEMICOLON,			PERIOD,			PERIOD_PERIOD,			PERIOD_PERIOD_PERIOD,			COLON,			DOLLAR,			FORWARD_ARROW,			UNDERSCORE,			// Whitespace			NEWLINE,			INDENT,			DEDENT,			// Constants			CONST_PI,			CONST_TAU,			CONST_INF,			CONST_NAN,			// Error message improvement			VCS_CONFLICT_MARKER,			BACKTICK,			QUESTION_MARK,			// Special			ERROR,			TK_EOF, // "EOF" is reserved			TK_MAX		};		Type type = EMPTY;		Variant literal;		int start_line = 0, end_line = 0, start_column = 0, end_column = 0;		int cursor_position = -1;		CursorPlace cursor_place = CURSOR_NONE;		String source;		const char *get_name() const;		String get_debug_name() const;		bool can_precede_bin_op() const;		bool is_identifier() const;		bool is_node_name() const;		StringName get_identifier() const { return literal; }		Token(Type p_type) {			type = p_type;		}		Token() {}	};#ifdef TOOLS_ENABLED	struct CommentData {		String comment;		// true: Comment starts at beginning of line or after indentation.		// false: Inline comment (starts after some code).		bool new_line = false;		CommentData() {}		CommentData(const String &p_comment, bool p_new_line) {			comment = p_comment;			new_line = p_new_line;		}	};	virtual const HashMap<int, CommentData> &get_comments() const = 0;#endif // TOOLS_ENABLED	static String get_token_name(Token::Type p_token_type);#ifdef TOOLS_ENABLED	// This is a temporary solution, as Tokens are not able to store their position, only lines and columns.	
virtual int get_current_position() const { return 0; }	virtual String get_source_code() const { return ""; }#endif // TOOLS_ENABLED	virtual int get_cursor_line() const = 0;	virtual int get_cursor_column() const = 0;	virtual void set_cursor_position(int p_line, int p_column) = 0;	virtual void set_multiline_mode(bool p_state) = 0;	virtual bool is_past_cursor() const = 0;	virtual void push_expression_indented_block() = 0; // For lambdas, or blocks inside expressions.	virtual void pop_expression_indented_block() = 0; // For lambdas, or blocks inside expressions.	virtual bool is_text() = 0;	virtual Token scan() = 0;	virtual ~GDScriptTokenizer() {}};class GDScriptTokenizerText : public GDScriptTokenizer {	String source;	const char32_t *_source = nullptr;	const char32_t *_current = nullptr;	int line = -1, column = -1;	int cursor_line = -1, cursor_column = -1;	int tab_size = 4;	// Keep track of multichar tokens.	const char32_t *_start = nullptr;	int start_line = 0, start_column = 0;	// Info cache.	bool line_continuation = false; // Whether this line is a continuation of the previous, like when using '\'.	bool multiline_mode = false;	List<Token> error_stack;	bool pending_newline = false;	Token last_token;	Token last_newline;	int pending_indents = 0;	List<int> indent_stack;	List<List<int>> indent_stack_stack; // For lambdas, which require manipulating the indentation point.	List<char32_t> paren_stack;	char32_t indent_char = '\0';	int position = 0;	int length = 0;	Vector<int> continuation_lines;#ifdef DEBUG_ENABLED	Vector<String> keyword_list;#endif // DEBUG_ENABLED#ifdef TOOLS_ENABLED	HashMap<int, CommentData> comments;#endif // TOOLS_ENABLED	_FORCE_INLINE_ bool _is_at_end() { return position >= length; }	_FORCE_INLINE_ char32_t _peek(int p_offset = 0) { return position + p_offset >= 0 && position + p_offset < length ? 
_current[p_offset] : '\0'; }	int indent_level() const { return indent_stack.size(); }	bool has_error() const { return !error_stack.is_empty(); }	Token pop_error();	char32_t _advance();	String _get_indent_char_name(char32_t ch);	void _skip_whitespace();	void check_indent();#ifdef DEBUG_ENABLED	void make_keyword_list();#endif // DEBUG_ENABLED	Token make_error(const String &p_message);	void push_error(const String &p_message);	void push_error(const Token &p_error);	Token make_paren_error(char32_t p_paren);	Token make_token(Token::Type p_type);	Token make_literal(const Variant &p_literal);	Token make_identifier(const StringName &p_identifier);	Token check_vcs_marker(char32_t p_test, Token::Type p_double_type);	void push_paren(char32_t p_char);	bool pop_paren(char32_t p_expected);	void newline(bool p_make_token);	Token number();	Token potential_identifier();	Token string();	Token annotation();public:	void set_source_code(const String &p_source_code);	const Vector<int> &get_continuation_lines() const { return continuation_lines; }#ifdef TOOLS_ENABLED	virtual int get_current_position() const override { return position; }	virtual String get_source_code() const override { return source; }#endif // TOOLS_ENABLED	virtual int get_cursor_line() const override;	virtual int get_cursor_column() const override;	virtual void set_cursor_position(int p_line, int p_column) override;	virtual void set_multiline_mode(bool p_state) override;	virtual bool is_past_cursor() const override;	virtual void push_expression_indented_block() override; // For lambdas, or blocks inside expressions.	virtual void pop_expression_indented_block() override; // For lambdas, or blocks inside expressions.	virtual bool is_text() override { return true; }#ifdef TOOLS_ENABLED	virtual const HashMap<int, CommentData> &get_comments() const override {		return comments;	}#endif // TOOLS_ENABLED	virtual Token scan() override;	GDScriptTokenizerText();};
 |