| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | /*************************************************************************/ | 
					
						
							|  |  |  | /*  gd_tokenizer.h                                                       */ | 
					
						
							|  |  |  | /*************************************************************************/ | 
					
						
							|  |  |  | /*                       This file is part of:                           */ | 
					
						
							|  |  |  | /*                           GODOT ENGINE                                */ | 
					
						
							|  |  |  | /*                    http://www.godotengine.org                         */ | 
					
						
							|  |  |  | /*************************************************************************/ | 
					
						
							| 
									
										
										
										
											2016-01-01 11:50:53 -02:00
										 |  |  | /* Copyright (c) 2007-2016 Juan Linietsky, Ariel Manzur.                 */ | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | /*                                                                       */ | 
					
						
							|  |  |  | /* Permission is hereby granted, free of charge, to any person obtaining */ | 
					
						
							|  |  |  | /* a copy of this software and associated documentation files (the       */ | 
					
						
							|  |  |  | /* "Software"), to deal in the Software without restriction, including   */ | 
					
						
							|  |  |  | /* without limitation the rights to use, copy, modify, merge, publish,   */ | 
					
						
							|  |  |  | /* distribute, sublicense, and/or sell copies of the Software, and to    */ | 
					
						
							|  |  |  | /* permit persons to whom the Software is furnished to do so, subject to */ | 
					
						
							|  |  |  | /* the following conditions:                                             */ | 
					
						
							|  |  |  | /*                                                                       */ | 
					
						
							|  |  |  | /* The above copyright notice and this permission notice shall be        */ | 
					
						
							|  |  |  | /* included in all copies or substantial portions of the Software.       */ | 
					
						
							|  |  |  | /*                                                                       */ | 
					
						
							|  |  |  | /* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,       */ | 
					
						
							|  |  |  | /* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF    */ | 
					
						
							|  |  |  | /* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*/ | 
					
						
							|  |  |  | /* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY  */ | 
					
						
							|  |  |  | /* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,  */ | 
					
						
							|  |  |  | /* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE     */ | 
					
						
							|  |  |  | /* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.                */ | 
					
						
							|  |  |  | /*************************************************************************/ | 
					
						
							|  |  |  | #ifndef GD_TOKENIZER_H
 | 
					
						
							|  |  |  | #define GD_TOKENIZER_H
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "ustring.h"
 | 
					
						
							|  |  |  | #include "variant.h"
 | 
					
						
							|  |  |  | #include "string_db.h"
 | 
					
						
							|  |  |  | #include "gd_functions.h"
 | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | #include "vmap.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | class GDTokenizer { | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	enum Token { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		TK_EMPTY, | 
					
						
							|  |  |  | 		TK_IDENTIFIER, | 
					
						
							|  |  |  | 		TK_CONSTANT, | 
					
						
							|  |  |  | 		TK_SELF, | 
					
						
							|  |  |  | 		TK_BUILT_IN_TYPE, | 
					
						
							|  |  |  | 		TK_BUILT_IN_FUNC, | 
					
						
							|  |  |  | 		TK_OP_IN, | 
					
						
							|  |  |  | 		TK_OP_EQUAL, | 
					
						
							|  |  |  | 		TK_OP_NOT_EQUAL, | 
					
						
							|  |  |  | 		TK_OP_LESS, | 
					
						
							|  |  |  | 		TK_OP_LESS_EQUAL, | 
					
						
							|  |  |  | 		TK_OP_GREATER, | 
					
						
							|  |  |  | 		TK_OP_GREATER_EQUAL, | 
					
						
							|  |  |  | 		TK_OP_AND, | 
					
						
							|  |  |  | 		TK_OP_OR, | 
					
						
							|  |  |  | 		TK_OP_NOT, | 
					
						
							|  |  |  | 		TK_OP_ADD, | 
					
						
							|  |  |  | 		TK_OP_SUB, | 
					
						
							|  |  |  | 		TK_OP_MUL, | 
					
						
							|  |  |  | 		TK_OP_DIV, | 
					
						
							|  |  |  | 		TK_OP_MOD, | 
					
						
							|  |  |  | 		TK_OP_SHIFT_LEFT, | 
					
						
							|  |  |  | 		TK_OP_SHIFT_RIGHT, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_ADD, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_SUB, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_MUL, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_DIV, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_MOD, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_SHIFT_LEFT, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_SHIFT_RIGHT, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_BIT_AND, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_BIT_OR, | 
					
						
							|  |  |  | 		TK_OP_ASSIGN_BIT_XOR, | 
					
						
							|  |  |  | 		TK_OP_BIT_AND, | 
					
						
							|  |  |  | 		TK_OP_BIT_OR, | 
					
						
							|  |  |  | 		TK_OP_BIT_XOR, | 
					
						
							|  |  |  | 		TK_OP_BIT_INVERT, | 
					
						
							|  |  |  | 		//TK_OP_PLUS_PLUS,
 | 
					
						
							|  |  |  | 		//TK_OP_MINUS_MINUS,
 | 
					
						
							|  |  |  | 		TK_CF_IF, | 
					
						
							|  |  |  | 		TK_CF_ELIF, | 
					
						
							|  |  |  | 		TK_CF_ELSE, | 
					
						
							|  |  |  | 		TK_CF_FOR, | 
					
						
							|  |  |  | 		TK_CF_DO, | 
					
						
							|  |  |  | 		TK_CF_WHILE, | 
					
						
							|  |  |  | 		TK_CF_SWITCH, | 
					
						
							|  |  |  | 		TK_CF_CASE, | 
					
						
							|  |  |  | 		TK_CF_BREAK, | 
					
						
							|  |  |  | 		TK_CF_CONTINUE, | 
					
						
							|  |  |  | 		TK_CF_PASS, | 
					
						
							|  |  |  | 		TK_CF_RETURN, | 
					
						
							|  |  |  | 		TK_PR_FUNCTION, | 
					
						
							|  |  |  | 		TK_PR_CLASS, | 
					
						
							|  |  |  | 		TK_PR_EXTENDS, | 
					
						
							| 
									
										
										
										
											2015-12-28 19:31:52 -03:00
										 |  |  | 		TK_PR_ONREADY, | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 		TK_PR_TOOL, | 
					
						
							|  |  |  | 		TK_PR_STATIC, | 
					
						
							|  |  |  | 		TK_PR_EXPORT, | 
					
						
							| 
									
										
										
										
											2014-10-27 22:54:32 -03:00
										 |  |  | 		TK_PR_SETGET, | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 		TK_PR_CONST, | 
					
						
							|  |  |  | 		TK_PR_VAR, | 
					
						
							|  |  |  | 		TK_PR_PRELOAD, | 
					
						
							|  |  |  | 		TK_PR_ASSERT, | 
					
						
							| 
									
										
										
										
											2014-09-15 11:33:30 -03:00
										 |  |  | 		TK_PR_YIELD, | 
					
						
							| 
									
										
										
										
											2015-06-24 13:29:23 -03:00
										 |  |  | 		TK_PR_SIGNAL, | 
					
						
							| 
									
										
										
										
											2015-12-29 12:11:21 -03:00
										 |  |  | 		TK_PR_BREAKPOINT, | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 		TK_BRACKET_OPEN, | 
					
						
							|  |  |  | 		TK_BRACKET_CLOSE, | 
					
						
							|  |  |  | 		TK_CURLY_BRACKET_OPEN, | 
					
						
							|  |  |  | 		TK_CURLY_BRACKET_CLOSE, | 
					
						
							|  |  |  | 		TK_PARENTHESIS_OPEN, | 
					
						
							|  |  |  | 		TK_PARENTHESIS_CLOSE, | 
					
						
							|  |  |  | 		TK_COMMA, | 
					
						
							|  |  |  | 		TK_SEMICOLON, | 
					
						
							|  |  |  | 		TK_PERIOD, | 
					
						
							|  |  |  | 		TK_QUESTION_MARK, | 
					
						
							|  |  |  | 		TK_COLON, | 
					
						
							|  |  |  | 		TK_NEWLINE, | 
					
						
							| 
									
										
										
										
											2016-01-02 17:56:45 -03:00
										 |  |  | 		TK_CONST_PI, | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 		TK_ERROR, | 
					
						
							|  |  |  | 		TK_EOF, | 
					
						
							| 
									
										
										
										
											2014-12-16 22:31:57 -03:00
										 |  |  | 		TK_CURSOR, //used for code completion
 | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 		TK_MAX | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | protected: | 
					
						
							| 
									
										
										
										
											2014-11-02 11:31:01 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	enum StringMode { | 
					
						
							|  |  |  | 		STRING_SINGLE_QUOTE, | 
					
						
							|  |  |  | 		STRING_DOUBLE_QUOTE, | 
					
						
							|  |  |  | 		STRING_MULTILINE | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | 	static const char* token_names[TK_MAX]; | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 	static const char *get_token_name(Token p_token); | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | 	virtual const Variant& get_token_constant(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual Token get_token(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual StringName get_token_identifier(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual GDFunctions::Function get_token_built_in_func(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual Variant::Type get_token_type(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual int get_token_line(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual int get_token_column(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual int get_token_line_indent(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual String get_token_error(int p_offset=0) const=0; | 
					
						
							|  |  |  | 	virtual void advance(int p_amount=1)=0; | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | 	virtual ~GDTokenizer(){}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class GDTokenizerText : public GDTokenizer { | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	enum { | 
					
						
							|  |  |  | 		MAX_LOOKAHEAD=4, | 
					
						
							|  |  |  | 		TK_RB_SIZE=MAX_LOOKAHEAD*2+1 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	struct TokenData { | 
					
						
							|  |  |  | 		Token type; | 
					
						
							|  |  |  | 		StringName identifier; //for identifier types
 | 
					
						
							|  |  |  | 		Variant constant; //for constant types
 | 
					
						
							|  |  |  | 		union { | 
					
						
							|  |  |  | 			Variant::Type vtype; //for type types
 | 
					
						
							|  |  |  | 			GDFunctions::Function func; //function for built in functions
 | 
					
						
							|  |  |  | 		}; | 
					
						
							|  |  |  | 		int line,col; | 
					
						
							|  |  |  | 		TokenData() { type = TK_EMPTY; line=col=0; vtype=Variant::NIL; } | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	void _make_token(Token p_type); | 
					
						
							|  |  |  | 	void _make_newline(int p_spaces=0); | 
					
						
							|  |  |  | 	void _make_identifier(const StringName& p_identifier); | 
					
						
							|  |  |  | 	void _make_built_in_func(GDFunctions::Function p_func); | 
					
						
							|  |  |  | 	void _make_constant(const Variant& p_constant); | 
					
						
							|  |  |  | 	void _make_type(const Variant::Type& p_type); | 
					
						
							|  |  |  | 	void _make_error(const String& p_error); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	String code; | 
					
						
							|  |  |  | 	int len; | 
					
						
							|  |  |  | 	int code_pos; | 
					
						
							|  |  |  | 	const CharType *_code; | 
					
						
							|  |  |  | 	int line; | 
					
						
							|  |  |  | 	int column; | 
					
						
							|  |  |  | 	TokenData tk_rb[TK_RB_SIZE*2+1]; | 
					
						
							|  |  |  | 	int tk_rb_pos; | 
					
						
							|  |  |  | 	String last_error; | 
					
						
							|  |  |  | 	bool error_flag; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	void _advance(); | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	void set_code(const String& p_code); | 
					
						
							| 
									
										
										
										
											2014-02-25 09:31:47 -03:00
										 |  |  | 	virtual Token get_token(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual StringName get_token_identifier(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual GDFunctions::Function get_token_built_in_func(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual Variant::Type get_token_type(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_line(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_column(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_line_indent(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual const Variant& get_token_constant(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual String get_token_error(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual void advance(int p_amount=1); | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class GDTokenizerBuffer : public GDTokenizer { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	enum { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		TOKEN_BYTE_MASK=0x80, | 
					
						
							|  |  |  | 		TOKEN_BITS=8, | 
					
						
							|  |  |  | 		TOKEN_MASK=(1<<TOKEN_BITS)-1, | 
					
						
							|  |  |  | 		TOKEN_LINE_BITS=24, | 
					
						
							|  |  |  | 		TOKEN_LINE_MASK=(1<<TOKEN_LINE_BITS)-1, | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	Vector<StringName> identifiers; | 
					
						
							|  |  |  | 	Vector<Variant> constants; | 
					
						
							|  |  |  | 	VMap<uint32_t,uint32_t> lines; | 
					
						
							|  |  |  | 	Vector<uint32_t> tokens; | 
					
						
							|  |  |  | 	Variant nil; | 
					
						
							|  |  |  | 	int token; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	Error set_code_buffer(const Vector<uint8_t> & p_buffer); | 
					
						
							|  |  |  | 	static Vector<uint8_t> parse_code_string(const String& p_code); | 
					
						
							|  |  |  | 	virtual Token get_token(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual StringName get_token_identifier(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual GDFunctions::Function get_token_built_in_func(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual Variant::Type get_token_type(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_line(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_column(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual int get_token_line_indent(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual const Variant& get_token_constant(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual String get_token_error(int p_offset=0) const; | 
					
						
							|  |  |  | 	virtual void advance(int p_amount=1); | 
					
						
							|  |  |  | 	GDTokenizerBuffer(); | 
					
						
							| 
									
										
										
										
											2014-02-09 22:10:30 -03:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif // GD_TOKENIZER_H
 |