2021-01-23 16:47:20 +02:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2021, Itamar S. <itamar8910@gmail.com>
|
|
|
|
*
|
2021-04-22 01:24:48 -07:00
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2021-01-23 16:47:20 +02:00
|
|
|
*/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "AK/NonnullRefPtr.h"
|
|
|
|
#include "AST.h"
|
2021-03-12 17:04:08 +02:00
|
|
|
#include "Preprocessor.h"
|
2021-03-12 15:53:07 +02:00
|
|
|
#include <AK/Noncopyable.h>
|
2021-01-23 16:47:20 +02:00
|
|
|
#include <LibCpp/Lexer.h>
|
|
|
|
|
|
|
|
namespace Cpp {
|
|
|
|
|
|
|
|
class Parser final {
|
2021-03-12 17:04:08 +02:00
|
|
|
AK_MAKE_NONCOPYABLE(Parser);
|
2021-03-12 15:53:07 +02:00
|
|
|
|
2021-01-23 16:47:20 +02:00
|
|
|
public:
|
2021-03-12 17:04:08 +02:00
|
|
|
explicit Parser(const StringView& program, const String& filename, Preprocessor::Definitions&& = {});
|
2021-01-23 16:47:20 +02:00
|
|
|
~Parser() = default;
|
|
|
|
|
|
|
|
NonnullRefPtr<TranslationUnit> parse();
|
|
|
|
bool eof() const;
|
|
|
|
|
|
|
|
RefPtr<ASTNode> eof_node() const;
|
|
|
|
RefPtr<ASTNode> node_at(Position) const;
|
2021-03-12 15:28:30 +02:00
|
|
|
Optional<size_t> index_of_node_at(Position) const;
|
2021-01-23 16:47:20 +02:00
|
|
|
Optional<Token> token_at(Position) const;
|
2021-03-12 15:53:07 +02:00
|
|
|
Optional<size_t> index_of_token_at(Position) const;
|
2021-01-23 16:47:20 +02:00
|
|
|
RefPtr<const TranslationUnit> root_node() const { return m_root_node; }
|
2021-03-12 15:53:07 +02:00
|
|
|
String text_of_node(const ASTNode&) const;
|
2021-02-10 21:48:08 +02:00
|
|
|
StringView text_of_token(const Cpp::Token& token) const;
|
2021-01-23 16:47:20 +02:00
|
|
|
void print_tokens() const;
|
2021-03-28 11:55:17 +03:00
|
|
|
const Vector<String>& errors() const { return m_state.errors; }
|
2021-05-07 14:46:11 +03:00
|
|
|
const Preprocessor::Definitions& preprocessor_definitions() const { return m_preprocessor_definitions; }
|
2021-01-23 16:47:20 +02:00
|
|
|
|
2021-03-13 10:37:23 +02:00
|
|
|
struct TokenAndPreprocessorDefinition {
|
|
|
|
Token token;
|
|
|
|
Preprocessor::DefinedValue preprocessor_value;
|
|
|
|
};
|
|
|
|
const Vector<TokenAndPreprocessorDefinition>& replaced_preprocessor_tokens() const { return m_replaced_preprocessor_tokens; }
|
|
|
|
|
2021-01-23 16:47:20 +02:00
|
|
|
private:
|
|
|
|
enum class DeclarationType {
|
|
|
|
Function,
|
|
|
|
Variable,
|
|
|
|
Enum,
|
2021-04-19 19:41:43 +03:00
|
|
|
Class,
|
2021-06-05 17:57:13 +03:00
|
|
|
Namespace,
|
2021-01-23 16:47:20 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
Optional<DeclarationType> match_declaration_in_translation_unit();
|
2021-06-05 17:57:13 +03:00
|
|
|
Optional<Parser::DeclarationType> match_class_member();
|
2021-01-23 16:47:20 +02:00
|
|
|
bool match_function_declaration();
|
|
|
|
bool match_comment();
|
|
|
|
bool match_preprocessor();
|
|
|
|
bool match_whitespace();
|
|
|
|
bool match_variable_declaration();
|
|
|
|
bool match_expression();
|
|
|
|
bool match_secondary_expression();
|
|
|
|
bool match_enum_declaration();
|
2021-04-19 19:41:43 +03:00
|
|
|
bool match_class_declaration();
|
2021-01-23 16:47:20 +02:00
|
|
|
bool match_literal();
|
|
|
|
bool match_unary_expression();
|
|
|
|
bool match_boolean_literal();
|
|
|
|
bool match_keyword(const String&);
|
|
|
|
bool match_block_statement();
|
2021-03-19 21:47:43 +02:00
|
|
|
bool match_namespace_declaration();
|
2021-03-28 11:55:17 +03:00
|
|
|
bool match_template_arguments();
|
2021-03-29 16:52:35 +03:00
|
|
|
bool match_name();
|
2021-03-31 22:21:31 +03:00
|
|
|
bool match_cpp_cast_expression();
|
2021-04-02 11:29:44 +03:00
|
|
|
bool match_c_style_cast_expression();
|
2021-04-02 10:49:12 +03:00
|
|
|
bool match_sizeof_expression();
|
2021-04-02 11:15:22 +03:00
|
|
|
bool match_braced_init_list();
|
2021-04-06 19:43:43 +03:00
|
|
|
bool match_type();
|
2021-06-06 21:30:53 +03:00
|
|
|
bool match_access_specifier();
|
2021-01-23 16:47:20 +02:00
|
|
|
|
|
|
|
Optional<NonnullRefPtrVector<Parameter>> parse_parameter_list(ASTNode& parent);
|
|
|
|
Optional<Token> consume_whitespace();
|
|
|
|
void consume_preprocessor();
|
|
|
|
|
|
|
|
NonnullRefPtr<Declaration> parse_declaration(ASTNode& parent, DeclarationType);
|
|
|
|
NonnullRefPtr<FunctionDeclaration> parse_function_declaration(ASTNode& parent);
|
|
|
|
NonnullRefPtr<FunctionDefinition> parse_function_definition(ASTNode& parent);
|
|
|
|
NonnullRefPtr<Statement> parse_statement(ASTNode& parent);
|
2021-03-28 11:55:17 +03:00
|
|
|
NonnullRefPtr<VariableDeclaration> parse_variable_declaration(ASTNode& parent, bool expect_semicolon = true);
|
2021-01-23 16:47:20 +02:00
|
|
|
NonnullRefPtr<Expression> parse_expression(ASTNode& parent);
|
|
|
|
NonnullRefPtr<Expression> parse_primary_expression(ASTNode& parent);
|
|
|
|
NonnullRefPtr<Expression> parse_secondary_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs);
|
|
|
|
NonnullRefPtr<FunctionCall> parse_function_call(ASTNode& parent);
|
|
|
|
NonnullRefPtr<StringLiteral> parse_string_literal(ASTNode& parent);
|
|
|
|
NonnullRefPtr<ReturnStatement> parse_return_statement(ASTNode& parent);
|
|
|
|
NonnullRefPtr<EnumDeclaration> parse_enum_declaration(ASTNode& parent);
|
2021-06-05 17:57:13 +03:00
|
|
|
NonnullRefPtr<StructOrClassDeclaration> parse_class_declaration(ASTNode& parent);
|
2021-01-23 16:47:20 +02:00
|
|
|
NonnullRefPtr<Expression> parse_literal(ASTNode& parent);
|
|
|
|
NonnullRefPtr<UnaryExpression> parse_unary_expression(ASTNode& parent);
|
|
|
|
NonnullRefPtr<BooleanLiteral> parse_boolean_literal(ASTNode& parent);
|
|
|
|
NonnullRefPtr<Type> parse_type(ASTNode& parent);
|
|
|
|
NonnullRefPtr<BinaryExpression> parse_binary_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs, BinaryOp);
|
|
|
|
NonnullRefPtr<AssignmentExpression> parse_assignment_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs, AssignmentOp);
|
|
|
|
NonnullRefPtr<ForStatement> parse_for_statement(ASTNode& parent);
|
|
|
|
NonnullRefPtr<BlockStatement> parse_block_statement(ASTNode& parent);
|
|
|
|
NonnullRefPtr<Comment> parse_comment(ASTNode& parent);
|
2021-01-29 12:03:02 +02:00
|
|
|
NonnullRefPtr<IfStatement> parse_if_statement(ASTNode& parent);
|
2021-03-19 21:47:43 +02:00
|
|
|
NonnullRefPtr<NamespaceDeclaration> parse_namespace_declaration(ASTNode& parent, bool is_nested_namespace = false);
|
|
|
|
NonnullRefPtrVector<Declaration> parse_declarations_in_translation_unit(ASTNode& parent);
|
|
|
|
RefPtr<Declaration> parse_single_declaration_in_translation_unit(ASTNode& parent);
|
2021-03-28 11:55:17 +03:00
|
|
|
NonnullRefPtrVector<Type> parse_template_arguments(ASTNode& parent);
|
2021-03-29 16:52:35 +03:00
|
|
|
NonnullRefPtr<Name> parse_name(ASTNode& parent);
|
2021-03-31 22:21:31 +03:00
|
|
|
NonnullRefPtr<CppCastExpression> parse_cpp_cast_expression(ASTNode& parent);
|
2021-04-02 10:49:12 +03:00
|
|
|
NonnullRefPtr<SizeofExpression> parse_sizeof_expression(ASTNode& parent);
|
2021-04-02 11:15:22 +03:00
|
|
|
NonnullRefPtr<BracedInitList> parse_braced_init_list(ASTNode& parent);
|
2021-04-02 11:29:44 +03:00
|
|
|
NonnullRefPtr<CStyleCastExpression> parse_c_style_cast_expression(ASTNode& parent);
|
2021-06-05 17:57:13 +03:00
|
|
|
NonnullRefPtrVector<Declaration> parse_class_members(ASTNode& parent);
|
2021-03-19 21:47:43 +02:00
|
|
|
|
2021-01-23 16:47:20 +02:00
|
|
|
bool match(Token::Type);
|
|
|
|
Token consume(Token::Type);
|
|
|
|
Token consume();
|
|
|
|
Token consume_keyword(const String&);
|
2021-03-01 22:33:46 +02:00
|
|
|
Token peek(size_t offset = 0) const;
|
2021-01-23 16:47:20 +02:00
|
|
|
Optional<Token> peek(Token::Type) const;
|
|
|
|
Position position() const;
|
2021-03-12 15:53:07 +02:00
|
|
|
String text_in_range(Position start, Position end) const;
|
2021-01-23 16:47:20 +02:00
|
|
|
|
|
|
|
void save_state();
|
|
|
|
void load_state();
|
|
|
|
|
|
|
|
struct State {
|
|
|
|
size_t token_index { 0 };
|
2021-03-28 11:55:17 +03:00
|
|
|
Vector<String> errors;
|
2021-04-02 13:57:52 +03:00
|
|
|
NonnullRefPtrVector<ASTNode> nodes;
|
2021-01-23 16:47:20 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
void error(StringView message = {});
|
|
|
|
|
|
|
|
template<class T, class... Args>
|
|
|
|
NonnullRefPtr<T>
|
|
|
|
create_ast_node(ASTNode& parent, const Position& start, Optional<Position> end, Args&&... args)
|
|
|
|
{
|
2021-04-23 16:46:57 +02:00
|
|
|
auto node = adopt_ref(*new T(&parent, start, end, m_filename, forward<Args>(args)...));
|
2021-04-06 19:43:43 +03:00
|
|
|
if (!parent.is_dummy_node()) {
|
2021-04-02 13:57:52 +03:00
|
|
|
m_state.nodes.append(node);
|
|
|
|
}
|
2021-01-23 16:47:20 +02:00
|
|
|
return node;
|
|
|
|
}
|
|
|
|
|
|
|
|
NonnullRefPtr<TranslationUnit>
|
|
|
|
create_root_ast_node(const Position& start, Position end)
|
|
|
|
{
|
2021-04-23 16:46:57 +02:00
|
|
|
auto node = adopt_ref(*new TranslationUnit(nullptr, start, end, m_filename));
|
2021-04-02 13:57:52 +03:00
|
|
|
m_state.nodes.append(node);
|
2021-01-23 16:47:20 +02:00
|
|
|
m_root_node = node;
|
|
|
|
return node;
|
|
|
|
}
|
|
|
|
|
2021-04-02 13:57:52 +03:00
|
|
|
DummyAstNode& get_dummy_node()
|
|
|
|
{
|
2021-04-23 16:46:57 +02:00
|
|
|
static NonnullRefPtr<DummyAstNode> dummy = adopt_ref(*new DummyAstNode(nullptr, {}, {}, {}));
|
2021-04-02 13:57:52 +03:00
|
|
|
return dummy;
|
|
|
|
}
|
|
|
|
|
2021-03-12 17:04:08 +02:00
|
|
|
bool match_attribute_specification();
|
|
|
|
void consume_attribute_specification();
|
2021-06-06 21:30:53 +03:00
|
|
|
void consume_access_specifier();
|
2021-03-12 17:04:08 +02:00
|
|
|
bool match_ellipsis();
|
2021-03-12 15:56:30 +02:00
|
|
|
void initialize_program_tokens(const StringView& program);
|
2021-03-12 17:04:08 +02:00
|
|
|
void add_tokens_for_preprocessor(Token& replaced_token, Preprocessor::DefinedValue&);
|
|
|
|
Vector<StringView> parse_type_qualifiers();
|
2021-03-27 19:19:53 +03:00
|
|
|
Vector<StringView> parse_function_qualifiers();
|
2021-03-12 17:04:08 +02:00
|
|
|
|
2021-05-07 14:46:11 +03:00
|
|
|
Preprocessor::Definitions m_preprocessor_definitions;
|
2021-02-20 12:23:53 +02:00
|
|
|
String m_filename;
|
2021-01-23 16:47:20 +02:00
|
|
|
Vector<Token> m_tokens;
|
|
|
|
State m_state;
|
|
|
|
Vector<State> m_saved_states;
|
|
|
|
RefPtr<TranslationUnit> m_root_node;
|
2021-03-13 10:37:23 +02:00
|
|
|
|
|
|
|
Vector<TokenAndPreprocessorDefinition> m_replaced_preprocessor_tokens;
|
2021-01-23 16:47:20 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
}
|