// Parser.h
  1. /*
  2. * Copyright (c) 2021, Itamar S. <itamar8910@gmail.com>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #pragma once
  7. #include "AK/NonnullRefPtr.h"
  8. #include "AST.h"
  9. #include "Preprocessor.h"
  10. #include <AK/Noncopyable.h>
  11. #include <LibCpp/Lexer.h>
  12. namespace Cpp {
  13. class Parser final {
  14. AK_MAKE_NONCOPYABLE(Parser);
  15. public:
  16. explicit Parser(const StringView& program, const String& filename, Preprocessor::Definitions&& = {});
  17. ~Parser() = default;
  18. NonnullRefPtr<TranslationUnit> parse();
  19. bool eof() const;
  20. RefPtr<ASTNode> eof_node() const;
  21. RefPtr<ASTNode> node_at(Position) const;
  22. Optional<size_t> index_of_node_at(Position) const;
  23. Optional<Token> token_at(Position) const;
  24. Optional<size_t> index_of_token_at(Position) const;
  25. RefPtr<const TranslationUnit> root_node() const { return m_root_node; }
  26. String text_of_node(const ASTNode&) const;
  27. StringView text_of_token(const Cpp::Token& token) const;
  28. void print_tokens() const;
  29. const Vector<String>& errors() const { return m_state.errors; }
  30. const Preprocessor::Definitions& preprocessor_definitions() const { return m_preprocessor_definitions; }
  31. struct TodoEntry {
  32. String content;
  33. String filename;
  34. size_t line { 0 };
  35. size_t column { 0 };
  36. };
  37. Vector<TodoEntry> get_todo_entries() const;
  38. struct TokenAndPreprocessorDefinition {
  39. Token token;
  40. Preprocessor::DefinedValue preprocessor_value;
  41. };
  42. const Vector<TokenAndPreprocessorDefinition>& replaced_preprocessor_tokens() const { return m_replaced_preprocessor_tokens; }
  43. Vector<Token> tokens_in_range(Position start, Position end) const;
  44. private:
  45. enum class DeclarationType {
  46. Function,
  47. Variable,
  48. Enum,
  49. Class,
  50. Namespace,
  51. Constructor,
  52. Destructor,
  53. };
  54. Optional<DeclarationType> match_declaration_in_translation_unit();
  55. Optional<Parser::DeclarationType> match_class_member(const StringView& class_name);
  56. bool match_function_declaration();
  57. bool match_comment();
  58. bool match_preprocessor();
  59. bool match_whitespace();
  60. bool match_variable_declaration();
  61. bool match_expression();
  62. bool match_secondary_expression();
  63. bool match_enum_declaration();
  64. bool match_class_declaration();
  65. bool match_literal();
  66. bool match_unary_expression();
  67. bool match_boolean_literal();
  68. bool match_keyword(const String&);
  69. bool match_block_statement();
  70. bool match_namespace_declaration();
  71. bool match_template_arguments();
  72. bool match_name();
  73. bool match_cpp_cast_expression();
  74. bool match_c_style_cast_expression();
  75. bool match_sizeof_expression();
  76. bool match_braced_init_list();
  77. bool match_type();
  78. bool match_named_type();
  79. bool match_access_specifier();
  80. bool match_constructor(const StringView& class_name);
  81. bool match_destructor(const StringView& class_name);
  82. Optional<NonnullRefPtrVector<Parameter>> parse_parameter_list(ASTNode& parent);
  83. Optional<Token> consume_whitespace();
  84. void consume_preprocessor();
  85. NonnullRefPtr<Declaration> parse_declaration(ASTNode& parent, DeclarationType);
  86. NonnullRefPtr<FunctionDeclaration> parse_function_declaration(ASTNode& parent);
  87. NonnullRefPtr<FunctionDefinition> parse_function_definition(ASTNode& parent);
  88. NonnullRefPtr<Statement> parse_statement(ASTNode& parent);
  89. NonnullRefPtr<VariableDeclaration> parse_variable_declaration(ASTNode& parent, bool expect_semicolon = true);
  90. NonnullRefPtr<Expression> parse_expression(ASTNode& parent);
  91. NonnullRefPtr<Expression> parse_primary_expression(ASTNode& parent);
  92. NonnullRefPtr<Expression> parse_secondary_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs);
  93. NonnullRefPtr<FunctionCall> parse_function_call(ASTNode& parent);
  94. NonnullRefPtr<StringLiteral> parse_string_literal(ASTNode& parent);
  95. NonnullRefPtr<ReturnStatement> parse_return_statement(ASTNode& parent);
  96. NonnullRefPtr<EnumDeclaration> parse_enum_declaration(ASTNode& parent);
  97. NonnullRefPtr<StructOrClassDeclaration> parse_class_declaration(ASTNode& parent);
  98. NonnullRefPtr<Expression> parse_literal(ASTNode& parent);
  99. NonnullRefPtr<UnaryExpression> parse_unary_expression(ASTNode& parent);
  100. NonnullRefPtr<BooleanLiteral> parse_boolean_literal(ASTNode& parent);
  101. NonnullRefPtr<Type> parse_type(ASTNode& parent);
  102. NonnullRefPtr<NamedType> parse_named_type(ASTNode& parent);
  103. NonnullRefPtr<BinaryExpression> parse_binary_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs, BinaryOp);
  104. NonnullRefPtr<AssignmentExpression> parse_assignment_expression(ASTNode& parent, NonnullRefPtr<Expression> lhs, AssignmentOp);
  105. NonnullRefPtr<ForStatement> parse_for_statement(ASTNode& parent);
  106. NonnullRefPtr<BlockStatement> parse_block_statement(ASTNode& parent);
  107. NonnullRefPtr<Comment> parse_comment(ASTNode& parent);
  108. NonnullRefPtr<IfStatement> parse_if_statement(ASTNode& parent);
  109. NonnullRefPtr<NamespaceDeclaration> parse_namespace_declaration(ASTNode& parent, bool is_nested_namespace = false);
  110. NonnullRefPtrVector<Declaration> parse_declarations_in_translation_unit(ASTNode& parent);
  111. RefPtr<Declaration> parse_single_declaration_in_translation_unit(ASTNode& parent);
  112. NonnullRefPtrVector<Type> parse_template_arguments(ASTNode& parent);
  113. NonnullRefPtr<Name> parse_name(ASTNode& parent);
  114. NonnullRefPtr<CppCastExpression> parse_cpp_cast_expression(ASTNode& parent);
  115. NonnullRefPtr<SizeofExpression> parse_sizeof_expression(ASTNode& parent);
  116. NonnullRefPtr<BracedInitList> parse_braced_init_list(ASTNode& parent);
  117. NonnullRefPtr<CStyleCastExpression> parse_c_style_cast_expression(ASTNode& parent);
  118. NonnullRefPtrVector<Declaration> parse_class_members(StructOrClassDeclaration& parent);
  119. NonnullRefPtr<Constructor> parse_constructor(ASTNode& parent);
  120. NonnullRefPtr<Destructor> parse_destructor(ASTNode& parent);
  121. bool match(Token::Type);
  122. Token consume(Token::Type);
  123. Token consume();
  124. Token consume_keyword(const String&);
  125. Token peek(size_t offset = 0) const;
  126. Optional<Token> peek(Token::Type) const;
  127. Position position() const;
  128. String text_in_range(Position start, Position end) const;
  129. void save_state();
  130. void load_state();
  131. struct State {
  132. size_t token_index { 0 };
  133. Vector<String> errors;
  134. NonnullRefPtrVector<ASTNode> nodes;
  135. };
  136. void error(StringView message = {});
  137. template<class T, class... Args>
  138. NonnullRefPtr<T>
  139. create_ast_node(ASTNode& parent, const Position& start, Optional<Position> end, Args&&... args)
  140. {
  141. auto node = adopt_ref(*new T(&parent, start, end, m_filename, forward<Args>(args)...));
  142. if (!parent.is_dummy_node()) {
  143. m_state.nodes.append(node);
  144. }
  145. return node;
  146. }
  147. NonnullRefPtr<TranslationUnit>
  148. create_root_ast_node(const Position& start, Position end)
  149. {
  150. auto node = adopt_ref(*new TranslationUnit(nullptr, start, end, m_filename));
  151. m_state.nodes.append(node);
  152. m_root_node = node;
  153. return node;
  154. }
  155. DummyAstNode& get_dummy_node()
  156. {
  157. static NonnullRefPtr<DummyAstNode> dummy = adopt_ref(*new DummyAstNode(nullptr, {}, {}, {}));
  158. return dummy;
  159. }
  160. bool match_attribute_specification();
  161. void consume_attribute_specification();
  162. void consume_access_specifier();
  163. bool match_ellipsis();
  164. void initialize_program_tokens(const StringView& program);
  165. void add_tokens_for_preprocessor(Token& replaced_token, Preprocessor::DefinedValue&);
  166. Vector<StringView> parse_type_qualifiers();
  167. Vector<StringView> parse_function_qualifiers();
  168. enum class CtorOrDtor {
  169. Ctor,
  170. Dtor,
  171. };
  172. void parse_constructor_or_destructor_impl(FunctionDeclaration&, CtorOrDtor);
  173. Preprocessor::Definitions m_preprocessor_definitions;
  174. String m_filename;
  175. Vector<Token> m_tokens;
  176. State m_state;
  177. Vector<State> m_saved_states;
  178. RefPtr<TranslationUnit> m_root_node;
  179. Vector<TokenAndPreprocessorDefinition> m_replaced_preprocessor_tokens;
  180. };
  181. }