TextParser.cpp 25 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770
  1. /*
  2. * Copyright (c) 2023, Dan Klishch <danilklishch@gmail.com>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/ScopeGuard.h>
  7. #include "Parser/SpecParser.h"
  8. #include "Parser/TextParser.h"
  9. namespace JSSpecCompiler {
  10. void TextParser::save_error(Variant<TokenType, StringView, CustomMessage>&& expected)
  11. {
  12. if (m_max_parsed_tokens > m_next_token_index)
  13. return;
  14. if (m_max_parsed_tokens < m_next_token_index)
  15. m_suitable_continuations.clear();
  16. m_max_parsed_tokens = m_next_token_index;
  17. m_suitable_continuations.append(move(expected));
  18. }
  19. void TextParser::retreat()
  20. {
  21. --m_next_token_index;
  22. }
  23. auto TextParser::rollback_point()
  24. {
  25. return ArmedScopeGuard {
  26. [this, index = this->m_next_token_index] {
  27. m_next_token_index = index;
  28. }
  29. };
  30. }
  31. Optional<Token> TextParser::peek_token()
  32. {
  33. if (m_next_token_index == m_tokens.size())
  34. return {};
  35. return m_tokens[m_next_token_index];
  36. }
  37. Optional<Token> TextParser::consume_token()
  38. {
  39. auto result = peek_token();
  40. if (result.has_value())
  41. ++m_next_token_index;
  42. return result;
  43. }
  44. TextParseErrorOr<Token> TextParser::consume_token_with_one_of_types(std::initializer_list<TokenType> types)
  45. {
  46. auto token = peek_token();
  47. if (token.has_value()) {
  48. for (TokenType type : types) {
  49. if (token->type == type) {
  50. (void)consume_token();
  51. return *token;
  52. } else {
  53. save_error(type);
  54. }
  55. }
  56. } else {
  57. for (TokenType type : types)
  58. save_error(type);
  59. }
  60. return TextParseError {};
  61. }
  62. TextParseErrorOr<Token> TextParser::consume_token_with_type(TokenType type)
  63. {
  64. return consume_token_with_one_of_types({ type });
  65. }
  66. TextParseErrorOr<void> TextParser::consume_token(TokenType type, StringView data)
  67. {
  68. auto token = consume_token();
  69. if (!token.has_value() || token->type != type || !token->data.equals_ignoring_ascii_case(data)) {
  70. retreat();
  71. save_error(data);
  72. return TextParseError {};
  73. }
  74. return {};
  75. }
  76. TextParseErrorOr<void> TextParser::consume_word(StringView word)
  77. {
  78. auto token = consume_token();
  79. if (!token.has_value() || token->type != TokenType::Word || !token->data.equals_ignoring_ascii_case(word)) {
  80. retreat();
  81. save_error(word);
  82. return TextParseError {};
  83. }
  84. return {};
  85. }
  86. TextParseErrorOr<void> TextParser::consume_words(std::initializer_list<StringView> words)
  87. {
  88. for (auto word : words)
  89. TRY(consume_word(word));
  90. return {};
  91. }
  92. bool TextParser::is_eof() const
  93. {
  94. return m_next_token_index == m_tokens.size();
  95. }
  96. TextParseErrorOr<void> TextParser::expect_eof()
  97. {
  98. if (!is_eof()) {
  99. save_error(CustomMessage { "EOF"sv });
  100. return TextParseError {};
  101. }
  102. return {};
  103. }
  104. // <record_initialization> :== (the)? <record_name> { (<name>: <value>,)* }
  105. TextParseErrorOr<Tree> TextParser::parse_record_direct_list_initialization()
  106. {
  107. auto rollback = rollback_point();
  108. (void)consume_word("the"sv);
  109. auto identifier = TRY(consume_token_with_type(TokenType::Identifier));
  110. TRY(consume_token_with_type(TokenType::BraceOpen));
  111. Vector<RecordDirectListInitialization::Argument> arguments;
  112. while (true) {
  113. auto name = TRY(consume_token_with_one_of_types({ TokenType::Identifier, TokenType::BraceClose }));
  114. if (name.is_bracket()) {
  115. break;
  116. } else {
  117. TRY(consume_token_with_type(TokenType::Colon));
  118. auto value = TRY(parse_expression());
  119. (void)consume_token_with_type(TokenType::Comma);
  120. arguments.append({ make_ref_counted<UnresolvedReference>(name.data), value });
  121. }
  122. }
  123. rollback.disarm();
  124. return make_ref_counted<RecordDirectListInitialization>(
  125. make_ref_counted<UnresolvedReference>(identifier.data), move(arguments));
  126. }
  127. // <function_arguments> :== '(' (<expr> (, <expr>)* )? ')'
  128. TextParseErrorOr<Vector<Tree>> TextParser::parse_function_arguments()
  129. {
  130. auto rollback = rollback_point();
  131. TRY(consume_token_with_type(TokenType::ParenOpen));
  132. if (!consume_token_with_type(TokenType::ParenClose).is_error()) {
  133. rollback.disarm();
  134. return Vector<Tree> {};
  135. }
  136. Vector<Tree> arguments;
  137. while (true) {
  138. arguments.append(TRY(parse_expression()));
  139. auto token = TRY(consume_token_with_one_of_types({ TokenType::ParenClose, TokenType::Comma }));
  140. if (token.type == TokenType::ParenClose)
  141. break;
  142. }
  143. rollback.disarm();
  144. return arguments;
  145. }
  146. // <list_initialization> :== « (<expr> (, <expr>)*)? »
  147. TextParseErrorOr<Tree> TextParser::parse_list_initialization()
  148. {
  149. auto rollback = rollback_point();
  150. TRY(consume_token_with_type(TokenType::ListStart));
  151. if (!consume_token_with_type(TokenType::ListEnd).is_error()) {
  152. rollback.disarm();
  153. return make_ref_counted<List>(Vector<Tree> {});
  154. }
  155. Vector<Tree> elements;
  156. while (true) {
  157. elements.append(TRY(parse_expression()));
  158. auto token = TRY(consume_token_with_one_of_types({ TokenType::ListEnd, TokenType::Comma }));
  159. if (token.type == TokenType::ListEnd)
  160. break;
  161. }
  162. rollback.disarm();
  163. return make_ref_counted<List>(move(elements));
  164. }
  165. TextParseErrorOr<Tree> TextParser::parse_the_this_value()
  166. {
  167. auto rollback = rollback_point();
  168. TRY(consume_word("the"sv));
  169. TRY(consume_token(TokenType::WellKnownValue, "this"sv));
  170. TRY(consume_word("value"sv));
  171. rollback.disarm();
  172. return make_ref_counted<WellKnownNode>(WellKnownNode::Type::This);
  173. }
  174. // <value> :== <identifier> | <well_known_value> | <enumerator> | <number> | <string> | <list_initialization> | <record_initialization>
  175. TextParseErrorOr<Tree> TextParser::parse_value()
  176. {
  177. if (auto identifier = consume_token_with_type(TokenType::Identifier); !identifier.is_error())
  178. return make_ref_counted<UnresolvedReference>(identifier.release_value().data);
  179. if (auto well_known_value = consume_token_with_type(TokenType::WellKnownValue); !well_known_value.is_error()) {
  180. static constexpr struct {
  181. StringView name;
  182. WellKnownNode::Type type;
  183. } translations[] = {
  184. { "false"sv, WellKnownNode::Type::False },
  185. { "null"sv, WellKnownNode::Type::Null },
  186. { "this"sv, WellKnownNode::Type::This },
  187. { "true"sv, WellKnownNode::Type::True },
  188. { "undefined"sv, WellKnownNode::Type::Undefined },
  189. };
  190. for (auto [name, type] : translations)
  191. if (well_known_value.value().data == name)
  192. return make_ref_counted<WellKnownNode>(type);
  193. VERIFY_NOT_REACHED();
  194. }
  195. if (auto enumerator = consume_token_with_type(TokenType::Enumerator); !enumerator.is_error())
  196. return m_ctx.translation_unit()->get_node_for_enumerator_value(enumerator.value().data);
  197. if (auto number = consume_token_with_type(TokenType::Number); !number.is_error())
  198. return make_ref_counted<MathematicalConstant>(MUST(Crypto::BigFraction::from_string(number.value().data)));
  199. if (auto string = consume_token_with_type(TokenType::String); !string.is_error())
  200. return make_ref_counted<StringLiteral>(string.value().data);
  201. if (auto list_initialization = parse_list_initialization(); !list_initialization.is_error())
  202. return list_initialization.release_value();
  203. if (auto record_initialization = parse_record_direct_list_initialization(); !record_initialization.is_error())
  204. return record_initialization.release_value();
  205. if (auto the_this_value = parse_the_this_value(); !the_this_value.is_error())
  206. return the_this_value.release_value();
  207. return TextParseError {};
  208. }
  // <expr>
  //
  // Parses an expression with an explicit stack that holds already-built
  // subtrees (Tree) and not-yet-applied operator / bracket tokens (Token).
  //
  // Tokens are peeked one at a time. The loop stops, leaving the current token
  // unconsumed, at the end of input, at a closing bracket that has no opening
  // counterpart within this call, at a comma seen outside any bracket, or at a
  // token for which parse_value() fails. Afterwards the stack has to reduce to
  // exactly one Tree, which is returned; otherwise a parse error is returned.
  // The cursor is restored on every error return.
  TextParseErrorOr<Tree> TextParser::parse_expression()
  {
      auto rollback = rollback_point();

  // Reports a custom "valid expression continuation" message (which embeds the
  // violated condition as text) and returns a parse error when `expr` holds.
  #define THROW_PARSE_ERROR_IF(expr)                                                                            \
      do {                                                                                                      \
          if (expr) {                                                                                           \
              save_error(CustomMessage { "valid expression continuation (not valid because " #expr ")"##sv }); \
              return TextParseError {};                                                                         \
          }                                                                                                     \
      } while (false)
  #define THROW_PARSE_ERROR THROW_PARSE_ERROR_IF(true)

      Vector<Variant<Tree, Token>> stack;

      // Repeatedly folds the top of the stack while it looks like
      // [..., <operator token>, <Tree>]. A unary operator is always applied to the
      // tree above it. A binary operator is applied (using the tree below it as the
      // left operand) only while its precedence() is numerically smaller than
      // `precedence`. Anything else stops the folding.
      auto merge_stack = [&](i32 precedence) {
          if (!stack.last().has<Tree>())
              return;

          while (stack.size() >= 2) {
              auto const& maybe_operator = stack[stack.size() - 2];
              if (!maybe_operator.has<Token>())
                  break;
              auto last_operator = maybe_operator.get<Token>();

              auto right = stack.last().get<Tree>();

              if (last_operator.is_unary_operator()) {
                  auto operation = make_ref_counted<UnaryOperation>(last_operator.as_unary_operator(), right);
                  stack.shrink(stack.size() - 2);
                  stack.empend(operation);
              } else if (last_operator.is_binary_operator() && last_operator.precedence() < precedence) {
                  auto left = stack[stack.size() - 3].get<Tree>();
                  auto operation = make_ref_counted<BinaryOperation>(last_operator.as_binary_operator(), left, right);
                  stack.shrink(stack.size() - 3);
                  stack.empend(operation);
              } else {
                  break;
              }
          }
      };

      // If the top three stack entries are <Tree> <pre-merged binary operator> <Tree>,
      // replaces them with a single BinaryOperation right away; otherwise does nothing.
      auto merge_pre_merged = [&] {
          if (stack.size() < 3)
              return;

          auto const& maybe_left = stack[stack.size() - 3];
          auto const& maybe_operator = stack[stack.size() - 2];
          auto const& maybe_right = stack.last();

          if (!maybe_left.has<Tree>() || !maybe_operator.has<Token>() || !maybe_right.has<Tree>())
              return;

          auto last_operator = maybe_operator.get<Token>();
          if (!last_operator.is_pre_merged_binary_operator())
              return;

          auto expression = make_ref_counted<BinaryOperation>(last_operator.as_binary_operator(), maybe_left.get<Tree>(), maybe_right.get<Tree>());

          stack.shrink(stack.size() - 3);
          stack.empend(expression);
      };

      // Opening brackets seen minus closing brackets seen during this call.
      i32 bracket_balance = 0;

      while (true) {
          auto token_or_error = peek_token();
          if (!token_or_error.has_value())
              break;
          auto token = token_or_error.release_value();
          // Set when a sub-parser has already advanced the cursor, so the generic
          // single-token consume at the bottom of the loop must be skipped.
          bool is_consumed = false;

          // Classify what currently sits on top of the stack; the checks below use
          // this to decide how the incoming token may legally continue the expression.
          enum {
              NoneType,
              ExpressionType,
              PreMergedBinaryOperatorType,
              UnaryOperatorType,
              BinaryOperatorType,
              BracketType,
          } last_element_type;

          if (stack.is_empty())
              last_element_type = NoneType;
          else if (stack.last().has<Tree>())
              last_element_type = ExpressionType;
          else if (stack.last().get<Token>().is_pre_merged_binary_operator())
              last_element_type = PreMergedBinaryOperatorType;
          else if (stack.last().get<Token>().is_unary_operator())
              last_element_type = UnaryOperatorType;
          else if (stack.last().get<Token>().is_binary_operator())
              last_element_type = BinaryOperatorType;
          else if (stack.last().get<Token>().is_bracket())
              last_element_type = BracketType;
          else
              VERIFY_NOT_REACHED();

          // An ambiguous minus is binary when it directly follows an expression and
          // unary otherwise. No other ambiguous operator is handled here.
          if (token.is_ambiguous_operator()) {
              if (token.type == TokenType::AmbiguousMinus)
                  token.type = last_element_type == ExpressionType ? TokenType::BinaryMinus : TokenType::UnaryMinus;
              else
                  VERIFY_NOT_REACHED();
          }

          bracket_balance += token.is_opening_bracket();
          bracket_balance -= token.is_closing_bracket();

          // A closing bracket without a matching opener in this expression belongs to
          // the caller; stop here and leave it unconsumed.
          if (bracket_balance < 0)
              break;

          if (token.type == TokenType::ParenOpen) {
              if (last_element_type == ExpressionType) {
                  // This is a function call.
                  auto arguments = TRY(parse_function_arguments());
                  is_consumed = true;
                  stack.append(Tree { make_ref_counted<FunctionCall>(stack.take_last().get<Tree>(), move(arguments)) });
                  // parse_function_arguments() consumed the matching ')' as well, so undo
                  // the increment made for this '('.
                  --bracket_balance;
              } else {
                  // This is just an opening '(' in expression.
                  stack.append(token);
              }
          } else if (token.is_pre_merged_binary_operator()) {
              THROW_PARSE_ERROR_IF(last_element_type != ExpressionType);
              stack.append(token);
          } else if (token.is_unary_operator()) {
              THROW_PARSE_ERROR_IF(last_element_type == PreMergedBinaryOperatorType);
              stack.append(token);
          } else if (token.is_binary_operator() || token.is_closing_bracket()) {
              // A comma outside of any bracket ends the expression and is left for the caller.
              if (bracket_balance == 0 && token.type == TokenType::Comma)
                  break;

              THROW_PARSE_ERROR_IF(last_element_type != ExpressionType);

              // Fold whatever on the stack must be applied before this token.
              merge_stack(token.precedence());
              if (token.is_closing_bracket()) {
                  THROW_PARSE_ERROR_IF(stack.size() == 1);
                  THROW_PARSE_ERROR_IF(!stack[stack.size() - 2].get<Token>().matches_with(token));
                  // Drop the opening bracket that sits just below the bracketed subtree.
                  stack.remove(stack.size() - 2);
                  merge_pre_merged();
              } else {
                  stack.append(token);
              }
          } else {
              if (auto expression = parse_value(); !expression.is_error()) {
                  is_consumed = true;
                  THROW_PARSE_ERROR_IF(last_element_type == ExpressionType);
                  stack.append(expression.release_value());
                  merge_pre_merged();
              } else {
                  // Not something that can continue an expression; stop here.
                  break;
              }
          }

          if (!is_consumed)
              VERIFY(consume_token().has_value());
      }

      THROW_PARSE_ERROR_IF(stack.is_empty());
      // Fold everything that is still pending, then require a single resulting tree.
      merge_stack(closing_bracket_precedence);
      THROW_PARSE_ERROR_IF(stack.size() != 1 || !stack[0].has<Tree>());

      rollback.disarm();
      return stack[0].get<Tree>();
  #undef THROW_PARSE_ERROR
  #undef THROW_PARSE_ERROR_IF
  }
  350. // <condition> :== <expr> | (<expr> is <expr> (or <expr>)?)
  351. TextParseErrorOr<Tree> TextParser::parse_condition()
  352. {
  353. auto rollback = rollback_point();
  354. auto expression = TRY(parse_expression());
  355. if (!consume_token_with_type(TokenType::Is).is_error()) {
  356. Vector compare_values { TRY(parse_expression()) };
  357. if (!consume_word("or"sv).is_error())
  358. compare_values.append(TRY(parse_expression()));
  359. rollback.disarm();
  360. return make_ref_counted<IsOneOfOperation>(expression, move(compare_values));
  361. }
  362. rollback.disarm();
  363. return expression;
  364. }
  365. // return <expr>
  366. TextParseErrorOr<Tree> TextParser::parse_return_statement()
  367. {
  368. auto rollback = rollback_point();
  369. TRY(consume_word("return"sv));
  370. auto return_value = TRY(parse_expression());
  371. rollback.disarm();
  372. return make_ref_counted<ReturnNode>(return_value);
  373. }
  374. // assert: <condition>
  375. TextParseErrorOr<Tree> TextParser::parse_assert()
  376. {
  377. auto rollback = rollback_point();
  378. TRY(consume_token(TokenType::Identifier, "assert"sv));
  379. TRY(consume_token_with_type(TokenType::Colon));
  380. auto condition = TRY(parse_condition());
  381. rollback.disarm();
  382. return make_ref_counted<AssertExpression>(condition);
  383. }
  384. // (let <expr> be <expr>) | (set <expr> to <expr>)
  385. TextParseErrorOr<Tree> TextParser::parse_assignment()
  386. {
  387. auto rollback = rollback_point();
  388. bool is_let = !consume_word("let"sv).is_error();
  389. if (!is_let)
  390. TRY(consume_word("set"sv));
  391. auto lvalue = TRY(parse_expression());
  392. TRY(consume_word(is_let ? "be"sv : "to"sv));
  393. auto rvalue = TRY(parse_expression());
  394. rollback.disarm();
  395. auto op = is_let ? BinaryOperator::Declaration : BinaryOperator::Assignment;
  396. return make_ref_counted<BinaryOperation>(op, lvalue, rvalue);
  397. }
  398. // perform <expr>
  399. TextParseErrorOr<Tree> TextParser::parse_perform()
  400. {
  401. auto rollback = rollback_point();
  402. TRY(consume_word("perform"sv));
  403. auto value = TRY(parse_expression());
  404. rollback.disarm();
  405. return value;
  406. }
  407. // <simple_step>
  408. TextParseErrorOr<Tree> TextParser::parse_simple_step_or_inline_if_branch()
  409. {
  410. auto rollback = rollback_point();
  411. // Return <expr>.$
  412. if (auto result = parse_return_statement(); !result.is_error()) {
  413. TRY(consume_token_with_type(TokenType::Dot));
  414. TRY(expect_eof());
  415. rollback.disarm();
  416. return result.release_value();
  417. }
  418. // Assert: <expr>.$
  419. if (auto result = parse_assert(); !result.is_error()) {
  420. TRY(consume_token_with_type(TokenType::Dot));
  421. TRY(expect_eof());
  422. rollback.disarm();
  423. return result.release_value();
  424. }
  425. // Let <expr> be <expr>.$
  426. // Set <expr> to <expr>.$
  427. if (auto result = parse_assignment(); !result.is_error()) {
  428. TRY(consume_token_with_type(TokenType::Dot));
  429. TRY(expect_eof());
  430. rollback.disarm();
  431. return result.release_value();
  432. }
  433. // Perform <expr>.$
  434. if (auto result = parse_perform(); !result.is_error()) {
  435. TRY(consume_token_with_type(TokenType::Dot));
  436. TRY(expect_eof());
  437. rollback.disarm();
  438. return result.release_value();
  439. }
  440. return TextParseError {};
  441. }
  442. // <if_condition> :== (If <condition>) | (Else) | (Else if <condition>),
  443. TextParseErrorOr<TextParser::IfConditionParseResult> TextParser::parse_if_beginning()
  444. {
  445. auto rollback = rollback_point();
  446. bool is_if_branch = !consume_word("if"sv).is_error();
  447. NullableTree condition = nullptr;
  448. if (is_if_branch) {
  449. condition = TRY(parse_condition());
  450. } else {
  451. TRY(consume_word("else"sv));
  452. if (!consume_word("if"sv).is_error())
  453. condition = TRY(parse_condition());
  454. }
  455. TRY(consume_token_with_type(TokenType::Comma));
  456. rollback.disarm();
  457. return IfConditionParseResult { is_if_branch, condition };
  458. }
  459. // <inline_if> :== <if_condition> <simple_step>.$
  460. TextParseErrorOr<Tree> TextParser::parse_inline_if_else()
  461. {
  462. auto rollback = rollback_point();
  463. auto [is_if_branch, condition] = TRY(parse_if_beginning());
  464. auto then_branch = TRY(parse_simple_step_or_inline_if_branch());
  465. rollback.disarm();
  466. if (is_if_branch)
  467. return make_ref_counted<IfBranch>(condition.release_nonnull(), then_branch);
  468. return make_ref_counted<ElseIfBranch>(condition, then_branch);
  469. }
  470. // <if> :== <if_condition> then$ <substeps>
  471. TextParseErrorOr<Tree> TextParser::parse_if(Tree then_branch)
  472. {
  473. auto rollback = rollback_point();
  474. auto [is_if_branch, condition] = TRY(parse_if_beginning());
  475. TRY(consume_word("then"sv));
  476. TRY(expect_eof());
  477. rollback.disarm();
  478. if (is_if_branch)
  479. return make_ref_counted<IfBranch>(*condition, then_branch);
  480. else
  481. return make_ref_counted<ElseIfBranch>(condition, then_branch);
  482. }
  483. // <else> :== Else,$ <substeps>
  484. TextParseErrorOr<Tree> TextParser::parse_else(Tree else_branch)
  485. {
  486. auto rollback = rollback_point();
  487. TRY(consume_word("else"sv));
  488. TRY(consume_token_with_type(TokenType::Comma));
  489. TRY(expect_eof());
  490. rollback.disarm();
  491. return make_ref_counted<ElseIfBranch>(nullptr, else_branch);
  492. }
  493. // <simple_step> | <inline_if>
  494. TextParseErrorOr<Tree> TextParser::parse_step_without_substeps()
  495. {
  496. auto rollback = rollback_point();
  497. // <simple_step>
  498. if (auto result = parse_simple_step_or_inline_if_branch(); !result.is_error()) {
  499. rollback.disarm();
  500. return result.release_value();
  501. }
  502. // <inline_if>
  503. if (auto result = parse_inline_if_else(); !result.is_error()) {
  504. rollback.disarm();
  505. return result.release_value();
  506. }
  507. return TextParseError {};
  508. }
  509. // <if> | <else>
  510. TextParseErrorOr<Tree> TextParser::parse_step_with_substeps(Tree substeps)
  511. {
  512. auto rollback = rollback_point();
  513. // <if>
  514. if (auto result = parse_if(substeps); !result.is_error()) {
  515. rollback.disarm();
  516. return result.release_value();
  517. }
  518. // <else>
  519. if (auto result = parse_else(substeps); !result.is_error()) {
  520. rollback.disarm();
  521. return result.release_value();
  522. }
  523. return TextParseError {};
  524. }
  525. // <qualified_name> :== <word> (. <word>)*
  526. TextParseErrorOr<Vector<StringView>> TextParser::parse_qualified_name()
  527. {
  528. Vector<StringView> qualified_name;
  529. qualified_name.append(TRY(consume_token_with_type(TokenType::Word)).data);
  530. while (true) {
  531. auto token_or_error = consume_token_with_type(TokenType::MemberAccess);
  532. if (token_or_error.is_error())
  533. return qualified_name;
  534. qualified_name.append(TRY(consume_token_with_type(TokenType::Word)).data);
  535. }
  536. }
  537. // <function_arguments> :== '(' (<word> (, <word>)*)? ')'
  538. TextParseErrorOr<Vector<FunctionArgument>> TextParser::parse_function_arguments_in_declaration()
  539. {
  540. Vector<FunctionArgument> arguments;
  541. TRY(consume_token_with_type(TokenType::ParenOpen));
  542. while (true) {
  543. if (arguments.is_empty()) {
  544. auto argument = TRY(consume_token_with_one_of_types({ TokenType::ParenClose, TokenType::Identifier }));
  545. if (argument.type == TokenType::ParenClose)
  546. break;
  547. arguments.append({ argument.data });
  548. } else {
  549. arguments.append({ TRY(consume_token_with_type(TokenType::Identifier)).data });
  550. }
  551. auto next_token = TRY(consume_token_with_one_of_types({ TokenType::ParenClose, TokenType::Comma }));
  552. if (next_token.type == TokenType::ParenClose)
  553. break;
  554. }
  555. return arguments;
  556. }
  557. // <ao_declaration> :== <word> <function_arguments> $
  558. TextParseErrorOr<ClauseHeader::AbstractOperation> TextParser::parse_abstract_operation_declaration()
  559. {
  560. auto rollback = rollback_point();
  561. ClauseHeader::AbstractOperation function_definition;
  562. function_definition.name = TRY(consume_token_with_type(TokenType::Word)).data;
  563. function_definition.arguments = TRY(parse_function_arguments_in_declaration());
  564. TRY(expect_eof());
  565. rollback.disarm();
  566. return function_definition;
  567. }
  568. // <accessor_declaration> :== get <qualified_name> $
  569. TextParseErrorOr<ClauseHeader::Accessor> TextParser::parse_accessor_declaration()
  570. {
  571. auto rollback = rollback_point();
  572. TRY(consume_word("get"sv));
  573. ClauseHeader::Accessor accessor;
  574. accessor.qualified_name = TRY(parse_qualified_name());
  575. TRY(expect_eof());
  576. rollback.disarm();
  577. return accessor;
  578. }
  579. // <clause_header> :== <section_number> <ao_declaration> | <accessor_declaration>
  580. TextParseErrorOr<ClauseHeader> TextParser::parse_clause_header()
  581. {
  582. ClauseHeader result;
  583. auto section_number_token = TRY(consume_token_with_type(TokenType::SectionNumber));
  584. result.section_number = section_number_token.data;
  585. if (auto ao_declaration = parse_abstract_operation_declaration(); !ao_declaration.is_error()) {
  586. result.header = ao_declaration.release_value();
  587. } else if (auto accessor = parse_accessor_declaration(); !accessor.is_error()) {
  588. result.header = accessor.release_value();
  589. } else {
  590. return TextParseError {};
  591. }
  592. return result;
  593. }
  594. FailedTextParseDiagnostic TextParser::get_diagnostic() const
  595. {
  596. StringBuilder message;
  597. message.append("unexpected "sv);
  598. if (m_max_parsed_tokens == m_tokens.size()) {
  599. message.append("EOF"sv);
  600. } else {
  601. auto token = m_tokens[m_max_parsed_tokens];
  602. if (token.type == TokenType::Word)
  603. message.appendff("'{}'", token.data);
  604. else if (token.type == TokenType::Identifier)
  605. message.appendff("identifier '{}'", token.data);
  606. else
  607. message.append(token.name_for_diagnostic());
  608. }
  609. message.appendff(", expected ");
  610. size_t size = m_suitable_continuations.size();
  611. VERIFY(size > 0);
  612. for (size_t i = 0; i < size; ++i) {
  613. m_suitable_continuations[i].visit(
  614. [&](TokenType type) { message.append(token_info[to_underlying(type)].name_for_diagnostic); },
  615. [&](StringView word) { message.appendff("'{}'", word); },
  616. [&](CustomMessage continuation) { message.append(continuation.message); });
  617. if (i + 1 != size) {
  618. if (size == 2)
  619. message.append(" or "sv);
  620. else if (i + 2 == size)
  621. message.append(", or "sv);
  622. else
  623. message.append(", "sv);
  624. }
  625. }
  626. Location location = Location::global_scope();
  627. if (m_max_parsed_tokens < m_tokens.size()) {
  628. location = m_tokens[m_max_parsed_tokens].location;
  629. } else {
  630. // FIXME: Would be nice to point to the closing tag not the opening one. This is also the
  631. // only place where we use m_location.
  632. location = m_ctx.location_from_xml_offset(m_node->offset);
  633. }
  634. return { location, MUST(message.to_string()) };
  635. }
  636. }