12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922 |
- /*
- * Copyright (c) 2022, Ali Mohammad Pur <mpfard@serenityos.org>
- *
- * SPDX-License-Identifier: BSD-2-Clause
- */
- #include <AK/CharacterTypes.h>
- #include <AK/Debug.h>
- #include <AK/StringUtils.h>
- #include <Shell/PosixParser.h>
- template<typename T, typename... Ts>
- static inline bool is_one_of(T const& value, Ts const&... values)
- {
- return ((value == values) || ...);
- }
- static inline bool is_io_operator(Shell::Posix::Token const& token)
- {
- using namespace Shell::Posix;
- return is_one_of(token.type,
- Token::Type::Less, Token::Type::Great,
- Token::Type::LessAnd, Token::Type::GreatAnd,
- Token::Type::DoubleLess, Token::Type::DoubleGreat,
- Token::Type::LessGreat, Token::Type::Clobber);
- }
- static inline bool is_separator(Shell::Posix::Token const& token)
- {
- using namespace Shell::Posix;
- return is_one_of(token.type,
- Token::Type::Semicolon, Token::Type::Newline,
- Token::Type::AndIf, Token::Type::OrIf,
- Token::Type::Pipe,
- Token::Type::And);
- }
- static inline bool is_a_reserved_word_position(Shell::Posix::Token const& token, Optional<Shell::Posix::Token> const& previous_token, Optional<Shell::Posix::Token> const& previous_previous_token)
- {
- using namespace Shell::Posix;
- auto is_start_of_command = !previous_token.has_value()
- || previous_token->value.is_empty()
- || is_separator(*previous_token)
- || is_one_of(previous_token->type,
- Token::Type::OpenParen, Token::Type::CloseParen, Token::Type::Newline, Token::Type::DoubleSemicolon,
- Token::Type::Semicolon, Token::Type::Pipe, Token::Type::OrIf, Token::Type::AndIf);
- if (is_start_of_command)
- return true;
- if (!previous_token.has_value())
- return false;
- auto previous_is_reserved_word = is_one_of(previous_token->value,
- "for"sv, "in"sv, "case"sv, "if"sv, "then"sv, "else"sv,
- "elif"sv, "while"sv, "until"sv, "do"sv, "done"sv, "esac"sv,
- "fi"sv, "!"sv, "{"sv, "}"sv);
- if (previous_is_reserved_word)
- return true;
- if (!previous_previous_token.has_value())
- return false;
- auto is_third_in_case = previous_previous_token->value == "case"sv
- && token.type == Token::Type::Token && token.value == "in"sv;
- if (is_third_in_case)
- return true;
- auto is_third_in_for = previous_previous_token->value == "for"sv
- && token.type == Token::Type::Token && is_one_of(token.value, "in"sv, "do"sv);
- return is_third_in_for;
- }
- static inline bool is_reserved(Shell::Posix::Token const& token)
- {
- using namespace Shell::Posix;
- return is_one_of(token.type,
- Token::Type::If, Token::Type::Then, Token::Type::Else,
- Token::Type::Elif, Token::Type::Fi, Token::Type::Do,
- Token::Type::Done, Token::Type::Case, Token::Type::Esac,
- Token::Type::While, Token::Type::Until, Token::Type::For,
- Token::Type::In, Token::Type::OpenBrace, Token::Type::CloseBrace,
- Token::Type::Bang);
- }
- static inline bool is_valid_name(StringView word)
- {
- // Dr.POSIX: a word consisting solely of underscores, digits, and alphabetics from the portable character set. The first character of a name is not a digit.
- return !word.is_empty()
- && !is_ascii_digit(word[0])
- && all_of(word, [](auto ch) { return is_ascii_alphanumeric(ch) || ch == '_'; });
- }
- namespace Shell::Posix {
- void Parser::fill_token_buffer()
- {
- for (;;) {
- auto token = next_expanded_token();
- if (!token.has_value())
- break;
- #if SHELL_POSIX_PARSER_DEBUG
- DeprecatedString position = "(~)";
- if (token->position.has_value())
- position = DeprecatedString::formatted("{}:{}", token->position->start_offset, token->position->end_offset);
- DeprecatedString expansions = "";
- for (auto& exp : token->resolved_expansions)
- exp.visit(
- [&](ResolvedParameterExpansion& x) { expansions = DeprecatedString::formatted("{}param({}),", expansions, x.to_deprecated_string()); },
- [&](ResolvedCommandExpansion& x) { expansions = DeprecatedString::formatted("{}command({:p})", expansions, x.command.ptr()); });
- DeprecatedString rexpansions = "";
- for (auto& exp : token->expansions)
- exp.visit(
- [&](ParameterExpansion& x) { rexpansions = DeprecatedString::formatted("{}param({}) from {} to {},", rexpansions, x.parameter.string_view(), x.range.start, x.range.length); },
- [&](auto&) { rexpansions = DeprecatedString::formatted("{}...,", rexpansions); });
- dbgln("Token @ {}: '{}' (type {}) - parsed expansions: {} - raw expansions: {}", position, token->value.replace("\n"sv, "\\n"sv, ReplaceMode::All), token->type_name(), expansions, rexpansions);
- #endif
- }
- m_token_index = 0;
- }
- RefPtr<AST::Node> Parser::parse()
- {
- return parse_complete_command();
- }
- Optional<Token> Parser::next_expanded_token()
- {
- while (m_token_buffer.find_if([](auto& token) { return token.type == Token::Type::Eof; }).is_end()) {
- auto tokens = m_lexer.batch_next();
- auto expanded = perform_expansions(move(tokens));
- m_token_buffer.extend(expanded);
- }
- if (m_token_buffer.size() == m_token_index)
- return {};
- return m_token_buffer[m_token_index++];
- }
- Vector<Token> Parser::perform_expansions(Vector<Token> tokens)
- {
- if (tokens.is_empty())
- return {};
- Vector<Token> expanded_tokens;
- auto previous_token = Optional<Token>();
- auto previous_previous_token = Optional<Token>();
- auto tokens_taken_from_buffer = 0;
- expanded_tokens.ensure_capacity(tokens.size());
- auto swap_expansions = [&] {
- if (previous_previous_token.has_value())
- expanded_tokens.append(previous_previous_token.release_value());
- if (previous_token.has_value())
- expanded_tokens.append(previous_token.release_value());
- for (; tokens_taken_from_buffer > 0; tokens_taken_from_buffer--)
- m_token_buffer.append(expanded_tokens.take_first());
- swap(tokens, expanded_tokens);
- expanded_tokens.clear_with_capacity();
- };
- // (1) join all consecutive newlines (this works around a grammar ambiguity)
- auto previous_was_newline = !m_token_buffer.is_empty() && m_token_buffer.last().type == Token::Type::Newline;
- for (auto& token : tokens) {
- if (token.type == Token::Type::Newline) {
- if (previous_was_newline)
- continue;
- previous_was_newline = true;
- } else {
- previous_was_newline = false;
- }
- expanded_tokens.append(move(token));
- }
- swap_expansions();
- // (2) Detect reserved words
- if (m_token_buffer.size() >= 1) {
- previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- if (m_token_buffer.size() >= 1) {
- previous_previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- auto check_reserved_word = [&](auto& token) {
- if (is_a_reserved_word_position(token, previous_token, previous_previous_token)) {
- if (token.value == "if"sv)
- token.type = Token::Type::If;
- else if (token.value == "then"sv)
- token.type = Token::Type::Then;
- else if (token.value == "else"sv)
- token.type = Token::Type::Else;
- else if (token.value == "elif"sv)
- token.type = Token::Type::Elif;
- else if (token.value == "fi"sv)
- token.type = Token::Type::Fi;
- else if (token.value == "while"sv)
- token.type = Token::Type::While;
- else if (token.value == "until"sv)
- token.type = Token::Type::Until;
- else if (token.value == "do"sv)
- token.type = Token::Type::Do;
- else if (token.value == "done"sv)
- token.type = Token::Type::Done;
- else if (token.value == "case"sv)
- token.type = Token::Type::Case;
- else if (token.value == "esac"sv)
- token.type = Token::Type::Esac;
- else if (token.value == "for"sv)
- token.type = Token::Type::For;
- else if (token.value == "in"sv)
- token.type = Token::Type::In;
- else if (token.value == "!"sv)
- token.type = Token::Type::Bang;
- else if (token.value == "{"sv)
- token.type = Token::Type::OpenBrace;
- else if (token.value == "}"sv)
- token.type = Token::Type::CloseBrace;
- else if (token.type == Token::Type::Token)
- token.type = Token::Type::Word;
- } else if (token.type == Token::Type::Token) {
- token.type = Token::Type::Word;
- }
- };
- for (auto& token : tokens) {
- if (!previous_token.has_value()) {
- check_reserved_word(token);
- previous_token = token;
- continue;
- }
- if (!previous_previous_token.has_value()) {
- check_reserved_word(token);
- previous_previous_token = move(previous_token);
- previous_token = token;
- continue;
- }
- check_reserved_word(token);
- expanded_tokens.append(exchange(*previous_previous_token, exchange(*previous_token, move(token))));
- }
- swap_expansions();
- // (3) Detect io_number tokens
- previous_token = Optional<Token>();
- tokens_taken_from_buffer = 0;
- if (m_token_buffer.size() >= 1) {
- previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- for (auto& token : tokens) {
- if (!previous_token.has_value()) {
- previous_token = token;
- continue;
- }
- if (is_io_operator(token) && previous_token->type == Token::Type::Word && all_of(previous_token->value, is_ascii_digit)) {
- previous_token->type = Token::Type::IoNumber;
- }
- expanded_tokens.append(exchange(*previous_token, move(token)));
- }
- swap_expansions();
- // (4) Try to identify simple commands
- previous_token = Optional<Token>();
- tokens_taken_from_buffer = 0;
- if (m_token_buffer.size() >= 1) {
- previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- for (auto& token : tokens) {
- if (!previous_token.has_value()) {
- token.could_be_start_of_a_simple_command = true;
- previous_token = token;
- continue;
- }
- token.could_be_start_of_a_simple_command = is_one_of(previous_token->type, Token::Type::OpenParen, Token::Type::CloseParen, Token::Type::Newline)
- || is_separator(*previous_token)
- || (!is_reserved(*previous_token) && is_reserved(token));
- expanded_tokens.append(exchange(*previous_token, move(token)));
- }
- swap_expansions();
- // (5) Detect assignment words
- for (auto& token : tokens) {
- if (token.could_be_start_of_a_simple_command)
- m_disallow_command_prefix = false;
- // Check if we're in a command prefix (could be an assignment)
- if (!m_disallow_command_prefix && token.type == Token::Type::Word && token.value.contains('=')) {
- // If the word before '=' is a valid name, this is an assignment
- auto parts = token.value.split_limit('=', 2);
- if (is_valid_name(parts[0]))
- token.type = Token::Type::AssignmentWord;
- else
- m_disallow_command_prefix = true;
- } else {
- m_disallow_command_prefix = true;
- }
- expanded_tokens.append(move(token));
- }
- swap_expansions();
- // (6) Parse expansions
- for (auto& token : tokens) {
- if (!is_one_of(token.type, Token::Type::Word, Token::Type::AssignmentWord)) {
- expanded_tokens.append(move(token));
- continue;
- }
- Vector<ResolvedExpansion> resolved_expansions;
- for (auto& expansion : token.expansions) {
- auto resolved = expansion.visit(
- [&](ParameterExpansion const& expansion) -> ResolvedExpansion {
- auto text = expansion.parameter.string_view();
- // ${NUMBER}
- if (all_of(text, is_ascii_digit)) {
- return ResolvedParameterExpansion {
- .parameter = expansion.parameter.to_deprecated_string(),
- .argument = {},
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::GetPositionalParameter,
- };
- }
- if (text.length() == 1) {
- ResolvedParameterExpansion::Op op;
- switch (text[0]) {
- case '!':
- op = ResolvedParameterExpansion::Op::GetLastBackgroundPid;
- break;
- case '@':
- op = ResolvedParameterExpansion::Op::GetPositionalParameterList;
- break;
- case '-':
- op = ResolvedParameterExpansion::Op::GetCurrentOptionFlags;
- break;
- case '#':
- op = ResolvedParameterExpansion::Op::GetPositionalParameterCount;
- break;
- case '?':
- op = ResolvedParameterExpansion::Op::GetLastExitStatus;
- break;
- case '*':
- op = ResolvedParameterExpansion::Op::GetPositionalParameterListAsString;
- break;
- case '$':
- op = ResolvedParameterExpansion::Op::GetShellProcessId;
- break;
- default:
- if (is_valid_name(text)) {
- op = ResolvedParameterExpansion::Op::GetVariable;
- } else {
- error(token, "Unknown parameter expansion: {}", text);
- return ResolvedParameterExpansion {
- .parameter = expansion.parameter.to_deprecated_string(),
- .argument = {},
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::StringLength,
- };
- }
- }
- return ResolvedParameterExpansion {
- .parameter = {},
- .argument = {},
- .range = expansion.range,
- .op = op,
- };
- }
- if (text.starts_with('#')) {
- return ResolvedParameterExpansion {
- .parameter = text.substring_view(1).to_deprecated_string(),
- .argument = {},
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::StringLength,
- };
- }
- GenericLexer lexer { text };
- auto parameter = lexer.consume_while([first = true](char c) mutable {
- if (first) {
- first = false;
- return is_ascii_alpha(c) || c == '_';
- }
- return is_ascii_alphanumeric(c) || c == '_';
- });
- StringView argument;
- ResolvedParameterExpansion::Op op;
- switch (lexer.peek()) {
- case ':':
- lexer.ignore();
- switch (lexer.is_eof() ? 0 : lexer.consume()) {
- case '-':
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::UseDefaultValue;
- break;
- case '=':
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::AssignDefaultValue;
- break;
- case '?':
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::IndicateErrorIfEmpty;
- break;
- case '+':
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::UseAlternativeValue;
- break;
- default:
- error(token, "Unknown parameter expansion: {}", text);
- return ResolvedParameterExpansion {
- .parameter = parameter.to_deprecated_string(),
- .argument = {},
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::StringLength,
- };
- }
- break;
- case '-':
- lexer.ignore();
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::UseDefaultValueIfUnset;
- break;
- case '=':
- lexer.ignore();
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::AssignDefaultValueIfUnset;
- break;
- case '?':
- lexer.ignore();
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::IndicateErrorIfUnset;
- break;
- case '+':
- lexer.ignore();
- argument = lexer.consume_all();
- op = ResolvedParameterExpansion::Op::UseAlternativeValueIfUnset;
- break;
- case '%':
- if (lexer.consume_specific('%'))
- op = ResolvedParameterExpansion::Op::RemoveLargestSuffixByPattern;
- else
- op = ResolvedParameterExpansion::Op::RemoveSmallestSuffixByPattern;
- argument = lexer.consume_all();
- break;
- case '#':
- if (lexer.consume_specific('#'))
- op = ResolvedParameterExpansion::Op::RemoveLargestPrefixByPattern;
- else
- op = ResolvedParameterExpansion::Op::RemoveSmallestPrefixByPattern;
- argument = lexer.consume_all();
- break;
- default:
- if (is_valid_name(text)) {
- op = ResolvedParameterExpansion::Op::GetVariable;
- } else {
- error(token, "Unknown parameter expansion: {}", text);
- return ResolvedParameterExpansion {
- .parameter = parameter.to_deprecated_string(),
- .argument = {},
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::StringLength,
- };
- }
- }
- VERIFY(lexer.is_eof());
- return ResolvedParameterExpansion {
- .parameter = parameter.to_deprecated_string(),
- .argument = argument.to_deprecated_string(),
- .range = expansion.range,
- .op = op,
- .expand = ResolvedParameterExpansion::Expand::Word,
- };
- },
- [&](ArithmeticExpansion const& expansion) -> ResolvedExpansion {
- error(token, "Arithmetic expansion is not supported");
- return ResolvedParameterExpansion {
- .parameter = ""sv,
- .argument = ""sv,
- .range = expansion.range,
- .op = ResolvedParameterExpansion::Op::StringLength,
- .expand = ResolvedParameterExpansion::Expand::Nothing,
- };
- },
- [&](CommandExpansion const& expansion) -> ResolvedExpansion {
- Parser parser { expansion.command.string_view() };
- auto node = parser.parse();
- m_errors.extend(move(parser.m_errors));
- return ResolvedCommandExpansion {
- move(node),
- expansion.range,
- };
- });
- resolved_expansions.append(move(resolved));
- }
- token.resolved_expansions = move(resolved_expansions);
- expanded_tokens.append(move(token));
- }
- swap_expansions();
- // (7) Loop variables
- previous_token = {};
- tokens_taken_from_buffer = 0;
- if (m_token_buffer.size() >= 1) {
- previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- for (auto& token : tokens) {
- if (!previous_token.has_value()) {
- previous_token = token;
- continue;
- }
- if (previous_token->type == Token::Type::For && token.type == Token::Type::Word && is_valid_name(token.value)) {
- token.type = Token::Type::VariableName;
- }
- expanded_tokens.append(exchange(*previous_token, token));
- }
- swap_expansions();
- // (8) Function names
- previous_token = {};
- previous_previous_token = {};
- tokens_taken_from_buffer = 0;
- if (m_token_buffer.size() >= 1) {
- previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- if (m_token_buffer.size() >= 1) {
- previous_previous_token = m_token_buffer.take_last();
- tokens_taken_from_buffer++;
- }
- for (auto& token : tokens) {
- if (!previous_token.has_value()) {
- previous_token = token;
- continue;
- }
- if (!previous_previous_token.has_value()) {
- previous_previous_token = move(previous_token);
- previous_token = token;
- continue;
- }
- // NAME ( )
- if (previous_previous_token->could_be_start_of_a_simple_command
- && previous_previous_token->type == Token::Type::Word
- && previous_token->type == Token::Type::OpenParen
- && token.type == Token::Type::CloseParen) {
- previous_previous_token->type = Token::Type::VariableName;
- }
- expanded_tokens.append(exchange(*previous_previous_token, exchange(*previous_token, token)));
- }
- swap_expansions();
- return tokens;
- }
- static AST::Position empty_position()
- {
- return { 0, 0, { 0, 0 }, { 0, 0 } };
- }
- RefPtr<AST::Node> Parser::parse_complete_command()
- {
- auto list = [&] {
- // separator...
- while (is_separator(peek()))
- skip();
- // list EOF
- auto list = parse_list();
- if (eof())
- return list;
- // list separator EOF
- while (is_separator(peek()))
- skip();
- if (eof())
- return list;
- auto position = peek().position;
- auto syntax_error = make_ref_counted<AST::SyntaxError>(
- position.value_or(empty_position()),
- "Extra tokens after complete command"sv);
- if (list)
- list->set_is_syntax_error(*syntax_error);
- else
- list = syntax_error;
- return list;
- }();
- if (!list)
- return nullptr;
- return make_ref_counted<AST::Execute>(list->position(), *list);
- }
- RefPtr<AST::Node> Parser::parse_list()
- {
- NonnullRefPtrVector<AST::Node> nodes;
- Vector<AST::Position> positions;
- auto start_position = peek().position.value_or(empty_position());
- for (;;) {
- auto new_node = parse_and_or();
- if (!new_node)
- break;
- if (peek().type == Token::Type::And) {
- new_node = make_ref_counted<AST::Background>(
- new_node->position(),
- *new_node);
- }
- nodes.append(new_node.release_nonnull());
- if (!is_separator(peek()) || eof())
- break;
- auto position = consume().position;
- if (position.has_value())
- positions.append(position.release_value());
- }
- auto end_position = peek().position.value_or(empty_position());
- return make_ref_counted<AST::Sequence>(
- AST::Position {
- start_position.start_offset,
- end_position.end_offset,
- start_position.start_line,
- start_position.end_line,
- },
- move(nodes),
- move(positions));
- }
- RefPtr<AST::Node> Parser::parse_and_or()
- {
- auto node = parse_pipeline();
- if (!node)
- return {};
- for (;;) {
- if (peek().type == Token::Type::AndIf) {
- auto and_token = consume();
- while (peek().type == Token::Type::Newline)
- skip();
- auto rhs = parse_pipeline();
- if (!rhs)
- return {};
- node = make_ref_counted<AST::And>(
- node->position(),
- *node,
- rhs.release_nonnull(),
- and_token.position.value_or(empty_position()));
- continue;
- }
- if (peek().type == Token::Type::OrIf) {
- auto or_token = consume();
- while (peek().type == Token::Type::Newline)
- skip();
- auto rhs = parse_pipeline();
- if (!rhs)
- return {};
- node = make_ref_counted<AST::And>(
- node->position(),
- *node,
- rhs.release_nonnull(),
- or_token.position.value_or(empty_position()));
- continue;
- }
- break;
- }
- return node;
- }
- RefPtr<AST::Node> Parser::parse_pipeline()
- {
- return parse_pipe_sequence();
- }
- RefPtr<AST::Node> Parser::parse_pipe_sequence()
- {
- auto node = parse_command();
- if (!node)
- return {};
- for (;;) {
- if (peek().type != Token::Type::Pipe)
- break;
- consume();
- while (peek().type == Token::Type::Newline)
- skip();
- auto rhs = parse_command();
- if (!rhs)
- return {};
- node = make_ref_counted<AST::Pipe>(
- node->position(),
- *node,
- rhs.release_nonnull());
- }
- return node;
- }
- RefPtr<AST::Node> Parser::parse_command()
- {
- auto node = [this] {
- if (auto node = parse_function_definition())
- return node;
- if (auto node = parse_simple_command())
- return node;
- auto node = parse_compound_command();
- if (!node)
- return node;
- if (auto list = parse_redirect_list()) {
- auto position = list->position();
- node = make_ref_counted<AST::Join>(
- node->position().with_end(position),
- *node,
- list.release_nonnull());
- }
- return node;
- }();
- if (!node)
- return nullptr;
- return make_ref_counted<AST::CastToCommand>(node->position(), *node);
- }
- RefPtr<AST::Node> Parser::parse_function_definition()
- {
- // NAME OPEN_PAREN CLOSE_PAREN newline* function_body
- auto start_index = m_token_index;
- ArmedScopeGuard reset = [&] {
- m_token_index = start_index;
- };
- if (peek().type != Token::Type::VariableName) {
- return nullptr;
- }
- auto name = consume();
- if (consume().type != Token::Type::OpenParen)
- return nullptr;
- if (consume().type != Token::Type::CloseParen)
- return nullptr;
- while (peek().type == Token::Type::Newline)
- skip();
- auto body = parse_function_body();
- if (!body)
- return nullptr;
- reset.disarm();
- return make_ref_counted<AST::FunctionDeclaration>(
- name.position.value_or(empty_position()).with_end(peek().position.value_or(empty_position())),
- AST::NameWithPosition { name.value, name.position.value_or(empty_position()) },
- Vector<AST::NameWithPosition> {},
- body.release_nonnull());
- }
- RefPtr<AST::Node> Parser::parse_function_body()
- {
- // compound_command redirect_list?
- auto node = parse_compound_command();
- if (!node)
- return nullptr;
- if (auto list = parse_redirect_list()) {
- auto position = list->position();
- node = make_ref_counted<AST::Join>(
- node->position().with_end(position),
- *node,
- list.release_nonnull());
- }
- return node;
- }
- RefPtr<AST::Node> Parser::parse_redirect_list()
- {
- // io_redirect*
- RefPtr<AST::Node> node;
- for (;;) {
- auto new_node = parse_io_redirect();
- if (!new_node)
- break;
- if (node) {
- node = make_ref_counted<AST::Join>(
- node->position().with_end(new_node->position()),
- *node,
- new_node.release_nonnull());
- } else {
- node = new_node;
- }
- }
- return node;
- }
- RefPtr<AST::Node> Parser::parse_compound_command()
- {
- if (auto node = parse_brace_group())
- return node;
- if (auto node = parse_subshell())
- return node;
- if (auto node = parse_if_clause())
- return node;
- if (auto node = parse_for_clause())
- return node;
- if (auto node = parse_case_clause())
- return node;
- if (auto node = parse_while_clause())
- return node;
- if (auto node = parse_until_clause())
- return node;
- return {};
- }
- RefPtr<AST::Node> Parser::parse_while_clause()
- {
- if (peek().type != Token::Type::While)
- return nullptr;
- auto start_position = consume().position.value_or(empty_position());
- auto condition = parse_compound_list();
- if (!condition)
- condition = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- "Expected condition after 'while'"sv);
- auto do_group = parse_do_group();
- if (!do_group)
- do_group = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- "Expected 'do' after 'while'"sv);
- // while foo; bar -> loop { if foo { bar } else { break } }
- return make_ref_counted<AST::ForLoop>(
- start_position.with_end(peek().position.value_or(empty_position())),
- Optional<AST::NameWithPosition> {},
- Optional<AST::NameWithPosition> {},
- nullptr,
- make_ref_counted<AST::IfCond>(
- start_position.with_end(peek().position.value_or(empty_position())),
- Optional<AST::Position> {},
- condition.release_nonnull(),
- do_group.release_nonnull(),
- make_ref_counted<AST::ContinuationControl>(
- start_position,
- AST::ContinuationControl::ContinuationKind::Break)));
- }
- RefPtr<AST::Node> Parser::parse_until_clause()
- {
- if (peek().type != Token::Type::Until)
- return nullptr;
- auto start_position = consume().position.value_or(empty_position());
- auto condition = parse_compound_list();
- if (!condition)
- condition = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- "Expected condition after 'until'"sv);
- auto do_group = parse_do_group();
- if (!do_group)
- do_group = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- "Expected 'do' after 'until'"sv);
- // until foo; bar -> loop { if foo { break } else { bar } }
- return make_ref_counted<AST::ForLoop>(
- start_position.with_end(peek().position.value_or(empty_position())),
- Optional<AST::NameWithPosition> {},
- Optional<AST::NameWithPosition> {},
- nullptr,
- make_ref_counted<AST::IfCond>(
- start_position.with_end(peek().position.value_or(empty_position())),
- Optional<AST::Position> {},
- condition.release_nonnull(),
- make_ref_counted<AST::ContinuationControl>(
- start_position,
- AST::ContinuationControl::ContinuationKind::Break),
- do_group.release_nonnull()));
- }
- RefPtr<AST::Node> Parser::parse_brace_group()
- {
- if (peek().type != Token::Type::OpenBrace)
- return nullptr;
- consume();
- auto list = parse_compound_list();
- RefPtr<AST::SyntaxError> error;
- if (peek().type != Token::Type::CloseBrace) {
- error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected '}}', not {}", peek().type_name()));
- } else {
- consume();
- }
- if (error) {
- if (list)
- list->set_is_syntax_error(*error);
- else
- list = error;
- }
- return make_ref_counted<AST::Execute>(list->position(), *list);
- }
- RefPtr<AST::Node> Parser::parse_case_clause()
- {
- auto start_position = peek().position.value_or(empty_position());
- if (peek().type != Token::Type::Case)
- return nullptr;
- skip();
- RefPtr<AST::SyntaxError> syntax_error;
- auto expr = parse_word();
- if (!expr)
- expr = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected a word, not {}", peek().type_name()));
- if (peek().type != Token::Type::In) {
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'in', not {}", peek().type_name()));
- } else {
- skip();
- }
- while (peek().type == Token::Type::Newline)
- skip();
- Vector<AST::MatchEntry> entries;
- for (;;) {
- if (eof() || peek().type == Token::Type::Esac)
- break;
- if (peek().type == Token::Type::Newline) {
- skip();
- continue;
- }
- // Parse a pattern list
- auto needs_dsemi = true;
- if (peek().type == Token::Type::OpenParen) {
- skip();
- needs_dsemi = false;
- }
- auto result = parse_case_list();
- if (peek().type == Token::Type::CloseParen) {
- skip();
- } else {
- if (!syntax_error)
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected ')', not {}", peek().type_name()));
- break;
- }
- while (peek().type == Token::Type::Newline)
- skip();
- auto compound_list = parse_compound_list();
- if (peek().type == Token::Type::DoubleSemicolon) {
- skip();
- } else if (needs_dsemi) {
- if (!syntax_error)
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected ';;', not {}", peek().type_name()));
- }
- if (syntax_error) {
- if (compound_list)
- compound_list->set_is_syntax_error(*syntax_error);
- else
- compound_list = syntax_error;
- syntax_error = nullptr;
- }
- entries.append(AST::MatchEntry {
- .options = move(result.nodes),
- .match_names = {},
- .match_as_position = {},
- .pipe_positions = move(result.pipe_positions),
- .body = move(compound_list),
- });
- }
- if (peek().type != Token::Type::Esac) {
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'esac', not {}", peek().type_name()));
- } else {
- skip();
- }
- auto node = make_ref_counted<AST::MatchExpr>(
- start_position.with_end(peek().position.value_or(empty_position())),
- expr.release_nonnull(),
- DeprecatedString {},
- Optional<AST::Position> {},
- move(entries));
- if (syntax_error)
- node->set_is_syntax_error(*syntax_error);
- return node;
- }
- Parser::CaseItemsResult Parser::parse_case_list()
- {
- // Just a list of words split by '|', delimited by ')'
- NonnullRefPtrVector<AST::Node> nodes;
- Vector<AST::Position> pipes;
- for (;;) {
- if (eof() || peek().type == Token::Type::CloseParen)
- break;
- if (peek().type != Token::Type::Word)
- break;
- auto node = parse_word();
- if (!node)
- node = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected a word, not {}", peek().type_name()));
- nodes.append(node.release_nonnull());
- if (peek().type == Token::Type::Pipe) {
- pipes.append(peek().position.value_or(empty_position()));
- skip();
- } else {
- break;
- }
- }
- if (nodes.is_empty())
- nodes.append(make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected a word, not {}", peek().type_name())));
- return { move(pipes), move(nodes) };
- }
- RefPtr<AST::Node> Parser::parse_if_clause()
- {
- // If compound_list Then compound_list {Elif compound_list Then compound_list (Fi|Else)?} [(?=Else) compound_list] (?!=Fi) Fi
- auto start_position = peek().position.value_or(empty_position());
- if (peek().type != Token::Type::If)
- return nullptr;
- skip();
- auto main_condition = parse_compound_list();
- if (!main_condition)
- main_condition = make_ref_counted<AST::SyntaxError>(empty_position(), "Expected compound list after 'if'");
- RefPtr<AST::SyntaxError> syntax_error;
- if (peek().type != Token::Type::Then) {
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'then', not {}", peek().type_name()));
- } else {
- skip();
- }
- auto main_consequence = parse_compound_list();
- if (!main_consequence)
- main_consequence = make_ref_counted<AST::SyntaxError>(empty_position(), "Expected compound list after 'then'");
- auto node = make_ref_counted<AST::IfCond>(start_position, Optional<AST::Position>(), main_condition.release_nonnull(), main_consequence.release_nonnull(), nullptr);
- auto active_node = node;
- while (peek().type == Token::Type::Elif) {
- skip();
- auto condition = parse_compound_list();
- if (!condition)
- condition = make_ref_counted<AST::SyntaxError>(empty_position(), "Expected compound list after 'elif'");
- if (peek().type != Token::Type::Then) {
- if (!syntax_error)
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'then', not {}", peek().type_name()));
- } else {
- skip();
- }
- auto consequence = parse_compound_list();
- if (!consequence)
- consequence = make_ref_counted<AST::SyntaxError>(empty_position(), "Expected compound list after 'then'");
- auto new_node = make_ref_counted<AST::IfCond>(start_position, Optional<AST::Position>(), condition.release_nonnull(), consequence.release_nonnull(), nullptr);
- active_node->false_branch() = new_node;
- active_node = move(new_node);
- }
- auto needs_fi = true;
- switch (peek().type) {
- case Token::Type::Else:
- skip();
- active_node->false_branch() = parse_compound_list();
- if (!active_node->false_branch())
- active_node->false_branch() = make_ref_counted<AST::SyntaxError>(empty_position(), "Expected compound list after 'else'");
- break;
- case Token::Type::Fi:
- needs_fi = false;
- break;
- default:
- if (!syntax_error)
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'else' or 'fi', not {}", peek().type_name()));
- break;
- }
- if (needs_fi) {
- if (peek().type != Token::Type::Fi) {
- if (!syntax_error)
- syntax_error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'fi', not {}", peek().type_name()));
- } else {
- skip();
- }
- }
- if (syntax_error)
- node->set_is_syntax_error(*syntax_error);
- return node;
- }
- RefPtr<AST::Node> Parser::parse_subshell()
- {
- auto start_position = peek().position.value_or(empty_position());
- if (peek().type != Token::Type::OpenParen)
- return nullptr;
- skip();
- RefPtr<AST::SyntaxError> error;
- auto list = parse_compound_list();
- if (!list)
- error = make_ref_counted<AST::SyntaxError>(peek().position.value_or(empty_position()), "Expected compound list after ("sv);
- if (peek().type != Token::Type::CloseParen)
- error = make_ref_counted<AST::SyntaxError>(peek().position.value_or(empty_position()), "Expected ) after compound list"sv);
- else
- skip();
- if (!list)
- return error;
- return make_ref_counted<AST::Subshell>(
- start_position.with_end(peek().position.value_or(empty_position())),
- list.release_nonnull());
- }
- RefPtr<AST::Node> Parser::parse_compound_list()
- {
- while (peek().type == Token::Type::Newline)
- skip();
- auto term = parse_term();
- if (!term)
- return term;
- if (is_separator(peek())) {
- if (consume().type == Token::Type::And) {
- term = make_ref_counted<AST::Background>(
- term->position().with_end(peek().position.value_or(empty_position())),
- *term);
- }
- }
- return term;
- }
- RefPtr<AST::Node> Parser::parse_term()
- {
- NonnullRefPtrVector<AST::Node> nodes;
- Vector<AST::Position> positions;
- auto start_position = peek().position.value_or(empty_position());
- for (;;) {
- auto new_node = parse_and_or();
- if (!new_node)
- break;
- nodes.append(new_node.release_nonnull());
- if (!is_separator(peek()))
- break;
- auto position = consume().position;
- if (position.has_value())
- positions.append(position.release_value());
- }
- auto end_position = peek().position.value_or(empty_position());
- return make_ref_counted<AST::Sequence>(
- start_position.with_end(end_position),
- move(nodes),
- move(positions));
- }
- RefPtr<AST::Node> Parser::parse_for_clause()
- {
- // FOR NAME newline+ do_group
- // FOR NAME newline+ IN separator do_group
- // FOR NAME IN separator do_group
- // FOR NAME IN wordlist separator do_group
- if (peek().type != Token::Type::For)
- return nullptr;
- auto start_position = consume().position.value_or(empty_position());
- DeprecatedString name;
- Optional<AST::Position> name_position;
- if (peek().type == Token::Type::VariableName) {
- name_position = peek().position;
- name = consume().value;
- } else {
- name = "it";
- error(peek(), "Expected a variable name, not {}", peek().type_name());
- }
- auto saw_newline = false;
- while (peek().type == Token::Type::Newline) {
- saw_newline = true;
- skip();
- }
- auto saw_in = false;
- Optional<AST::Position> in_kw_position;
- if (peek().type == Token::Type::In) {
- saw_in = true;
- in_kw_position = peek().position;
- skip();
- } else if (!saw_newline) {
- error(peek(), "Expected 'in' or a newline, not {}", peek().type_name());
- }
- RefPtr<AST::Node> iterated_expression;
- if (!saw_newline)
- iterated_expression = parse_word_list();
- if (saw_in) {
- if (peek().type == Token::Type::Semicolon)
- skip();
- else
- error(peek(), "Expected a semicolon, not {}", peek().type_name());
- }
- auto body = parse_do_group();
- return AST::make_ref_counted<AST::ForLoop>(
- start_position.with_end(peek().position.value_or(empty_position())),
- AST::NameWithPosition { move(name), name_position.value_or(empty_position()) },
- Optional<AST::NameWithPosition> {},
- move(iterated_expression),
- move(body),
- move(in_kw_position),
- Optional<AST::Position> {});
- }
- RefPtr<AST::Node> Parser::parse_word_list()
- {
- NonnullRefPtrVector<AST::Node> nodes;
- auto start_position = peek().position.value_or(empty_position());
- for (; peek().type == Token::Type::Word;) {
- auto word = parse_word();
- nodes.append(word.release_nonnull());
- }
- return make_ref_counted<AST::ListConcatenate>(
- start_position.with_end(peek().position.value_or(empty_position())),
- move(nodes));
- }
- RefPtr<AST::Node> Parser::parse_word()
- {
- if (peek().type != Token::Type::Word)
- return nullptr;
- auto token = consume();
- RefPtr<AST::Node> word;
- enum class Quote {
- None,
- Single,
- Double,
- } in_quote { Quote::None };
- auto append_bareword = [&](StringView string) {
- if (!word && string.starts_with('~')) {
- GenericLexer lexer { string };
- lexer.ignore();
- auto user = lexer.consume_while(is_ascii_alphanumeric);
- string = lexer.remaining();
- word = make_ref_counted<AST::Tilde>(token.position.value_or(empty_position()), user);
- }
- if (string.is_empty())
- return;
- auto node = make_ref_counted<AST::BarewordLiteral>(token.position.value_or(empty_position()), string);
- if (word) {
- word = make_ref_counted<AST::Juxtaposition>(
- word->position().with_end(token.position.value_or(empty_position())),
- *word,
- move(node),
- AST::Juxtaposition::Mode::StringExpand);
- } else {
- word = move(node);
- }
- };
- auto append_string_literal = [&](StringView string) {
- if (string.is_empty())
- return;
- auto node = make_ref_counted<AST::StringLiteral>(token.position.value_or(empty_position()), string, AST::StringLiteral::EnclosureType::SingleQuotes);
- if (word) {
- word = make_ref_counted<AST::Juxtaposition>(
- word->position().with_end(token.position.value_or(empty_position())),
- *word,
- move(node),
- AST::Juxtaposition::Mode::StringExpand);
- } else {
- word = move(node);
- }
- };
- auto append_string_part = [&](StringView string) {
- if (string.is_empty())
- return;
- auto node = make_ref_counted<AST::StringLiteral>(token.position.value_or(empty_position()), string, AST::StringLiteral::EnclosureType::DoubleQuotes);
- if (word) {
- word = make_ref_counted<AST::Juxtaposition>(
- word->position().with_end(token.position.value_or(empty_position())),
- *word,
- move(node),
- AST::Juxtaposition::Mode::StringExpand);
- } else {
- word = move(node);
- }
- };
- auto append_parameter_expansion = [&](ResolvedParameterExpansion const& x) {
- DeprecatedString immediate_function_name;
- RefPtr<AST::Node> node;
- switch (x.op) {
- case ResolvedParameterExpansion::Op::UseDefaultValue:
- immediate_function_name = "value_or_default";
- break;
- case ResolvedParameterExpansion::Op::AssignDefaultValue:
- immediate_function_name = "assign_default";
- break;
- case ResolvedParameterExpansion::Op::IndicateErrorIfEmpty:
- immediate_function_name = "error_if_empty";
- break;
- case ResolvedParameterExpansion::Op::UseAlternativeValue:
- immediate_function_name = "null_or_alternative";
- break;
- case ResolvedParameterExpansion::Op::UseDefaultValueIfUnset:
- immediate_function_name = "defined_value_or_default";
- break;
- case ResolvedParameterExpansion::Op::AssignDefaultValueIfUnset:
- immediate_function_name = "assign_defined_default";
- break;
- case ResolvedParameterExpansion::Op::IndicateErrorIfUnset:
- immediate_function_name = "error_if_unset";
- break;
- case ResolvedParameterExpansion::Op::UseAlternativeValueIfUnset:
- immediate_function_name = "null_if_unset_or_alternative";
- break;
- case ResolvedParameterExpansion::Op::RemoveLargestSuffixByPattern:
- // FIXME: Implement this
- case ResolvedParameterExpansion::Op::RemoveSmallestSuffixByPattern:
- immediate_function_name = "remove_suffix";
- break;
- case ResolvedParameterExpansion::Op::RemoveLargestPrefixByPattern:
- // FIXME: Implement this
- case ResolvedParameterExpansion::Op::RemoveSmallestPrefixByPattern:
- immediate_function_name = "remove_prefix";
- break;
- case ResolvedParameterExpansion::Op::StringLength:
- immediate_function_name = "length_of_variable";
- break;
- case ResolvedParameterExpansion::Op::GetPositionalParameter:
- case ResolvedParameterExpansion::Op::GetVariable:
- node = make_ref_counted<AST::SimpleVariable>(
- token.position.value_or(empty_position()),
- x.parameter);
- break;
- case ResolvedParameterExpansion::Op::GetLastBackgroundPid:
- node = make_ref_counted<AST::SyntaxError>(
- token.position.value_or(empty_position()),
- "$! not implemented");
- break;
- case ResolvedParameterExpansion::Op::GetPositionalParameterList:
- node = make_ref_counted<AST::SpecialVariable>(
- token.position.value_or(empty_position()),
- '*');
- break;
- case ResolvedParameterExpansion::Op::GetCurrentOptionFlags:
- node = make_ref_counted<AST::SyntaxError>(
- token.position.value_or(empty_position()),
- "The current option flags are not available in parameter expansions");
- break;
- case ResolvedParameterExpansion::Op::GetPositionalParameterCount:
- node = make_ref_counted<AST::SpecialVariable>(
- token.position.value_or(empty_position()),
- '#');
- break;
- case ResolvedParameterExpansion::Op::GetLastExitStatus:
- node = make_ref_counted<AST::SpecialVariable>(
- token.position.value_or(empty_position()),
- '?');
- break;
- case ResolvedParameterExpansion::Op::GetPositionalParameterListAsString:
- node = make_ref_counted<AST::SyntaxError>(
- token.position.value_or(empty_position()),
- "$* not implemented");
- break;
- case ResolvedParameterExpansion::Op::GetShellProcessId:
- node = make_ref_counted<AST::SpecialVariable>(
- token.position.value_or(empty_position()),
- '$');
- break;
- }
- if (!node) {
- NonnullRefPtrVector<AST::Node> arguments;
- arguments.append(make_ref_counted<AST::BarewordLiteral>(
- token.position.value_or(empty_position()),
- x.parameter));
- if (!x.argument.is_empty()) {
- // dbgln("Will parse {}", x.argument);
- arguments.append(*Parser { x.argument }.parse_word());
- }
- node = make_ref_counted<AST::ImmediateExpression>(
- token.position.value_or(empty_position()),
- AST::NameWithPosition {
- immediate_function_name,
- token.position.value_or(empty_position()),
- },
- move(arguments),
- Optional<AST::Position> {});
- }
- if (x.expand == ResolvedParameterExpansion::Expand::Word) {
- node = make_ref_counted<AST::ImmediateExpression>(
- token.position.value_or(empty_position()),
- AST::NameWithPosition {
- "reexpand",
- token.position.value_or(empty_position()),
- },
- Vector { node.release_nonnull() },
- Optional<AST::Position> {});
- }
- if (word) {
- word = make_ref_counted<AST::Juxtaposition>(
- word->position().with_end(token.position.value_or(empty_position())),
- *word,
- node.release_nonnull(),
- AST::Juxtaposition::Mode::StringExpand);
- } else {
- word = move(node);
- }
- };
- auto append_command_expansion = [&](ResolvedCommandExpansion const& x) {
- if (!x.command)
- return;
- RefPtr<AST::Execute> execute_node;
- if (x.command->is_execute()) {
- execute_node = const_cast<AST::Execute&>(static_cast<AST::Execute const&>(*x.command));
- execute_node->capture_stdout();
- } else {
- execute_node = make_ref_counted<AST::Execute>(
- word ? word->position() : empty_position(),
- *x.command,
- true);
- }
- if (word) {
- word = make_ref_counted<AST::Juxtaposition>(
- word->position(),
- *word,
- execute_node.release_nonnull(),
- AST::Juxtaposition::Mode::StringExpand);
- } else {
- word = move(execute_node);
- }
- };
- auto append_string = [&](StringView string) {
- if (string.is_empty())
- return;
- Optional<size_t> run_start;
- auto escape = false;
- for (size_t i = 0; i < string.length(); ++i) {
- auto ch = string[i];
- switch (ch) {
- case '\\':
- if (!escape && i + 1 < string.length()) {
- if (is_one_of(string[i + 1], '"', '\'', '$', '`', '\\')) {
- escape = in_quote != Quote::Single;
- continue;
- }
- }
- break;
- case '\'':
- if (in_quote == Quote::Single) {
- in_quote = Quote::None;
- append_string_literal(string.substring_view(*run_start, i - *run_start));
- run_start = i + 1;
- continue;
- }
- if (in_quote == Quote::Double) {
- escape = false;
- continue;
- }
- [[fallthrough]];
- case '"':
- if (ch == '\'' && in_quote == Quote::Single) {
- escape = false;
- continue;
- }
- if (!escape) {
- if (ch == '"' && in_quote == Quote::Double) {
- in_quote = Quote::None;
- if (run_start.has_value())
- append_string_part(string.substring_view(*run_start, i - *run_start));
- run_start = i + 1;
- continue;
- }
- if (run_start.has_value())
- append_bareword(string.substring_view(*run_start, i - *run_start));
- in_quote = ch == '\'' ? Quote::Single : Quote::Double;
- run_start = i + 1;
- }
- escape = false;
- [[fallthrough]];
- default:
- if (!run_start.has_value())
- run_start = i;
- escape = false;
- continue;
- }
- }
- if (run_start.has_value())
- append_bareword(string.substring_view(*run_start, string.length() - *run_start));
- };
- size_t current_offset = 0;
- for (auto& expansion : token.resolved_expansions) {
- expansion.visit(
- [&](ResolvedParameterExpansion const& x) {
- if (x.range.start >= token.value.length()) {
- dbgln("Parameter expansion range {}-{} is out of bounds for '{}'", x.range.start, x.range.length, token.value);
- return;
- }
- if (x.range.start != current_offset) {
- append_string(token.value.substring_view(current_offset, x.range.start - current_offset));
- current_offset = x.range.start;
- }
- current_offset += x.range.length;
- append_parameter_expansion(x);
- },
- [&](ResolvedCommandExpansion const& x) {
- if (x.range.start >= token.value.length()) {
- dbgln("Parameter expansion range {}-{} is out of bounds for '{}'", x.range.start, x.range.length, token.value);
- return;
- }
- if (x.range.start != current_offset) {
- append_string(token.value.substring_view(current_offset, x.range.start - current_offset));
- current_offset = x.range.start;
- }
- current_offset += x.range.length;
- append_command_expansion(x);
- });
- }
- if (current_offset >= token.value.length()) {
- dbgln("Parameter expansion range {}- is out of bounds for '{}'", current_offset, token.value);
- return word;
- }
- if (current_offset != token.value.length())
- append_string(token.value.substring_view(current_offset));
- return word;
- }
- RefPtr<AST::Node> Parser::parse_do_group()
- {
- if (peek().type != Token::Type::Do) {
- return make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'do', not {}", peek().type_name()));
- }
- consume();
- auto list = parse_compound_list();
- RefPtr<AST::SyntaxError> error;
- if (peek().type != Token::Type::Done) {
- error = make_ref_counted<AST::SyntaxError>(
- peek().position.value_or(empty_position()),
- DeprecatedString::formatted("Expected 'done', not {}", peek().type_name()));
- } else {
- consume();
- }
- if (error) {
- if (list)
- list->set_is_syntax_error(*error);
- else
- list = error;
- }
- return make_ref_counted<AST::Execute>(list->position(), *list);
- }
- RefPtr<AST::Node> Parser::parse_simple_command()
- {
- auto start_position = peek().position.value_or(empty_position());
- Vector<DeprecatedString> definitions;
- NonnullRefPtrVector<AST::Node> nodes;
- for (;;) {
- if (auto io_redirect = parse_io_redirect())
- nodes.append(*io_redirect);
- else
- break;
- }
- while (peek().type == Token::Type::AssignmentWord) {
- definitions.append(peek().value);
- if (!nodes.is_empty()) {
- nodes.append(
- make_ref_counted<AST::BarewordLiteral>(
- peek().position.value_or(empty_position()),
- consume().value));
- } else {
- // env (assignments) (command)
- nodes.append(make_ref_counted<AST::BarewordLiteral>(
- empty_position(),
- "env"));
- nodes.append(
- make_ref_counted<AST::BarewordLiteral>(
- peek().position.value_or(empty_position()),
- consume().value));
- }
- }
- // WORD or io_redirect: IO_NUMBER or io_file
- if (!is_one_of(peek().type,
- Token::Type::Word, Token::Type::IoNumber,
- Token::Type::Less, Token::Type::LessAnd, Token::Type::Great, Token::Type::GreatAnd,
- Token::Type::DoubleGreat, Token::Type::LessGreat, Token::Type::Clobber)) {
- if (!nodes.is_empty()) {
- Vector<AST::VariableDeclarations::Variable> variables;
- for (auto& definition : definitions) {
- auto parts = definition.split_limit('=', 2, SplitBehavior::KeepEmpty);
- auto name = make_ref_counted<AST::BarewordLiteral>(
- empty_position(),
- parts[0]);
- auto value = make_ref_counted<AST::BarewordLiteral>(
- empty_position(),
- parts.size() > 1 ? parts[1] : "");
- variables.append({ move(name), move(value) });
- }
- return make_ref_counted<AST::VariableDeclarations>(empty_position(), move(variables));
- }
- return nullptr;
- }
- // auto first = true;
- for (;;) {
- if (peek().type == Token::Type::Word) {
- auto new_word = parse_word();
- if (!new_word)
- break;
- // if (first) {
- // first = false;
- // new_word = make_ref_counted<AST::ImmediateExpression>(
- // new_word->position(),
- // AST::NameWithPosition {
- // "substitute_aliases"sv,
- // empty_position(),
- // },
- // NonnullRefPtrVector<AST::Node> { *new_word },
- // Optional<AST::Position> {});
- // }
- nodes.append(new_word.release_nonnull());
- } else if (auto io_redirect = parse_io_redirect()) {
- nodes.append(io_redirect.release_nonnull());
- } else {
- break;
- }
- }
- auto node = make_ref_counted<AST::ListConcatenate>(
- start_position.with_end(peek().position.value_or(empty_position())),
- move(nodes));
- return node;
- }
- RefPtr<AST::Node> Parser::parse_io_redirect()
- {
- auto start_position = peek().position.value_or(empty_position());
- auto start_index = m_token_index;
- // io_redirect: IO_NUMBER? io_file | IO_NUMBER? io_here
- Optional<int> io_number;
- if (peek().type == Token::Type::IoNumber)
- io_number = consume().value.to_int(TrimWhitespace::No);
- if (auto io_file = parse_io_file(start_position, io_number))
- return io_file;
- // if (auto io_here = parse_io_here(start_position, io_number))
- // return io_here;
- m_token_index = start_index;
- return nullptr;
- }
- RefPtr<AST::Node> Parser::parse_io_file(AST::Position start_position, Optional<int> fd)
- {
- auto start_index = m_token_index;
- // io_file = (LESS | LESSAND | GREAT | GREATAND | DGREAT | LESSGREAT | CLOBBER) WORD
- auto io_operator = peek().type;
- if (!is_one_of(io_operator,
- Token::Type::Less, Token::Type::LessAnd, Token::Type::Great, Token::Type::GreatAnd,
- Token::Type::DoubleGreat, Token::Type::LessGreat, Token::Type::Clobber))
- return nullptr;
- auto io_operator_token = consume();
- auto word = parse_word();
- if (!word) {
- m_token_index = start_index;
- return nullptr;
- }
- auto position = start_position.with_end(peek().position.value_or(empty_position()));
- switch (io_operator) {
- case Token::Type::Less:
- return make_ref_counted<AST::ReadRedirection>(
- position,
- fd.value_or(0),
- word.release_nonnull());
- case Token::Type::Clobber:
- // FIXME: Add support for clobber (and 'noclobber')
- case Token::Type::Great:
- return make_ref_counted<AST::WriteRedirection>(
- position,
- fd.value_or(1),
- word.release_nonnull());
- case Token::Type::DoubleGreat:
- return make_ref_counted<AST::WriteAppendRedirection>(
- position,
- fd.value_or(1),
- word.release_nonnull());
- case Token::Type::LessGreat:
- return make_ref_counted<AST::ReadWriteRedirection>(
- position,
- fd.value_or(0),
- word.release_nonnull());
- case Token::Type::LessAnd:
- case Token::Type::GreatAnd: {
- auto is_less = io_operator == Token::Type::LessAnd;
- auto source_fd = fd.value_or(is_less ? 0 : 1);
- if (word->is_bareword()) {
- auto maybe_target_fd = static_ptr_cast<AST::BarewordLiteral>(word)->text().to_int(AK::TrimWhitespace::No);
- if (maybe_target_fd.has_value()) {
- auto target_fd = maybe_target_fd.release_value();
- if (is_less)
- swap(source_fd, target_fd);
- return make_ref_counted<AST::Fd2FdRedirection>(
- position,
- source_fd,
- target_fd);
- }
- }
- if (is_less) {
- return make_ref_counted<AST::ReadRedirection>(
- position,
- source_fd,
- word.release_nonnull());
- }
- return make_ref_counted<AST::WriteRedirection>(
- position,
- source_fd,
- word.release_nonnull());
- }
- default:
- VERIFY_NOT_REACHED();
- }
- }
- }
|