/* * Copyright (c) 2020, Stephan Unverwerth * Copyright (c) 2021-2022, David Tuin * * SPDX-License-Identifier: BSD-2-Clause */ #pragma once #include #include #include #include #include #include #include #include #include #include #include namespace JS { enum class Associativity { Left, Right }; struct FunctionNodeParseOptions { enum { CheckForFunctionAndName = 1 << 0, AllowSuperPropertyLookup = 1 << 1, AllowSuperConstructorCall = 1 << 2, IsGetterFunction = 1 << 3, IsSetterFunction = 1 << 4, IsArrowFunction = 1 << 5, IsGeneratorFunction = 1 << 6, IsAsyncFunction = 1 << 7, }; }; class ScopePusher; class Parser { public: struct EvalInitialState { bool in_eval_function_context { false }; bool allow_super_property_lookup { false }; bool allow_super_constructor_call { false }; bool in_class_field_initializer { false }; }; explicit Parser(Lexer lexer, Program::Type program_type = Program::Type::Script, Optional initial_state_for_eval = {}); NonnullRefPtr parse_program(bool starts_in_strict_mode = false); template NonnullRefPtr parse_function_node(u8 parse_options = FunctionNodeParseOptions::CheckForFunctionAndName, Optional const& function_start = {}); Vector parse_formal_parameters(int& function_length, u8 parse_options = 0); enum class AllowDuplicates { Yes, No }; enum class AllowMemberExpressions { Yes, No }; RefPtr parse_binding_pattern(AllowDuplicates is_var_declaration = AllowDuplicates::No, AllowMemberExpressions allow_member_expressions = AllowMemberExpressions::No); struct PrimaryExpressionParseResult { NonnullRefPtr result; bool should_continue_parsing_as_expression { true }; }; NonnullRefPtr parse_declaration(); enum class AllowLabelledFunction { No, Yes }; NonnullRefPtr parse_statement(AllowLabelledFunction allow_labelled_function = AllowLabelledFunction::No); NonnullRefPtr parse_block_statement(); NonnullRefPtr parse_function_body(Vector const& parameters, FunctionKind function_kind, bool& contains_direct_call_to_eval); NonnullRefPtr parse_return_statement(); NonnullRefPtr parse_variable_declaration(bool for_loop_variable_declaration = false); NonnullRefPtr parse_for_statement(); enum class IsForAwaitLoop { No, Yes }; struct ForbiddenTokens { ForbiddenTokens(std::initializer_list const& forbidden); ForbiddenTokens merge(ForbiddenTokens other) const; bool allows(TokenType token) const; ForbiddenTokens forbid(std::initializer_list const& forbidden) const; private: void forbid_tokens(std::initializer_list const& forbidden); bool m_forbid_in_token : 1 { false }; bool m_forbid_logical_tokens : 1 { false }; bool m_forbid_coalesce_token : 1 { false }; bool m_forbid_paren_open : 1 { false }; bool m_forbid_question_mark_period : 1 { false }; bool m_forbid_equals : 1 { false }; }; struct ExpressionResult { template ExpressionResult(NonnullRefPtr expression, ForbiddenTokens forbidden = {}) : expression(expression) , forbidden(forbidden) { } NonnullRefPtr expression; ForbiddenTokens forbidden; }; NonnullRefPtr parse_for_in_of_statement(NonnullRefPtr lhs, IsForAwaitLoop is_await); NonnullRefPtr parse_if_statement(); NonnullRefPtr parse_throw_statement(); NonnullRefPtr parse_try_statement(); NonnullRefPtr parse_catch_clause(); NonnullRefPtr parse_switch_statement(); NonnullRefPtr parse_switch_case(); NonnullRefPtr parse_break_statement(); NonnullRefPtr parse_continue_statement(); NonnullRefPtr parse_do_while_statement(); NonnullRefPtr parse_while_statement(); NonnullRefPtr parse_with_statement(); NonnullRefPtr parse_debugger_statement(); NonnullRefPtr parse_conditional_expression(NonnullRefPtr test, ForbiddenTokens); NonnullRefPtr parse_optional_chain(NonnullRefPtr base); NonnullRefPtr parse_expression(int min_precedence, Associativity associate = Associativity::Right, ForbiddenTokens forbidden = {}); PrimaryExpressionParseResult parse_primary_expression(); NonnullRefPtr parse_unary_prefixed_expression(); NonnullRefPtr parse_regexp_literal(); NonnullRefPtr parse_object_expression(); NonnullRefPtr parse_array_expression(); NonnullRefPtr parse_string_literal(Token const& token, bool in_template_literal = false); NonnullRefPtr parse_template_literal(bool is_tagged); ExpressionResult parse_secondary_expression(NonnullRefPtr, int min_precedence, Associativity associate = Associativity::Right, ForbiddenTokens forbidden = {}); NonnullRefPtr parse_call_expression(NonnullRefPtr); NonnullRefPtr parse_new_expression(); NonnullRefPtr parse_class_declaration(); NonnullRefPtr parse_class_expression(bool expect_class_name); NonnullRefPtr parse_yield_expression(); NonnullRefPtr parse_await_expression(); NonnullRefPtr parse_property_key(); NonnullRefPtr parse_assignment_expression(AssignmentOp, NonnullRefPtr lhs, int min_precedence, Associativity, ForbiddenTokens forbidden = {}); NonnullRefPtr parse_identifier(); NonnullRefPtr parse_import_statement(Program& program); NonnullRefPtr parse_export_statement(Program& program); RefPtr try_parse_arrow_function_expression(bool expect_parens, bool is_async = false); RefPtr try_parse_labelled_statement(AllowLabelledFunction allow_function); RefPtr try_parse_new_target_expression(); RefPtr try_parse_import_meta_expression(); NonnullRefPtr parse_import_call(); Vector parse_arguments(); struct Error { String message; Optional position; String to_string() const { if (!position.has_value()) return message; return String::formatted("{} (line: {}, column: {})", message, position.value().line, position.value().column); } String source_location_hint(StringView source, char const spacer = ' ', char const indicator = '^') const { if (!position.has_value()) return {}; // We need to modify the source to match what the lexer considers one line - normalizing // line terminators to \n is easier than splitting using all different LT characters. String source_string = source.replace("\r\n"sv, "\n"sv, ReplaceMode::All).replace("\r"sv, "\n"sv, ReplaceMode::All).replace(LINE_SEPARATOR_STRING, "\n"sv, ReplaceMode::All).replace(PARAGRAPH_SEPARATOR_STRING, "\n"sv, ReplaceMode::All); StringBuilder builder; builder.append(source_string.split_view('\n', true)[position.value().line - 1]); builder.append('\n'); for (size_t i = 0; i < position.value().column - 1; ++i) builder.append(spacer); builder.append(indicator); return builder.build(); } }; bool has_errors() const { return m_state.errors.size(); } Vector const& errors() const { return m_state.errors; } void print_errors(bool print_hint = true) const { for (auto& error : m_state.errors) { if (print_hint) { auto hint = error.source_location_hint(m_state.lexer.source()); if (!hint.is_empty()) warnln("{}", hint); } warnln("SyntaxError: {}", error.to_string()); } } struct TokenMemoization { bool try_parse_arrow_function_expression_failed; }; // Needs to mess with m_state, and we're not going to expose a non-const getter for that :^) friend ThrowCompletionOr FunctionConstructor::create_dynamic_function(GlobalObject&, FunctionObject&, FunctionObject*, FunctionKind, MarkedVector const&); private: friend class ScopePusher; void parse_script(Program& program, bool starts_in_strict_mode); void parse_module(Program& program); Associativity operator_associativity(TokenType) const; bool match_expression() const; bool match_unary_prefixed_expression() const; bool match_secondary_expression(ForbiddenTokens forbidden = {}) const; bool match_statement() const; bool match_export_or_import() const; bool match_assert_clause() const; bool match_declaration() const; bool try_match_let_declaration() const; bool match_variable_declaration() const; bool match_identifier() const; bool match_identifier_name() const; bool match_property_key() const; bool is_private_identifier_valid() const; bool match(TokenType type) const; bool done() const; void expected(char const* what); void syntax_error(String const& message, Optional = {}); Token consume(); Token consume_identifier(); Token consume_identifier_reference(); Token consume(TokenType type); Token consume_and_validate_numeric_literal(); void consume_or_insert_semicolon(); void save_state(); void load_state(); void discard_saved_state(); Position position() const; RefPtr synthesize_binding_pattern(Expression const& expression); Token next_token(size_t steps = 1) const; void check_identifier_name_for_assignment_validity(FlyString const&, bool force_strict = false); bool try_parse_arrow_function_expression_failed_at_position(Position const&) const; void set_try_parse_arrow_function_expression_failed_at_position(Position const&, bool); bool match_invalid_escaped_keyword() const; bool parse_directive(ScopeNode& body); void parse_statement_list(ScopeNode& output_node, AllowLabelledFunction allow_labelled_functions = AllowLabelledFunction::No); FlyString consume_string_value(); ModuleRequest parse_module_request(); struct RulePosition { AK_MAKE_NONCOPYABLE(RulePosition); AK_MAKE_NONMOVABLE(RulePosition); public: RulePosition(Parser& parser, Position position) : m_parser(parser) , m_position(position) { m_parser.m_rule_starts.append(position); } ~RulePosition() { auto last = m_parser.m_rule_starts.take_last(); VERIFY(last.line == m_position.line); VERIFY(last.column == m_position.column); } Position const& position() const { return m_position; } private: Parser& m_parser; Position m_position; }; [[nodiscard]] RulePosition push_start() { return { *this, position() }; } struct ParserState { Lexer lexer; Token current_token; Vector errors; ScopePusher* current_scope_pusher { nullptr }; HashMap> labels_in_scope; HashTable* referenced_private_names { nullptr }; bool strict_mode { false }; bool allow_super_property_lookup { false }; bool allow_super_constructor_call { false }; bool in_function_context { false }; bool in_eval_function_context { false }; // This controls if we allow new.target or not. Note that eval("return") is not allowed, so we have to have a separate state variable for eval. bool in_formal_parameter_context { false }; bool in_generator_function_context { false }; bool await_expression_is_valid { false }; bool in_arrow_function_context { false }; bool in_break_context { false }; bool in_continue_context { false }; bool string_legacy_octal_escape_sequence_in_scope { false }; bool in_class_field_initializer { false }; bool in_class_static_init_block { false }; bool function_might_need_arguments_object { false }; ParserState(Lexer, Program::Type); }; class PositionKeyTraits { public: static int hash(Position const& position) { return int_hash(position.line) ^ int_hash(position.column); } static bool equals(Position const& a, Position const& b) { return a.column == b.column && a.line == b.line; } }; Vector m_rule_starts; ParserState m_state; FlyString m_filename; Vector m_saved_state; HashMap m_token_memoizations; Program::Type m_program_type; }; }