/* * Copyright (c) 2020, Stephan Unverwerth * * SPDX-License-Identifier: BSD-2-Clause */ #pragma once #include #include #include #include #include #include #include namespace JS { enum class Associativity { Left, Right }; struct FunctionNodeParseOptions { enum { CheckForFunctionAndName = 1 << 0, AllowSuperPropertyLookup = 1 << 1, AllowSuperConstructorCall = 1 << 2, IsGetterFunction = 1 << 3, IsSetterFunction = 1 << 4, IsArrowFunction = 1 << 5, IsGeneratorFunction = 1 << 6, }; }; class Parser { public: explicit Parser(Lexer lexer, Program::Type program_type = Program::Type::Script); NonnullRefPtr parse_program(bool starts_in_strict_mode = false); template NonnullRefPtr parse_function_node(u8 parse_options = FunctionNodeParseOptions::CheckForFunctionAndName); Vector parse_formal_parameters(int& function_length, u8 parse_options = 0); RefPtr parse_binding_pattern(bool strict_checks = false); struct PrimaryExpressionParseResult { NonnullRefPtr result; bool should_continue_parsing_as_expression { true }; }; NonnullRefPtr parse_declaration(); enum class AllowLabelledFunction { No, Yes }; NonnullRefPtr parse_statement(AllowLabelledFunction allow_labelled_function = AllowLabelledFunction::No); NonnullRefPtr parse_block_statement(); NonnullRefPtr parse_block_statement(bool& is_strict, bool function_with_non_simple_parameter_list = false); NonnullRefPtr parse_return_statement(); NonnullRefPtr parse_variable_declaration(bool for_loop_variable_declaration = false); NonnullRefPtr parse_for_statement(); NonnullRefPtr parse_for_in_of_statement(NonnullRefPtr lhs); NonnullRefPtr parse_if_statement(); NonnullRefPtr parse_throw_statement(); NonnullRefPtr parse_try_statement(); NonnullRefPtr parse_catch_clause(); NonnullRefPtr parse_switch_statement(); NonnullRefPtr parse_switch_case(); NonnullRefPtr parse_break_statement(); NonnullRefPtr parse_continue_statement(); NonnullRefPtr parse_do_while_statement(); NonnullRefPtr parse_while_statement(); NonnullRefPtr parse_with_statement(); NonnullRefPtr parse_debugger_statement(); NonnullRefPtr parse_conditional_expression(NonnullRefPtr test); NonnullRefPtr parse_expression(int min_precedence, Associativity associate = Associativity::Right, const Vector& forbidden = {}); PrimaryExpressionParseResult parse_primary_expression(); NonnullRefPtr parse_unary_prefixed_expression(); NonnullRefPtr parse_regexp_literal(); NonnullRefPtr parse_object_expression(); NonnullRefPtr parse_array_expression(); NonnullRefPtr parse_string_literal(const Token& token, bool in_template_literal = false); NonnullRefPtr parse_template_literal(bool is_tagged); NonnullRefPtr parse_secondary_expression(NonnullRefPtr, int min_precedence, Associativity associate = Associativity::Right); NonnullRefPtr parse_call_expression(NonnullRefPtr); NonnullRefPtr parse_new_expression(); NonnullRefPtr parse_class_declaration(); NonnullRefPtr parse_class_expression(bool expect_class_name); NonnullRefPtr parse_yield_expression(); NonnullRefPtr parse_property_key(); NonnullRefPtr parse_assignment_expression(AssignmentOp, NonnullRefPtr lhs, int min_precedence, Associativity); NonnullRefPtr parse_identifier(); NonnullRefPtr parse_import_statement(Program& program); NonnullRefPtr parse_export_statement(Program& program); RefPtr try_parse_arrow_function_expression(bool expect_parens); RefPtr try_parse_labelled_statement(AllowLabelledFunction allow_function); RefPtr try_parse_new_target_expression(); struct Error { String message; Optional position; String to_string() const { if (!position.has_value()) return message; return String::formatted("{} (line: {}, column: {})", message, position.value().line, position.value().column); } String source_location_hint(const StringView& source, const char spacer = ' ', const char indicator = '^') const { if (!position.has_value()) return {}; // We need to modify the source to match what the lexer considers one line - normalizing // line terminators to \n is easier than splitting using all different LT characters. String source_string { source }; source_string.replace("\r\n", "\n"); source_string.replace("\r", "\n"); source_string.replace(LINE_SEPARATOR_STRING, "\n"); source_string.replace(PARAGRAPH_SEPARATOR_STRING, "\n"); StringBuilder builder; builder.append(source_string.split_view('\n', true)[position.value().line - 1]); builder.append('\n'); for (size_t i = 0; i < position.value().column - 1; ++i) builder.append(spacer); builder.append(indicator); return builder.build(); } }; bool has_errors() const { return m_state.errors.size(); } const Vector& errors() const { return m_state.errors; } void print_errors(bool print_hint = true) const { for (auto& error : m_state.errors) { if (print_hint) { auto hint = error.source_location_hint(m_state.lexer.source()); if (!hint.is_empty()) warnln("{}", hint); } warnln("SyntaxError: {}", error.to_string()); } } struct TokenMemoization { bool try_parse_arrow_function_expression_failed; }; private: friend class ScopePusher; Associativity operator_associativity(TokenType) const; bool match_expression() const; bool match_unary_prefixed_expression() const; bool match_secondary_expression(const Vector& forbidden = {}) const; bool match_statement() const; bool match_export_or_import() const; bool match_declaration(); bool try_match_let_declaration(); bool match_variable_declaration(); bool match_identifier() const; bool match_identifier_name() const; bool match_property_key() const; bool match(TokenType type) const; bool done() const; void expected(const char* what); void syntax_error(const String& message, Optional = {}); Token consume(); Token consume_identifier(); Token consume_identifier_reference(); Token consume(TokenType type); Token consume_and_validate_numeric_literal(); void consume_or_insert_semicolon(); void save_state(); void load_state(); void discard_saved_state(); Position position() const; Token next_token(); void check_identifier_name_for_assignment_validity(StringView, bool force_strict = false); bool try_parse_arrow_function_expression_failed_at_position(const Position&) const; void set_try_parse_arrow_function_expression_failed_at_position(const Position&, bool); struct RulePosition { AK_MAKE_NONCOPYABLE(RulePosition); AK_MAKE_NONMOVABLE(RulePosition); public: RulePosition(Parser& parser, Position position) : m_parser(parser) , m_position(position) { m_parser.m_rule_starts.append(position); } ~RulePosition() { auto last = m_parser.m_rule_starts.take_last(); VERIFY(last.line == m_position.line); VERIFY(last.column == m_position.column); } const Position& position() const { return m_position; } private: Parser& m_parser; Position m_position; }; [[nodiscard]] RulePosition push_start() { return { *this, position() }; } struct Scope : public RefCounted { enum Type { Function, Block, }; struct HoistableDeclaration { NonnullRefPtr declaration; NonnullRefPtr scope; // where it is actually declared }; Type type; RefPtr parent; NonnullRefPtrVector function_declarations; Vector hoisted_function_declarations; HashTable lexical_declarations; explicit Scope(Type, RefPtr); RefPtr get_current_function_scope(); }; struct ParserState { Lexer lexer; Token current_token; Vector errors; Vector> var_scopes; Vector> let_scopes; RefPtr current_scope; Vector&> function_parameters; HashMap labels_in_scope; bool strict_mode { false }; bool allow_super_property_lookup { false }; bool allow_super_constructor_call { false }; bool in_function_context { false }; bool in_formal_parameter_context { false }; bool in_generator_function_context { false }; bool in_arrow_function_context { false }; bool in_break_context { false }; bool in_continue_context { false }; bool string_legacy_octal_escape_sequence_in_scope { false }; bool in_class_field_initializer { false }; ParserState(Lexer, Program::Type); }; class PositionKeyTraits { public: static int hash(const Position& position) { return int_hash(position.line) ^ int_hash(position.column); } static bool equals(const Position& a, const Position& b) { return a.column == b.column && a.line == b.line; } }; Vector m_rule_starts; ParserState m_state; FlyString m_filename; Vector m_saved_state; HashMap m_token_memoizations; Program::Type m_program_type; }; }