mirror of
https://github.com/RGBCube/serenity
synced 2025-10-24 01:42:35 +00:00

Identifying global variables during parsing will make it possible to generate special optimized instruction to access them in upcoming changes.
359 lines
14 KiB
C++
359 lines
14 KiB
C++
/*
|
|
* Copyright (c) 2020, Stephan Unverwerth <s.unverwerth@serenityos.org>
|
|
* Copyright (c) 2021-2022, David Tuin <davidot@serenityos.org>
|
|
* Copyright (c) 2023, Andreas Kling <kling@serenityos.org>
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
#include <AK/Assertions.h>
|
|
#include <AK/HashTable.h>
|
|
#include <AK/NonnullRefPtr.h>
|
|
#include <AK/StringBuilder.h>
|
|
#include <LibJS/AST.h>
|
|
#include <LibJS/Lexer.h>
|
|
#include <LibJS/ParserError.h>
|
|
#include <LibJS/Runtime/FunctionConstructor.h>
|
|
#include <LibJS/SourceRange.h>
|
|
#include <LibJS/Token.h>
|
|
#include <initializer_list>
|
|
#include <stdio.h>
|
|
|
|
namespace JS {
|
|
|
|
enum class Associativity {
|
|
Left,
|
|
Right
|
|
};
|
|
|
|
struct FunctionNodeParseOptions {
|
|
enum : u16 {
|
|
CheckForFunctionAndName = 1 << 0,
|
|
AllowSuperPropertyLookup = 1 << 1,
|
|
AllowSuperConstructorCall = 1 << 2,
|
|
IsGetterFunction = 1 << 3,
|
|
IsSetterFunction = 1 << 4,
|
|
IsArrowFunction = 1 << 5,
|
|
IsGeneratorFunction = 1 << 6,
|
|
IsAsyncFunction = 1 << 7,
|
|
HasDefaultExportName = 1 << 8,
|
|
};
|
|
};
|
|
|
|
class ScopePusher;
|
|
|
|
class Parser {
|
|
public:
|
|
struct EvalInitialState {
|
|
bool in_eval_function_context { false };
|
|
bool allow_super_property_lookup { false };
|
|
bool allow_super_constructor_call { false };
|
|
bool in_class_field_initializer { false };
|
|
};
|
|
|
|
explicit Parser(Lexer lexer, Program::Type program_type = Program::Type::Script, Optional<EvalInitialState> initial_state_for_eval = {});
|
|
|
|
NonnullRefPtr<Program> parse_program(bool starts_in_strict_mode = false);
|
|
|
|
template<typename FunctionNodeType>
|
|
NonnullRefPtr<FunctionNodeType> parse_function_node(u16 parse_options = FunctionNodeParseOptions::CheckForFunctionAndName, Optional<Position> const& function_start = {});
|
|
Vector<FunctionParameter> parse_formal_parameters(int& function_length, u16 parse_options = 0);
|
|
|
|
enum class AllowDuplicates {
|
|
Yes,
|
|
No
|
|
};
|
|
|
|
enum class AllowMemberExpressions {
|
|
Yes,
|
|
No
|
|
};
|
|
|
|
RefPtr<BindingPattern const> parse_binding_pattern(AllowDuplicates is_var_declaration = AllowDuplicates::No, AllowMemberExpressions allow_member_expressions = AllowMemberExpressions::No);
|
|
|
|
struct PrimaryExpressionParseResult {
|
|
NonnullRefPtr<Expression const> result;
|
|
bool should_continue_parsing_as_expression { true };
|
|
};
|
|
|
|
NonnullRefPtr<Declaration const> parse_declaration();
|
|
|
|
enum class AllowLabelledFunction {
|
|
No,
|
|
Yes
|
|
};
|
|
|
|
NonnullRefPtr<Statement const> parse_statement(AllowLabelledFunction allow_labelled_function = AllowLabelledFunction::No);
|
|
NonnullRefPtr<BlockStatement const> parse_block_statement();
|
|
NonnullRefPtr<FunctionBody const> parse_function_body(Vector<FunctionParameter> const& parameters, FunctionKind function_kind, bool& contains_direct_call_to_eval);
|
|
NonnullRefPtr<ReturnStatement const> parse_return_statement();
|
|
|
|
enum class IsForLoopVariableDeclaration {
|
|
No,
|
|
Yes
|
|
};
|
|
|
|
NonnullRefPtr<VariableDeclaration const> parse_variable_declaration(IsForLoopVariableDeclaration is_for_loop_variable_declaration = IsForLoopVariableDeclaration::No);
|
|
RefPtr<Identifier const> parse_lexical_binding();
|
|
NonnullRefPtr<UsingDeclaration const> parse_using_declaration(IsForLoopVariableDeclaration is_for_loop_variable_declaration = IsForLoopVariableDeclaration::No);
|
|
NonnullRefPtr<Statement const> parse_for_statement();
|
|
|
|
enum class IsForAwaitLoop {
|
|
No,
|
|
Yes
|
|
};
|
|
|
|
struct ForbiddenTokens {
|
|
ForbiddenTokens(std::initializer_list<TokenType> const& forbidden);
|
|
ForbiddenTokens merge(ForbiddenTokens other) const;
|
|
bool allows(TokenType token) const;
|
|
ForbiddenTokens forbid(std::initializer_list<TokenType> const& forbidden) const;
|
|
|
|
private:
|
|
void forbid_tokens(std::initializer_list<TokenType> const& forbidden);
|
|
bool m_forbid_in_token : 1 { false };
|
|
bool m_forbid_logical_tokens : 1 { false };
|
|
bool m_forbid_coalesce_token : 1 { false };
|
|
bool m_forbid_paren_open : 1 { false };
|
|
bool m_forbid_question_mark_period : 1 { false };
|
|
bool m_forbid_equals : 1 { false };
|
|
};
|
|
|
|
struct ExpressionResult {
|
|
template<typename T>
|
|
ExpressionResult(NonnullRefPtr<T const> expression, ForbiddenTokens forbidden = {})
|
|
: expression(move(expression))
|
|
, forbidden(forbidden)
|
|
{
|
|
}
|
|
|
|
template<typename T>
|
|
ExpressionResult(NonnullRefPtr<T> expression, ForbiddenTokens forbidden = {})
|
|
: expression(move(expression))
|
|
, forbidden(forbidden)
|
|
{
|
|
}
|
|
NonnullRefPtr<Expression const> expression;
|
|
ForbiddenTokens forbidden;
|
|
};
|
|
|
|
NonnullRefPtr<Statement const> parse_for_in_of_statement(NonnullRefPtr<ASTNode const> lhs, IsForAwaitLoop is_await);
|
|
NonnullRefPtr<IfStatement const> parse_if_statement();
|
|
NonnullRefPtr<ThrowStatement const> parse_throw_statement();
|
|
NonnullRefPtr<TryStatement const> parse_try_statement();
|
|
NonnullRefPtr<CatchClause const> parse_catch_clause();
|
|
NonnullRefPtr<SwitchStatement const> parse_switch_statement();
|
|
NonnullRefPtr<SwitchCase const> parse_switch_case();
|
|
NonnullRefPtr<BreakStatement const> parse_break_statement();
|
|
NonnullRefPtr<ContinueStatement const> parse_continue_statement();
|
|
NonnullRefPtr<DoWhileStatement const> parse_do_while_statement();
|
|
NonnullRefPtr<WhileStatement const> parse_while_statement();
|
|
NonnullRefPtr<WithStatement const> parse_with_statement();
|
|
NonnullRefPtr<DebuggerStatement const> parse_debugger_statement();
|
|
NonnullRefPtr<ConditionalExpression const> parse_conditional_expression(NonnullRefPtr<Expression const> test, ForbiddenTokens);
|
|
NonnullRefPtr<OptionalChain const> parse_optional_chain(NonnullRefPtr<Expression const> base);
|
|
NonnullRefPtr<Expression const> parse_expression(int min_precedence, Associativity associate = Associativity::Right, ForbiddenTokens forbidden = {});
|
|
PrimaryExpressionParseResult parse_primary_expression();
|
|
NonnullRefPtr<Expression const> parse_unary_prefixed_expression();
|
|
NonnullRefPtr<RegExpLiteral const> parse_regexp_literal();
|
|
NonnullRefPtr<ObjectExpression const> parse_object_expression();
|
|
NonnullRefPtr<ArrayExpression const> parse_array_expression();
|
|
|
|
enum class StringLiteralType {
|
|
Normal,
|
|
NonTaggedTemplate,
|
|
TaggedTemplate
|
|
};
|
|
|
|
NonnullRefPtr<StringLiteral const> parse_string_literal(Token const& token, StringLiteralType string_literal_type = StringLiteralType::Normal, bool* contains_invalid_escape = nullptr);
|
|
NonnullRefPtr<TemplateLiteral const> parse_template_literal(bool is_tagged);
|
|
ExpressionResult parse_secondary_expression(NonnullRefPtr<Expression const>, int min_precedence, Associativity associate = Associativity::Right, ForbiddenTokens forbidden = {});
|
|
NonnullRefPtr<Expression const> parse_call_expression(NonnullRefPtr<Expression const>);
|
|
NonnullRefPtr<NewExpression const> parse_new_expression();
|
|
NonnullRefPtr<ClassDeclaration const> parse_class_declaration();
|
|
NonnullRefPtr<ClassExpression const> parse_class_expression(bool expect_class_name);
|
|
NonnullRefPtr<YieldExpression const> parse_yield_expression();
|
|
NonnullRefPtr<AwaitExpression const> parse_await_expression();
|
|
NonnullRefPtr<Expression const> parse_property_key();
|
|
NonnullRefPtr<AssignmentExpression const> parse_assignment_expression(AssignmentOp, NonnullRefPtr<Expression const> lhs, int min_precedence, Associativity, ForbiddenTokens forbidden = {});
|
|
NonnullRefPtr<Identifier const> parse_identifier();
|
|
NonnullRefPtr<ImportStatement const> parse_import_statement(Program& program);
|
|
NonnullRefPtr<ExportStatement const> parse_export_statement(Program& program);
|
|
|
|
RefPtr<FunctionExpression const> try_parse_arrow_function_expression(bool expect_parens, bool is_async = false);
|
|
RefPtr<LabelledStatement const> try_parse_labelled_statement(AllowLabelledFunction allow_function);
|
|
RefPtr<MetaProperty const> try_parse_new_target_expression();
|
|
RefPtr<MetaProperty const> try_parse_import_meta_expression();
|
|
NonnullRefPtr<ImportCall const> parse_import_call();
|
|
|
|
Vector<CallExpression::Argument> parse_arguments();
|
|
|
|
bool has_errors() const { return m_state.errors.size(); }
|
|
Vector<ParserError> const& errors() const { return m_state.errors; }
|
|
void print_errors(bool print_hint = true) const
|
|
{
|
|
for (auto& error : m_state.errors) {
|
|
if (print_hint) {
|
|
auto hint = error.source_location_hint(m_state.lexer.source());
|
|
if (!hint.is_empty())
|
|
warnln("{}", hint);
|
|
}
|
|
warnln("SyntaxError: {}", error.to_deprecated_string());
|
|
}
|
|
}
|
|
|
|
struct TokenMemoization {
|
|
bool try_parse_arrow_function_expression_failed;
|
|
};
|
|
|
|
// Needs to mess with m_state, and we're not going to expose a non-const getter for that :^)
|
|
friend ThrowCompletionOr<ECMAScriptFunctionObject*> FunctionConstructor::create_dynamic_function(VM&, FunctionObject&, FunctionObject*, FunctionKind, MarkedVector<Value> const&);
|
|
|
|
static Parser parse_function_body_from_string(DeprecatedString const& body_string, u16 parse_options, Vector<FunctionParameter> const& parameters, FunctionKind kind, bool& contains_direct_call_to_eval);
|
|
|
|
private:
|
|
friend class ScopePusher;
|
|
|
|
void parse_script(Program& program, bool starts_in_strict_mode);
|
|
void parse_module(Program& program);
|
|
|
|
Associativity operator_associativity(TokenType) const;
|
|
bool match_expression() const;
|
|
bool match_unary_prefixed_expression() const;
|
|
bool match_secondary_expression(ForbiddenTokens forbidden = {}) const;
|
|
bool match_statement() const;
|
|
bool match_export_or_import() const;
|
|
bool match_assert_clause() const;
|
|
|
|
enum class AllowUsingDeclaration {
|
|
No,
|
|
Yes
|
|
};
|
|
|
|
bool match_declaration(AllowUsingDeclaration allow_using = AllowUsingDeclaration::No) const;
|
|
bool try_match_let_declaration() const;
|
|
bool try_match_using_declaration() const;
|
|
bool match_variable_declaration() const;
|
|
bool match_identifier() const;
|
|
bool token_is_identifier(Token const&) const;
|
|
bool match_identifier_name() const;
|
|
bool match_property_key() const;
|
|
bool is_private_identifier_valid() const;
|
|
bool match(TokenType type) const;
|
|
bool done() const;
|
|
void expected(char const* what);
|
|
void syntax_error(DeprecatedString const& message, Optional<Position> = {});
|
|
Token consume();
|
|
Token consume_and_allow_division();
|
|
Token consume_identifier();
|
|
Token consume_identifier_reference();
|
|
Token consume(TokenType type);
|
|
Token consume_and_validate_numeric_literal();
|
|
void consume_or_insert_semicolon();
|
|
void save_state();
|
|
void load_state();
|
|
void discard_saved_state();
|
|
Position position() const;
|
|
|
|
RefPtr<BindingPattern const> synthesize_binding_pattern(Expression const& expression);
|
|
|
|
Token next_token(size_t steps = 1) const;
|
|
|
|
void check_identifier_name_for_assignment_validity(DeprecatedFlyString const&, bool force_strict = false);
|
|
|
|
bool try_parse_arrow_function_expression_failed_at_position(Position const&) const;
|
|
void set_try_parse_arrow_function_expression_failed_at_position(Position const&, bool);
|
|
|
|
bool match_invalid_escaped_keyword() const;
|
|
|
|
bool parse_directive(ScopeNode& body);
|
|
void parse_statement_list(ScopeNode& output_node, AllowLabelledFunction allow_labelled_functions = AllowLabelledFunction::No);
|
|
|
|
DeprecatedFlyString consume_string_value();
|
|
ModuleRequest parse_module_request();
|
|
|
|
struct RulePosition {
|
|
AK_MAKE_NONCOPYABLE(RulePosition);
|
|
AK_MAKE_NONMOVABLE(RulePosition);
|
|
|
|
public:
|
|
RulePosition(Parser& parser, Position position)
|
|
: m_parser(parser)
|
|
, m_position(position)
|
|
{
|
|
m_parser.m_rule_starts.append(position);
|
|
}
|
|
|
|
~RulePosition()
|
|
{
|
|
auto last = m_parser.m_rule_starts.take_last();
|
|
VERIFY(last.line == m_position.line);
|
|
VERIFY(last.column == m_position.column);
|
|
}
|
|
|
|
Position const& position() const { return m_position; }
|
|
|
|
private:
|
|
Parser& m_parser;
|
|
Position m_position;
|
|
};
|
|
|
|
[[nodiscard]] RulePosition push_start() { return { *this, position() }; }
|
|
|
|
struct ParserState {
|
|
Lexer lexer;
|
|
Token current_token;
|
|
Vector<ParserError> errors;
|
|
ScopePusher* current_scope_pusher { nullptr };
|
|
|
|
HashMap<StringView, Optional<Position>> labels_in_scope;
|
|
HashMap<size_t, Position> invalid_property_range_in_object_expression;
|
|
HashTable<StringView>* referenced_private_names { nullptr };
|
|
|
|
bool strict_mode { false };
|
|
bool allow_super_property_lookup { false };
|
|
bool allow_super_constructor_call { false };
|
|
bool in_function_context { false };
|
|
bool initiated_by_eval { false };
|
|
bool in_eval_function_context { false }; // This controls if we allow new.target or not. Note that eval("return") is not allowed, so we have to have a separate state variable for eval.
|
|
bool in_formal_parameter_context { false };
|
|
bool in_catch_parameter_context { false };
|
|
bool in_generator_function_context { false };
|
|
bool await_expression_is_valid { false };
|
|
bool in_arrow_function_context { false };
|
|
bool in_break_context { false };
|
|
bool in_continue_context { false };
|
|
bool string_legacy_octal_escape_sequence_in_scope { false };
|
|
bool in_class_field_initializer { false };
|
|
bool in_class_static_init_block { false };
|
|
bool function_might_need_arguments_object { false };
|
|
|
|
ParserState(Lexer, Program::Type);
|
|
};
|
|
|
|
class PositionKeyTraits {
|
|
public:
|
|
static int hash(Position const& position)
|
|
{
|
|
return int_hash(position.line) ^ int_hash(position.column);
|
|
}
|
|
|
|
static bool equals(Position const& a, Position const& b)
|
|
{
|
|
return a.column == b.column && a.line == b.line;
|
|
}
|
|
};
|
|
|
|
NonnullRefPtr<Identifier const> create_identifier_and_register_in_current_scope(SourceRange range, DeprecatedFlyString string);
|
|
|
|
NonnullRefPtr<SourceCode const> m_source_code;
|
|
Vector<Position> m_rule_starts;
|
|
ParserState m_state;
|
|
DeprecatedFlyString m_filename;
|
|
Vector<ParserState> m_saved_state;
|
|
HashMap<Position, TokenMemoization, PositionKeyTraits> m_token_memoizations;
|
|
Program::Type m_program_type;
|
|
};
|
|
}
|