From 6b30c4d2f0a98a904e2cdddddd41637546a3216c Mon Sep 17 00:00:00 2001
From: Dan Klishch <danilklishch@gmail.com>
Date: Wed, 17 Jan 2024 01:36:39 -0500
Subject: [PATCH] JSSpecCompiler: Issue meaningful errors in TextParser

---
 .../JSSpecCompiler/Parser/SpecParser.cpp      |  60 ++++--
 .../JSSpecCompiler/Parser/SpecParser.h        |   4 +-
 .../JSSpecCompiler/Parser/TextParser.cpp      | 204 ++++++++++++------
 .../JSSpecCompiler/Parser/TextParser.h        |  72 ++++---
 .../JSSpecCompiler/Parser/Token.h             |  79 +++----
 5 files changed, 272 insertions(+), 147 deletions(-)
diff --git a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.cpp b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.cpp
index 663d9ecb59..c2061d9033 100644
--- a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.cpp
+++ b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.cpp
@@ -86,24 +86,29 @@ Optional<AlgorithmStep> AlgorithmStep::create(SpecificationParsingContext& ctx,
         result.m_substeps = step_list.has_value() ? step_list->tree() : error_tree;
     }
 
-    auto parse_result = result.parse();
-    if (parse_result.is_error()) {
-        ctx.diag().error(ctx.location_from_xml_offset(parse_result.error()->offset()),
-            "{}", parse_result.error()->to_string());
+    if (!result.parse())
         return {};
-    }
-    result.m_expression = parse_result.release_value();
     return result;
 }
 
-ParseErrorOr<Tree> AlgorithmStep::parse()
+bool AlgorithmStep::parse()
 {
-    TextParser parser(m_tokens, m_node);
+    TextParser parser(m_ctx, m_tokens, m_node);
 
+    TextParseErrorOr<Tree> parse_result = TextParseError {};
     if (m_substeps)
-        return parser.parse_step_with_substeps(RefPtr(m_substeps).release_nonnull());
+        parse_result = parser.parse_step_with_substeps(RefPtr(m_substeps).release_nonnull());
     else
-        return parser.parse_step_without_substeps();
+        parse_result = parser.parse_step_without_substeps();
+
+    if (parse_result.is_error()) {
+        auto [location, message] = parser.get_diagnostic();
+        m_ctx.diag().error(location, "{}", message);
+        return false;
+    } else {
+        m_expression = parse_result.release_value();
+        return true;
+    }
 }
 
 Optional<AlgorithmStepList> AlgorithmStepList::create(SpecificationParsingContext& ctx, XML::Node const* element)
@@ -250,12 +255,26 @@ void SpecificationClause::collect_into(TranslationUnitRef translation_unit)
         subclause->collect_into(translation_unit);
 }
 
-ParseErrorOr<void> SpecificationClause::parse_header(XML::Node const* element)
+Optional<FailedTextParseDiagnostic> SpecificationClause::parse_header(XML::Node const* element)
 {
+    auto& ctx = *m_ctx_pointer;
     VERIFY(element->as_element().name == tag_h1);
-    auto tokens = TRY(tokenize_tree(*m_ctx_pointer, element));
-    TextParser parser(tokens.tokens, element);
-    m_header = TRY(parser.parse_clause_header());
+
+    auto tokenization_result = tokenize_tree(ctx, element, false);
+    if (tokenization_result.is_error()) {
+        return FailedTextParseDiagnostic {
+            ctx.location_from_xml_offset(tokenization_result.error()->offset()),
+            tokenization_result.error()->to_string()
+        };
+    }
+    auto const& tokens = tokenization_result.release_value().tokens;
+
+    TextParser parser(ctx, tokens, element);
+    auto parse_result = parser.parse_clause_header();
+    if (parse_result.is_error())
+        return parser.get_diagnostic();
+
+    m_header = parse_result.value();
     return {};
 }
 
@@ -264,7 +283,7 @@ void SpecificationClause::parse(XML::Node const* element)
     auto& ctx = context();
     u32 child_index = 0;
 
-    Optional<NonnullRefPtr<ParseError>> header_parse_error;
+    Optional<FailedTextParseDiagnostic> header_parse_error;
 
     for (auto const& child : element->as_element().children) {
         child->content.visit(
@@ -275,10 +294,8 @@ void SpecificationClause::parse(XML::Node const* element)
                             "<h1> must be the first child of <emu-clause>");
                         return;
                     }
-
-                    if (auto error = parse_header(child); error.is_error())
-                        header_parse_error = error.release_error();
-                    else
+                    header_parse_error = parse_header(child);
+                    if (!header_parse_error.has_value())
                         ctx.current_logical_scope().section = MUST(String::from_utf8(m_header.section_number));
                 } else {
                     if (element.name == tag_h1) {
@@ -294,10 +311,7 @@ void SpecificationClause::parse(XML::Node const* element)
                     if (header_parse_error.has_value()) {
                         ctx.diag().warn(ctx.location_from_xml_offset(child->offset),
                             "node content will be ignored since section header was not parsed successfully");
-                        // TODO: Integrate backtracing parser errors better
-                        ctx.diag().note(ctx.location_from_xml_offset(header_parse_error.value()->offset()),
-                            "{}", header_parse_error.value()->to_string());
-                        header_parse_error.clear();
+                        ctx.diag().note(header_parse_error->location, "{}", header_parse_error->message);
                     }
                 }
                 ++child_index;
diff --git a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.h b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.h
index d613cc25ea..c5802630ca 100644
--- a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.h
+++ b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/SpecParser.h
@@ -70,7 +70,7 @@ private:
     {
     }
 
-    ParseErrorOr<Tree> parse();
+    bool parse();
 
     SpecificationParsingContext& m_ctx;
     Vector<Token> m_tokens;
@@ -113,7 +113,7 @@ private:
     {
     }
 
-    ParseErrorOr<void> parse_header(XML::Node const* element);
+    Optional<FailedTextParseDiagnostic> parse_header(XML::Node const* element);
     void parse(XML::Node const* element);
 
     SpecificationParsingContext* m_ctx_pointer;
diff --git a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.cpp b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.cpp
index 21ae23e8f7..c70ad98af1 100644
--- a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.cpp
+++ b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.cpp
@@ -6,10 +6,21 @@
 
 #include <AK/ScopeGuard.h>
 
+#include "Parser/SpecParser.h"
 #include "Parser/TextParser.h"
 
 namespace JSSpecCompiler {
 
+void TextParser::save_error(Variant<TokenType, StringView, CustomMessage>&& expected)
+{
+    if (m_max_parsed_tokens > m_next_token_index)
+        return;
+    if (m_max_parsed_tokens < m_next_token_index)
+        m_suitable_continuations.clear();
+    m_max_parsed_tokens = m_next_token_index;
+    m_suitable_continuations.append(move(expected));
+}
+
 void TextParser::retreat()
 {
     --m_next_token_index;
@@ -24,48 +35,69 @@ auto TextParser::rollback_point()
     };
 }
 
-ParseErrorOr<Token const*> TextParser::peek_token()
+Optional<Token> TextParser::peek_token()
 {
     if (m_next_token_index == m_tokens.size())
-        return ParseError::create("Expected token but found EOF"sv, m_node);
-    return &m_tokens[m_next_token_index];
+        return {};
+    return m_tokens[m_next_token_index];
 }
 
-ParseErrorOr<Token const*> TextParser::consume_token()
+Optional<Token> TextParser::consume_token()
 {
     auto result = peek_token();
-    if (!result.is_error())
+    if (result.has_value())
         ++m_next_token_index;
     return result;
 }
 
-ParseErrorOr<Token const*> TextParser::consume_token_with_one_of_types(std::initializer_list<TokenType> types)
+TextParseErrorOr<Token> TextParser::consume_token_with_one_of_types(std::initializer_list<TokenType> types)
 {
-    auto token = TRY(consume_token());
-    for (TokenType type : types)
-        if (token->type == type)
-            return token;
-    retreat();
+    auto token = peek_token();
+    if (token.has_value()) {
+        for (TokenType type : types) {
+            if (token->type == type) {
+                (void)consume_token();
+                return *token;
+            } else {
+                save_error(type);
+            }
+        }
+    } else {
+        for (TokenType type : types)
+            save_error(type);
+    }
 
-    return ParseError::create(String::formatted("Unexpected token type {}", token->name()), token->node);
+    return TextParseError {};
 }
 
-ParseErrorOr<Token const*> TextParser::consume_token_with_type(TokenType type)
+TextParseErrorOr<Token> TextParser::consume_token_with_type(TokenType type)
 {
     return consume_token_with_one_of_types({ type });
 }
 
-ParseErrorOr<void> TextParser::consume_word(StringView word)
+TextParseErrorOr<void> TextParser::consume_token(TokenType type, StringView data)
 {
-    auto token = TRY(consume_token_with_type(TokenType::Word));
-    if (!token->data.equals_ignoring_ascii_case(word)) {
+    auto token = consume_token();
+    if (!token.has_value() || token->type != type || !token->data.equals_ignoring_ascii_case(data)) {
         retreat();
-        return ParseError::create("Unexpected word"sv, token->node);
+        save_error(data);
+        return TextParseError {};
     }
     return {};
 }
 
-ParseErrorOr<void> TextParser::consume_words(std::initializer_list<StringView> words)
+TextParseErrorOr<void> TextParser::consume_word(StringView word)
+{
+    auto token = consume_token();
+    if (!token.has_value() || token->type != TokenType::Word || !token->data.equals_ignoring_ascii_case(word)) {
+        retreat();
+        save_error(word);
+        return TextParseError {};
+    }
+    return {};
+}
+
+TextParseErrorOr<void> TextParser::consume_words(std::initializer_list<StringView> words)
 {
     for (auto word : words)
         TRY(consume_word(word));
@@ -77,14 +109,17 @@ bool TextParser::is_eof() const
     return m_next_token_index == m_tokens.size();
 }
 
-ParseErrorOr<void> TextParser::expect_eof() const
+TextParseErrorOr<void> TextParser::expect_eof()
 {
-    if (!is_eof())
-        return ParseError::create("Expected EOF"sv, m_node);
+    if (!is_eof()) {
+        save_error(CustomMessage { "EOF"sv });
+        return TextParseError {};
+    }
     return {};
 }
 
-ParseErrorOr<Tree> TextParser::parse_record_direct_list_initialization()
+// (the)? <record_name> { (<name>: <value>,)* }
+TextParseErrorOr<Tree> TextParser::parse_record_direct_list_initialization()
 {
     auto rollback = rollback_point();
 
@@ -96,36 +131,37 @@ ParseErrorOr<Tree> TextParser::parse_record_direct_list_initialization()
     while (true) {
         auto name = TRY(consume_token_with_one_of_types({ TokenType::Identifier, TokenType::BraceClose }));
 
-        if (name->is_bracket()) {
+        if (name.is_bracket()) {
             break;
         } else {
             TRY(consume_token_with_type(TokenType::Colon));
             auto value = TRY(parse_expression());
             (void)consume_token_with_type(TokenType::Comma);
-            arguments.append({ make_ref_counted<UnresolvedReference>(name->data), value });
+            arguments.append({ make_ref_counted<UnresolvedReference>(name.data), value });
         }
     }
 
     rollback.disarm();
     return make_ref_counted<RecordDirectListInitialization>(
-        make_ref_counted<UnresolvedReference>(identifier->data), move(arguments));
+        make_ref_counted<UnresolvedReference>(identifier.data), move(arguments));
 }
 
 // <expr>
-ParseErrorOr<Tree> TextParser::parse_expression()
+TextParseErrorOr<Tree> TextParser::parse_expression()
 {
     auto rollback = rollback_point();
 
-    // (the)? <record_name> { (<name>: <value>,)* }
     if (auto record_init = parse_record_direct_list_initialization(); !record_init.is_error()) {
         rollback.disarm();
         return record_init.release_value();
     }
 
-#define THROW_PARSE_ERROR_IF(expr)                                      \
-    do {                                                                \
-        if (expr)                                                       \
-            return ParseError::create("Expected expression"sv, m_node); \
+#define THROW_PARSE_ERROR_IF(expr)                                                                           \
+    do {                                                                                                     \
+        if (expr) {                                                                                          \
+            save_error(CustomMessage { "valid expression continuation (not valid because " #expr ")"##sv }); \
+            return TextParseError {};                                                                        \
+        }                                                                                                    \
     } while (false)
 #define THROW_PARSE_ERROR THROW_PARSE_ERROR_IF(true)
 
@@ -183,9 +219,9 @@ ParseErrorOr<Tree> TextParser::parse_expression()
 
     while (true) {
         auto token_or_error = peek_token();
-        if (token_or_error.is_error())
+        if (!token_or_error.has_value())
             break;
-        auto token = *token_or_error.release_value();
+        auto token = token_or_error.release_value();
 
         enum {
             NoneType,
@@ -274,7 +310,7 @@ ParseErrorOr<Tree> TextParser::parse_expression()
             merge_pre_merged();
         }
 
-        MUST(consume_token());
+        VERIFY(consume_token().has_value());
     }
 
     THROW_PARSE_ERROR_IF(stack.is_empty());
@@ -288,7 +324,7 @@ ParseErrorOr<Tree> TextParser::parse_expression()
 }
 
 // <condition> :== <expr> | (<expr> is <expr> (or <expr>)?)
-ParseErrorOr<Tree> TextParser::parse_condition()
+TextParseErrorOr<Tree> TextParser::parse_condition()
 {
     auto rollback = rollback_point();
     auto expression = TRY(parse_expression());
@@ -307,7 +343,7 @@ ParseErrorOr<Tree> TextParser::parse_condition()
 }
 
 // return <expr>
-ParseErrorOr<Tree> TextParser::parse_return_statement()
+TextParseErrorOr<Tree> TextParser::parse_return_statement()
 {
     auto rollback = rollback_point();
 
@@ -319,15 +355,11 @@ ParseErrorOr<Tree> TextParser::parse_return_statement()
 }
 
 // assert: <condition>
-ParseErrorOr<Tree> TextParser::parse_assert()
+TextParseErrorOr<Tree> TextParser::parse_assert()
 {
     auto rollback = rollback_point();
 
-    auto identifier = TRY(consume_token_with_type(TokenType::Identifier))->data;
-    if (!identifier.equals_ignoring_ascii_case("assert"sv)) {
-        return ParseError::create("Expected identifier \"Assert\""sv, m_node);
-    }
-
+    TRY(consume_token(TokenType::Identifier, "assert"sv));
     TRY(consume_token_with_type(TokenType::Colon));
     auto condition = TRY(parse_condition());
 
@@ -336,7 +368,7 @@ ParseErrorOr<Tree> TextParser::parse_assert()
 }
 
 // (let <expr> be <expr>) | (set <expr> to <expr>)
-ParseErrorOr<Tree> TextParser::parse_assignment()
+TextParseErrorOr<Tree> TextParser::parse_assignment()
 {
     auto rollback = rollback_point();
 
@@ -353,7 +385,7 @@ ParseErrorOr<Tree> TextParser::parse_assignment()
 }
 
 // <simple_step>
-ParseErrorOr<Tree> TextParser::parse_simple_step_or_inline_if_branch()
+TextParseErrorOr<Tree> TextParser::parse_simple_step_or_inline_if_branch()
 {
     auto rollback = rollback_point();
 
@@ -382,11 +414,11 @@ ParseErrorOr<Tree> TextParser::parse_simple_step_or_inline_if_branch()
         return result.release_value();
     }
 
-    return ParseError::create("Unable to parse simple step or inline if branch"sv, m_node);
+    return TextParseError {};
 }
 
 // <if_condition> :== (If <condition>) | (Else) | (Else if <condition>),
-ParseErrorOr<TextParser::IfConditionParseResult> TextParser::parse_if_beginning()
+TextParseErrorOr<TextParser::IfConditionParseResult> TextParser::parse_if_beginning()
 {
     auto rollback = rollback_point();
 
@@ -406,7 +438,7 @@ ParseErrorOr<TextParser::IfConditionParseResult> TextParser::parse_if_beginning(
 }
 
 // <inline_if> :== <if_condition> <simple_step>.$
-ParseErrorOr<Tree> TextParser::parse_inline_if_else()
+TextParseErrorOr<Tree> TextParser::parse_inline_if_else()
 {
     auto rollback = rollback_point();
 
@@ -420,7 +452,7 @@ ParseErrorOr<Tree> TextParser::parse_inline_if_else()
 }
 
 // <if> :== <if_condition> then$ <substeps>
-ParseErrorOr<Tree> TextParser::parse_if(Tree then_branch)
+TextParseErrorOr<Tree> TextParser::parse_if(Tree then_branch)
 {
     auto rollback = rollback_point();
 
@@ -436,7 +468,7 @@ ParseErrorOr<Tree> TextParser::parse_if(Tree then_branch)
 }
 
 // <else> :== Else,$ <substeps>
-ParseErrorOr<Tree> TextParser::parse_else(Tree else_branch)
+TextParseErrorOr<Tree> TextParser::parse_else(Tree else_branch)
 {
     auto rollback = rollback_point();
 
@@ -449,7 +481,7 @@ ParseErrorOr<Tree> TextParser::parse_else(Tree else_branch)
 }
 
 // <simple_step> | <inline_if>
-ParseErrorOr<Tree> TextParser::parse_step_without_substeps()
+TextParseErrorOr<Tree> TextParser::parse_step_without_substeps()
 {
     auto rollback = rollback_point();
 
@@ -465,11 +497,11 @@ ParseErrorOr<Tree> TextParser::parse_step_without_substeps()
         return result.release_value();
     }
 
-    return ParseError::create("Unable to parse step without substeps"sv, m_node);
+    return TextParseError {};
 }
 
 // <if> | <else>
-ParseErrorOr<Tree> TextParser::parse_step_with_substeps(Tree substeps)
+TextParseErrorOr<Tree> TextParser::parse_step_with_substeps(Tree substeps)
 {
     auto rollback = rollback_point();
 
@@ -485,32 +517,32 @@ ParseErrorOr<Tree> TextParser::parse_step_with_substeps(Tree substeps)
         return result.release_value();
     }
 
-    return ParseError::create("Unable to parse step with substeps"sv, m_node);
+    return TextParseError {};
 }
 
-ParseErrorOr<ClauseHeader> TextParser::parse_clause_header()
+TextParseErrorOr<ClauseHeader> TextParser::parse_clause_header()
 {
     ClauseHeader result;
 
     auto section_number_token = TRY(consume_token_with_type(TokenType::SectionNumber));
-    result.section_number = section_number_token->data;
+    result.section_number = section_number_token.data;
 
     ClauseHeader::FunctionDefinition function_definition;
 
-    function_definition.name = TRY(consume_token())->data;
+    function_definition.name = TRY(consume_token_with_type(TokenType::Word)).data;
 
     TRY(consume_token_with_type(TokenType::ParenOpen));
     while (true) {
         if (function_definition.arguments.is_empty()) {
             auto argument = TRY(consume_token_with_one_of_types({ TokenType::ParenClose, TokenType::Identifier }));
-            if (argument->type == TokenType::ParenClose)
+            if (argument.type == TokenType::ParenClose)
                 break;
-            function_definition.arguments.append({ argument->data });
+            function_definition.arguments.append({ argument.data });
         } else {
-            function_definition.arguments.append({ TRY(consume_token_with_type(TokenType::Identifier))->data });
+            function_definition.arguments.append({ TRY(consume_token_with_type(TokenType::Identifier)).data });
         }
         auto next_token = TRY(consume_token_with_one_of_types({ TokenType::ParenClose, TokenType::Comma }));
-        if (next_token->type == TokenType::ParenClose)
+        if (next_token.type == TokenType::ParenClose)
             break;
     }
     TRY(expect_eof());
@@ -520,4 +552,56 @@ ParseErrorOr<ClauseHeader> TextParser::parse_clause_header()
     return result;
 }
 
+FailedTextParseDiagnostic TextParser::get_diagnostic() const
+{
+    StringBuilder message;
+
+    message.append("unexpected "sv);
+
+    if (m_max_parsed_tokens == m_tokens.size()) {
+        message.append("EOF"sv);
+    } else {
+        auto token = m_tokens[m_max_parsed_tokens];
+        if (token.type == TokenType::Word)
+            message.appendff("'{}'", token.data);
+        else if (token.type == TokenType::Identifier)
+            message.appendff("identifier '{}'", token.data);
+        else
+            message.append(token.name_for_diagnostic());
+    }
+
+    message.appendff(", expected ");
+
+    size_t size = m_suitable_continuations.size();
+    VERIFY(size > 0);
+
+    for (size_t i = 0; i < size; ++i) {
+        m_suitable_continuations[i].visit(
+            [&](TokenType type) { message.append(token_info[to_underlying(type)].name_for_diagnostic); },
+            [&](StringView word) { message.appendff("'{}'", word); },
+            [&](CustomMessage continuation) { message.append(continuation.message); });
+
+        if (i + 1 != size) {
+            if (size == 2)
+                message.append(" or "sv);
+            else if (i + 2 == size)
+                message.append(", or "sv);
+            else
+                message.append(", "sv);
+        }
+    }
+
+    Location location = Location::global_scope();
+
+    if (m_max_parsed_tokens < m_tokens.size()) {
+        location = m_tokens[m_max_parsed_tokens].location;
+    } else {
+        // FIXME: Would be nice to point to the closing tag not the opening one. This is also the
+        //        only place where we use m_location.
+        location = m_ctx.location_from_xml_offset(m_node->offset);
+    }
+
+    return { location, MUST(message.to_string()) };
+}
+
 }
diff --git a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.h b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.h
index 627f9f353d..0e7c7756dd 100644
--- a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.h
+++ b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/TextParser.h
@@ -23,17 +23,30 @@ struct ClauseHeader {
     Variant<AK::Empty, FunctionDefinition> header;
 };
 
+struct TextParseError { };
+
+struct FailedTextParseDiagnostic {
+    Location location;
+    String message;
+};
+
+template<typename T>
+using TextParseErrorOr = ErrorOr<T, TextParseError>;
+
 class TextParser {
 public:
-    TextParser(Vector<Token>& tokens_, XML::Node const* node_)
-        : m_tokens(tokens_)
-        , m_node(node_)
+    TextParser(SpecificationParsingContext& ctx, Vector<Token> const& tokens, XML::Node const* node)
+        : m_ctx(ctx)
+        , m_tokens(tokens)
+        , m_node(node)
     {
     }
 
-    ParseErrorOr<ClauseHeader> parse_clause_header();
-    ParseErrorOr<Tree> parse_step_without_substeps();
-    ParseErrorOr<Tree> parse_step_with_substeps(Tree substeps);
+    TextParseErrorOr<ClauseHeader> parse_clause_header();
+    TextParseErrorOr<Tree> parse_step_without_substeps();
+    TextParseErrorOr<Tree> parse_step_with_substeps(Tree substeps);
+
+    FailedTextParseDiagnostic get_diagnostic() const;
 
 private:
     struct IfConditionParseResult {
@@ -41,32 +54,43 @@ private:
         NullableTree condition;
     };
 
+    struct CustomMessage {
+        StringView message;
+    };
+
+    void save_error(Variant<TokenType, StringView, CustomMessage>&& expected);
+
     void retreat();
     [[nodiscard]] auto rollback_point();
-    ParseErrorOr<Token const*> peek_token();
-    ParseErrorOr<Token const*> consume_token();
-    ParseErrorOr<Token const*> consume_token_with_one_of_types(std::initializer_list<TokenType> types);
-    ParseErrorOr<Token const*> consume_token_with_type(TokenType type);
-    ParseErrorOr<void> consume_word(StringView word);
-    ParseErrorOr<void> consume_words(std::initializer_list<StringView> words);
+    Optional<Token> peek_token();
+    Optional<Token> consume_token();
+    TextParseErrorOr<Token> consume_token_with_one_of_types(std::initializer_list<TokenType> types);
+    TextParseErrorOr<Token> consume_token_with_type(TokenType type);
+    TextParseErrorOr<void> consume_token(TokenType type, StringView data);
+    TextParseErrorOr<void> consume_word(StringView word);
+    TextParseErrorOr<void> consume_words(std::initializer_list<StringView> words);
     bool is_eof() const;
-    ParseErrorOr<void> expect_eof() const;
+    TextParseErrorOr<void> expect_eof();
 
-    ParseErrorOr<Tree> parse_record_direct_list_initialization();
-    ParseErrorOr<Tree> parse_expression();
-    ParseErrorOr<Tree> parse_condition();
-    ParseErrorOr<Tree> parse_return_statement();
-    ParseErrorOr<Tree> parse_assert();
-    ParseErrorOr<Tree> parse_assignment();
-    ParseErrorOr<Tree> parse_simple_step_or_inline_if_branch();
-    ParseErrorOr<IfConditionParseResult> parse_if_beginning();
-    ParseErrorOr<Tree> parse_inline_if_else();
-    ParseErrorOr<Tree> parse_if(Tree then_branch);
-    ParseErrorOr<Tree> parse_else(Tree else_branch);
+    TextParseErrorOr<Tree> parse_record_direct_list_initialization();
+    TextParseErrorOr<Tree> parse_expression();
+    TextParseErrorOr<Tree> parse_condition();
+    TextParseErrorOr<Tree> parse_return_statement();
+    TextParseErrorOr<Tree> parse_assert();
+    TextParseErrorOr<Tree> parse_assignment();
+    TextParseErrorOr<Tree> parse_simple_step_or_inline_if_branch();
+    TextParseErrorOr<IfConditionParseResult> parse_if_beginning();
+    TextParseErrorOr<Tree> parse_inline_if_else();
+    TextParseErrorOr<Tree> parse_if(Tree then_branch);
+    TextParseErrorOr<Tree> parse_else(Tree else_branch);
 
+    SpecificationParsingContext& m_ctx;
     Vector<Token> const& m_tokens;
     size_t m_next_token_index = 0;
     XML::Node const* m_node;
+
+    size_t m_max_parsed_tokens = 0;
+    Vector<Variant<TokenType, StringView, CustomMessage>, 8> m_suitable_continuations;
 };
 
 }
diff --git a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/Token.h b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/Token.h
index e968079b4c..2f11167039 100644
--- a/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/Token.h
+++ b/Meta/Lagom/Tools/CodeGenerators/JSSpecCompiler/Parser/Token.h
@@ -20,38 +20,38 @@ constexpr i32 closing_bracket_precedence = 18;
 
 // NOTE: Operator precedence is generally the same as in
 //       https://en.cppreference.com/w/cpp/language/operator_precedence (common sense applies).
-#define ENUMERATE_TOKENS(F)                                   \
-    F(Invalid, -1, Invalid, Invalid, Invalid)                 \
-    F(SectionNumber, -1, Invalid, Invalid, Invalid)           \
-    F(Identifier, -1, Invalid, Invalid, Invalid)              \
-    F(Number, -1, Invalid, Invalid, Invalid)                  \
-    F(String, -1, Invalid, Invalid, Invalid)                  \
-    F(Undefined, -1, Invalid, Invalid, Invalid)               \
-    F(Word, -1, Invalid, Invalid, Invalid)                    \
-    F(ParenOpen, -1, Invalid, Invalid, ParenClose)            \
-    F(ParenClose, 18, Invalid, Invalid, ParenOpen)            \
-    F(BraceOpen, -1, Invalid, Invalid, BraceClose)            \
-    F(BraceClose, 18, Invalid, Invalid, BraceOpen)            \
-    F(Comma, 17, Invalid, Comma, Invalid)                     \
-    F(MemberAccess, 2, Invalid, MemberAccess, Invalid)        \
-    F(Dot, -1, Invalid, Invalid, Invalid)                     \
-    F(Colon, -1, Invalid, Invalid, Invalid)                   \
-    F(Less, 9, Invalid, CompareLess, Invalid)                 \
-    F(Greater, 9, Invalid, CompareGreater, Invalid)           \
-    F(NotEquals, 10, Invalid, CompareNotEqual, Invalid)       \
-    F(Equals, 10, Invalid, CompareEqual, Invalid)             \
-    F(Plus, 6, Invalid, Plus, Invalid)                        \
-    F(AmbiguousMinus, -2, Invalid, Invalid, Invalid)          \
-    F(UnaryMinus, 3, Minus, Invalid, Invalid)                 \
-    F(BinaryMinus, 6, Invalid, Minus, Invalid)                \
-    F(Multiplication, 5, Invalid, Multiplication, Invalid)    \
-    F(Division, 5, Invalid, Division, Invalid)                \
-    F(FunctionCall, 2, Invalid, FunctionCall, Invalid)        \
-    F(ExclamationMark, 3, AssertCompletion, Invalid, Invalid) \
-    F(Is, -1, Invalid, Invalid, Invalid)
+#define ENUMERATE_TOKENS(F)                                                          \
+    F(Invalid, -1, Invalid, Invalid, Invalid, "")                                    \
+    F(SectionNumber, -1, Invalid, Invalid, Invalid, "section number")                \
+    F(Identifier, -1, Invalid, Invalid, Invalid, "identifier")                       \
+    F(Number, -1, Invalid, Invalid, Invalid, "number")                               \
+    F(String, -1, Invalid, Invalid, Invalid, "string literal")                       \
+    F(Undefined, -1, Invalid, Invalid, Invalid, "constant")                          \
+    F(Word, -1, Invalid, Invalid, Invalid, "word")                                   \
+    F(ParenOpen, -1, Invalid, Invalid, ParenClose, "'('")                            \
+    F(ParenClose, 18, Invalid, Invalid, ParenOpen, "')'")                            \
+    F(BraceOpen, -1, Invalid, Invalid, BraceClose, "'{'")                            \
+    F(BraceClose, 18, Invalid, Invalid, BraceOpen, "'}'")                            \
+    F(Comma, 17, Invalid, Comma, Invalid, "','")                                     \
+    F(MemberAccess, 2, Invalid, MemberAccess, Invalid, "member access operator '.'") \
+    F(Dot, -1, Invalid, Invalid, Invalid, "punctuation mark '.'")                    \
+    F(Colon, -1, Invalid, Invalid, Invalid, "':'")                                   \
+    F(Less, 9, Invalid, CompareLess, Invalid, "less than")                           \
+    F(Greater, 9, Invalid, CompareGreater, Invalid, "greater than")                  \
+    F(NotEquals, 10, Invalid, CompareNotEqual, Invalid, "not equals")                \
+    F(Equals, 10, Invalid, CompareEqual, Invalid, "equals")                          \
+    F(Plus, 6, Invalid, Plus, Invalid, "plus")                                       \
+    F(AmbiguousMinus, -2, Invalid, Invalid, Invalid, "minus")                        \
+    F(UnaryMinus, 3, Minus, Invalid, Invalid, "unary minus")                         \
+    F(BinaryMinus, 6, Invalid, Minus, Invalid, "binary minus")                       \
+    F(Multiplication, 5, Invalid, Multiplication, Invalid, "multiplication")         \
+    F(Division, 5, Invalid, Division, Invalid, "division")                           \
+    F(FunctionCall, 2, Invalid, FunctionCall, Invalid, "function call token")        \
+    F(ExclamationMark, 3, AssertCompletion, Invalid, Invalid, "exclamation mark")    \
+    F(Is, -1, Invalid, Invalid, Invalid, "operator is")
 
 enum class TokenType {
-#define ID(name, precedence, unary_name, binary_name, matching_bracket) name,
+#define ID(name, precedence, unary_name, binary_name, matching_bracket, name_for_diagnostic) name,
     ENUMERATE_TOKENS(ID)
 #undef ID
 };
@@ -62,14 +62,16 @@ constexpr struct TokenInfo {
     UnaryOperator as_unary_operator;
     BinaryOperator as_binary_operator;
     TokenType matching_bracket;
+    StringView name_for_diagnostic;
 } token_info[] = {
-#define TOKEN_INFO(name, precedence, unary_name, binary_name, matching_bracket) \
-    {                                                                           \
-        #name##sv,                                                              \
-        precedence,                                                             \
-        UnaryOperator::unary_name,                                              \
-        BinaryOperator::binary_name,                                            \
-        TokenType::matching_bracket,                                            \
+#define TOKEN_INFO(name, precedence, unary_name, binary_name, matching_bracket, name_for_diagnostic) \
+    {                                                                                                \
+        #name##sv,                                                                                   \
+        precedence,                                                                                  \
+        UnaryOperator::unary_name,                                                                   \
+        BinaryOperator::binary_name,                                                                 \
+        TokenType::matching_bracket,                                                                 \
+        name_for_diagnostic##sv                                                                      \
     },
     ENUMERATE_TOKENS(TOKEN_INFO)
 #undef TOKEN_INFO
@@ -78,7 +80,8 @@ constexpr struct TokenInfo {
 struct Token {
     TokenInfo const& info() const { return token_info[to_underlying(type)]; }
 
-    StringView name() const { return token_info[to_underlying(type)].name; }
+    StringView name() const { return info().name; }
+    StringView name_for_diagnostic() const { return info().name_for_diagnostic; }
     i32 precedence() const { return info().precedence; }
     bool is_operator() const { return precedence() > 0 && precedence() < closing_bracket_precedence; }
     bool is_ambiguous_operator() const { return precedence() == ambiguous_operator_precedence; }