Add more grammar rules to the parser

Add a parser combinator to parse a delimited list
make parse_success always skip past trivia in the tokenlist
2025-04-01 23:43:05 +02:00 · 2025-04-01 23:39:48 +02:00 · 2025-04-01 23:39:01 +02:00 · 2025-04-01 23:36:08 +02:00 · 2025-04-01 23:22:29 +02:00 · 2025-04-01 22:09:36 +02:00
15 changed files with 92 additions and 411 deletions
@@ -1,55 +0,0 @@
-# Linker file format
-
-```C
-
-struct object_file {
-    uint64_t    magic;   // ".oo-bin"
-    uint64_t    version; // 1
-    uint64_t    architecture; // AMD64(0)
-    uint64_t    offsets_offset;
-
-    struct offsets {
-        uint64_t strings;
-        uint64_t sections;
-        uint64_t symbols;
-        uint64_t relocations;
-    } offsets;
-
-    struct string_table {
-        uint64_t size;
-        uint8_t data[static size];
-    } strings;
-
-    struct section_table {
-        uint32_t count;
-        struct section_entry {
-            uint32_t name;
-            uint64_t offset;
-            uint64_t size_on_disk;
-            uint64_t size_in_memory;
-            uint64_t flags;
-        } sections[static count];
-    } sections;
-
-    struct symbol_table {
-        uint32_t count;
-        struct symbol_entry {
-            uint32_t name;
-            uint8_t  kind;  // IMPORT(0) | EXPORT(1) | LOCAL(2)
-            uint32_t section;
-            uint64_t offset;
-        } symbols[static count];
-    } symbols;
-
-    struct relocation_table {
-        uint32_t count;
-        struct relocation_entry {
-            uint32_t section;
-            uint64_t offset;
-            uint8_t  size;
-            uint32_t symbol;
-            uint8_t  kind;  // ABSOLUTE(0) | RELATIVE(1)
-        } relocations[static count];
-    } relocations;
-};
-```
@@ -1,6 +1,5 @@
 #include "ast.h"
 #include "error.h"
-#include <assert.h>
 #include <string.h>

 error_t *err_node_children_cap = &(error_t){
@@ -84,104 +83,3 @@ error_t *ast_node_add_child(ast_node_t *node, ast_node_t *child) {

    return nullptr;
 }
-
-const char *ast_node_id_to_cstr(node_id_t id) {
-    switch (id) {
-    case NODE_INVALID:
-        return "NODE_INVALID";
-    case NODE_PROGRAM:
-        return "NODE_PROGRAM";
-    case NODE_STATEMENT:
-        return "NODE_STATEMENT";
-    case NODE_LABEL:
-        return "NODE_LABEL";
-    case NODE_DIRECTIVE:
-        return "NODE_DIRECTIVE";
-    case NODE_INSTRUCTION:
-        return "NODE_INSTRUCTION";
-    case NODE_OPERANDS:
-        return "NODE_OPERANDS";
-    case NODE_OPERAND:
-        return "NODE_OPERAND";
-    case NODE_IMMEDIATE:
-        return "NODE_IMMEDIATE";
-    case NODE_MEMORY:
-        return "NODE_MEMORY";
-    case NODE_NUMBER:
-        return "NODE_NUMBER";
-    case NODE_LABEL_REFERENCE:
-        return "NODE_LABEL_REFERENCE";
-    case NODE_MEMORY_EXPRESSION:
-        return "NODE_MEMORY_EXPRESSION";
-    case NODE_REGISTER_EXPRESSION:
-        return "NODE_REGISTER_EXPRESSION";
-    case NODE_REGISTER_INDEX:
-        return "NODE_REGISTER_INDEX";
-    case NODE_REGISTER_OFFSET:
-        return "NODE_REGISTER_OFFSET";
-    case NODE_PLUS_OR_MINUS:
-        return "NODE_PLUS_OR_MINUS";
-    case NODE_SECTION_DIRECTIVE:
-        return "NODE_SECTION_DIRECTIVE";
-    case NODE_REGISTER:
-        return "NODE_REGISTER";
-    case NODE_SECTION:
-        return "NODE_SECTION";
-    case NODE_IDENTIFIER:
-        return "NODE_IDENTIFIER";
-    case NODE_DECIMAL:
-        return "NODE_DECIMAL";
-    case NODE_HEXADECIMAL:
-        return "NODE_HEXADECIMAL";
-    case NODE_OCTAL:
-        return "NODE_OCTAL";
-    case NODE_BINARY:
-        return "NODE_BINARY";
-    case NODE_CHAR:
-        return "NODE_CHAR";
-    case NODE_STRING:
-        return "NODE_STRING";
-    case NODE_COLON:
-        return "NODE_COLON";
-    case NODE_COMMA:
-        return "NODE_COMMA";
-    case NODE_LBRACKET:
-        return "NODE_LBRACKET";
-    case NODE_RBRACKET:
-        return "NODE_RBRACKET";
-    case NODE_PLUS:
-        return "NODE_PLUS";
-    case NODE_MINUS:
-        return "NODE_MINUS";
-    case NODE_ASTERISK:
-        return "NODE_ASTERISK";
-    case NODE_DOT:
-        return "NODE_DOT";
-    }
-    assert(!"Unreachable, weird node id" && id);
-    __builtin_unreachable();
-}
-
-static void ast_node_print_internal(ast_node_t *node, int indent) {
-    if (node == NULL) {
-        return;
-    }
-
-    for (int i = 0; i < indent; i++) {
-        printf("  ");
-    }
-    printf("%s", ast_node_id_to_cstr(node->id));
-
-    if (node->token_entry && node->token_entry->token.value) {
-        printf(" \"%s\"", node->token_entry->token.value);
-    }
-    printf("\n");
-
-    for (size_t i = 0; i < node->len; i++) {
-        ast_node_print_internal(node->children[i], indent + 1);
-    }
-}
-
-void ast_node_print(ast_node_t *node) {
-    ast_node_print_internal(node, 0);
-}
@@ -106,15 +106,4 @@ void ast_node_free(ast_node_t *node);
 */
 error_t *ast_node_add_child(ast_node_t *node, ast_node_t *child);

-/**
- * @brief Prints an AST starting from the given node
- *
- * Prints a representation of the AST with indentation to show structure.
- * Each node's type is shown, and if a node has an associated token value,
- * that value is printed in quotes.
- *
- * @param node The root node of the AST to print
- */
-void ast_node_print(ast_node_t *node);
-
 #endif // INCLUDE_SRC_AST_H_
@@ -1,6 +1,6 @@
 #include "error.h"
 #include "lexer.h"
-#include "parser/parser.h"
+#include "parser.h"
 #include "tokenlist.h"

 #include <limits.h>
@@ -32,20 +32,13 @@ void print_text(tokenlist_t *list) {
    }
 }

-void print_ast(tokenlist_t *list) {
+void parse_ast(tokenlist_t *list) {
    parse_result_t result = parse(list->head);
    if (result.err) {
        puts(result.err->message);
        error_free(result.err);
        return;
    }
-    ast_node_print(result.node);
-
-    if (result.next != nullptr) {
-        puts("First unparsed token:");
-        lexer_token_print(&result.next->token);
-    }
-
    ast_node_free(result.node);
 }

@@ -89,7 +82,7 @@ int main(int argc, char *argv[]) {
        print_text(list);
        break;
    case MODE_AST:
-        print_ast(list);
+        parse_ast(list);
        break;
    }

@@ -0,0 +1,53 @@
+#include "parser.h"
+#include "ast.h"
+#include "lexer.h"
+#include "parser_combinators.h"
+#include "parser_primitives.h"
+#include "parser_util.h"
+#include "tokenlist.h"
+
+parse_result_t parse_number(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_octal, parse_decimal, parse_hexadecimal,
+                          parse_binary, nullptr};
+    return parse_any(current, parsers);
+}
+
+parse_result_t parse_operand(tokenlist_entry_t *current) {
+    // FIXME: not the correct set of parsers
+    parser_t parsers[] = {parse_register, parse_number, nullptr};
+    return parse_any(current, parsers);
+}
+
+parse_result_t parse_operands(tokenlist_entry_t *current) {
+    return parse_list(current, NODE_OPERANDS, true, TOKEN_COMMA, parse_operand);
+}
+
+parse_result_t parse_label(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_identifier, parse_colon, nullptr};
+    return parse_consecutive(current, NODE_LABEL, parsers);
+}
+
+parse_result_t parse_section_directive(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_section, parse_identifier, nullptr};
+    return parse_consecutive(current, NODE_SECTION_DIRECTIVE, parsers);
+}
+
+parse_result_t parse_directive(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_dot, parse_section_directive, nullptr};
+    return parse_consecutive(current, NODE_LABEL, parsers);
+}
+
+parse_result_t parse_instruction(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_identifier, parse_operands, nullptr};
+    return parse_consecutive(current, NODE_INSTRUCTION, parsers);
+}
+
+parse_result_t parse_statement(tokenlist_entry_t *current) {
+    parser_t parsers[] = {parse_label, parse_directive, parse_instruction,
+                          nullptr};
+    return parse_any(current, parsers);
+}
+
+parse_result_t parse(tokenlist_entry_t *current) {
+    return parse_many(current, NODE_PROGRAM, true, parse_statement);
+}
@@ -0,0 +1,11 @@
+#ifndef INCLUDE_SRC_PARSER_H_
+#define INCLUDE_SRC_PARSER_H_
+
+#include "ast.h"
+#include "error.h"
+#include "parser_util.h"
+#include "tokenlist.h"
+
+parse_result_t parse(tokenlist_entry_t *current);
+
+#endif // INCLUDE_SRC_PARSER_H_
@@ -1,140 +0,0 @@
-#include "parser.h"
-#include "../ast.h"
-#include "../lexer.h"
-#include "../tokenlist.h"
-#include "combinators.h"
-#include "primitives.h"
-#include "util.h"
-
-parse_result_t parse_number(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_octal, parse_decimal, parse_hexadecimal,
-                          parse_binary, nullptr};
-    parse_result_t result = parse_any(current, parsers);
-    return parse_result_wrap(NODE_NUMBER, result);
-}
-
-parse_result_t parse_plus_or_minus(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_plus, parse_minus, nullptr};
-    return parse_any(current, parsers);
-}
-
-parse_result_t parse_register_index(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_plus, parse_register, parse_asterisk,
-                          parse_number, nullptr};
-    return parse_consecutive(current, NODE_REGISTER_INDEX, parsers);
-}
-
-parse_result_t parse_register_offset(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_plus_or_minus, parse_number, nullptr};
-    return parse_consecutive(current, NODE_REGISTER_OFFSET, parsers);
-}
-
-parse_result_t parse_register_expression(tokenlist_entry_t *current) {
-    parse_result_t result;
-
-    ast_node_t *expr;
-    error_t *err = ast_node_alloc(&expr);
-    if (err)
-        return parse_error(err);
-    expr->id = NODE_REGISTER_EXPRESSION;
-
-    // <register>
-    result = parse_register(current);
-    if (result.err) {
-        ast_node_free(expr);
-        return result;
-    }
-    err = ast_node_add_child(expr, result.node);
-    if (err) {
-        ast_node_free(result.node);
-        ast_node_free(expr);
-        return parse_error(err);
-    }
-    current = result.next;
-
-    // <register_index>?
-    result = parse_register_index(current);
-    if (result.err) {
-        error_free(result.err);
-    } else {
-        err = ast_node_add_child(expr, result.node);
-        if (err) {
-            ast_node_free(result.node);
-            ast_node_free(expr);
-            return parse_error(err);
-        }
-        current = result.next;
-    }
-
-    // <register_offset>?
-    result = parse_register_offset(current);
-    if (result.err) {
-        error_free(result.err);
-    } else {
-        err = ast_node_add_child(expr, result.node);
-        if (err) {
-            ast_node_free(result.node);
-            ast_node_free(expr);
-            return parse_error(err);
-        }
-        current = result.next;
-    }
-    return parse_success(expr, current);
-}
-
-parse_result_t parse_immediate(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_number, parse_identifier, nullptr};
-    parse_result_t result = parse_any(current, parsers);
-    return parse_result_wrap(NODE_IMMEDIATE, result);
-}
-
-parse_result_t parse_memory_expression(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_register_expression, parse_identifier, nullptr};
-    return parse_any(current, parsers);
-}
-
-parse_result_t parse_memory(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_lbracket, parse_memory_expression,
-                          parse_rbracket, nullptr};
-    return parse_consecutive(current, NODE_MEMORY, parsers);
-}
-
-parse_result_t parse_operand(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_register, parse_memory, parse_immediate,
-                          nullptr};
-    return parse_any(current, parsers);
-}
-
-parse_result_t parse_operands(tokenlist_entry_t *current) {
-    return parse_list(current, NODE_OPERANDS, true, TOKEN_COMMA, parse_operand);
-}
-
-parse_result_t parse_label(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_identifier, parse_colon, nullptr};
-    return parse_consecutive(current, NODE_LABEL, parsers);
-}
-
-parse_result_t parse_section_directive(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_section, parse_identifier, nullptr};
-    return parse_consecutive(current, NODE_SECTION_DIRECTIVE, parsers);
-}
-
-parse_result_t parse_directive(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_dot, parse_section_directive, nullptr};
-    return parse_consecutive(current, NODE_DIRECTIVE, parsers);
-}
-
-parse_result_t parse_instruction(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_identifier, parse_operands, nullptr};
-    return parse_consecutive(current, NODE_INSTRUCTION, parsers);
-}
-
-parse_result_t parse_statement(tokenlist_entry_t *current) {
-    parser_t parsers[] = {parse_label, parse_directive, parse_instruction,
-                          nullptr};
-    return parse_any(current, parsers);
-}
-
-parse_result_t parse(tokenlist_entry_t *current) {
-    return parse_many(current, NODE_PROGRAM, true, parse_statement);
-}
@@ -1,9 +0,0 @@
-#ifndef INCLUDE_PARSER_PARSER_H_
-#define INCLUDE_PARSER_PARSER_H_
-
-#include "../tokenlist.h"
-#include "util.h"
-
-parse_result_t parse(tokenlist_entry_t *current);
-
-#endif // INCLUDE_PARSER_PARSER_H_
@@ -1,4 +1,4 @@
-#include "combinators.h"
+#include "parser_combinators.h"

 // Parse a list of the given parser delimited by the given token id. Does not
 // store the delimiters in the parent node
@@ -50,8 +50,7 @@ parse_result_t parse_list(tokenlist_entry_t *current, node_id_t id,
 }

 parse_result_t parse_any(tokenlist_entry_t *current, parser_t parsers[]) {
-    parser_t parser;
-    while ((parser = *parsers++)) {
+    for (parser_t parser = *parsers; parser; parser = *parsers++) {
        parse_result_t result = parser(current);
        if (result.err == nullptr)
            return result;
@@ -107,8 +106,7 @@ parse_result_t parse_consecutive(tokenlist_entry_t *current, node_id_t id,

    all->id = id;

-    parser_t parser;
-    while ((parser = *parsers++) && current) {
+    for (parser_t parser = *parsers; parser && current; parser = *parsers++) {
        result = parser(current);
        if (result.err) {
            ast_node_free(all);
@@ -1,7 +1,4 @@
-#ifndef INCLUDE_PARSER_COMBINATORS_H_
-#define INCLUDE_PARSER_COMBINATORS_H_
-
-#include "util.h"
+#include "parser_util.h"

 typedef parse_result_t (*parser_t)(tokenlist_entry_t *);

@@ -21,5 +18,3 @@ parse_result_t parse_list(tokenlist_entry_t *current, node_id_t id,
 // wraps the parsed nodes in a new parent node.
 parse_result_t parse_consecutive(tokenlist_entry_t *current, node_id_t id,
                                 parser_t parsers[]);
-
-#endif // INCLUDE_PARSER_COMBINATORS_H_
@@ -1,5 +1,5 @@
-#include "primitives.h"
-#include "../ast.h"
+#include "parser_primitives.h"
+#include "ast.h"
 #include <string.h>

 parse_result_t parse_identifier(tokenlist_entry_t *current) {
@@ -62,25 +62,9 @@ parse_result_t parse_dot(tokenlist_entry_t *current) {
    return parse_token(current, TOKEN_DOT, NODE_DOT, nullptr);
 }

-parse_result_t parse_label_reference(tokenlist_entry_t *current) {
-    return parse_token(current, TOKEN_IDENTIFIER, NODE_LABEL_REFERENCE,
-                       nullptr);
-}
-
-const char *registers[] = {
-    // 64-bit registers
-    "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10",
-    "r11", "r12", "r13", "r14", "r15",
-    // 32-bit registers
-    "eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d",
-    "r10d", "r11d", "r12d", "r13d", "r14d", "r15d",
-    // 16-bit registers
-    "ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w",
-    "r11w", "r12w", "r13w", "r14w", "r15w",
-    // 8-bit low registers
-    "al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b",
-    "r11b", "r12b", "r13b", "r14b", "r15b", nullptr};
-
+const char *registers[] = {"rax", "rcx", "rdx", "rbx", "rsp",  "rbp",
+                           "rsi", "rdi", "r8",  "r9",  "r10",  "r11",
+                           "r12", "r13", "r14", "r15", nullptr};
 bool is_register_token(lexer_token_t *token) {
    for (size_t i = 0; registers[i] != nullptr; ++i)
        if (strcmp(token->value, registers[i]) == 0)
@@ -97,7 +81,4 @@ bool is_section_token(lexer_token_t *token) {
    return strcmp(token->value, "section") == 0;
 }

-parse_result_t parse_section(tokenlist_entry_t *current) {
-    return parse_token(current, TOKEN_IDENTIFIER, NODE_SECTION,
-                       is_section_token);
-}
+parse_result_t parse_section(tokenlist_entry_t *current) {}
@@ -1,7 +1,7 @@
-#ifndef INCLUDE_PARSER_PRIMITIVES_H_
-#define INCLUDE_PARSER_PRIMITIVES_H_
+#ifndef INCLUDE_SRC_PARSER_PRIMITIVES_H_
+#define INCLUDE_SRC_PARSER_PRIMITIVES_H_

-#include "util.h"
+#include "parser_util.h"

 parse_result_t parse_identifier(tokenlist_entry_t *current);
 parse_result_t parse_decimal(tokenlist_entry_t *current);
@@ -18,7 +18,6 @@ parse_result_t parse_plus(tokenlist_entry_t *current);
 parse_result_t parse_minus(tokenlist_entry_t *current);
 parse_result_t parse_asterisk(tokenlist_entry_t *current);
 parse_result_t parse_dot(tokenlist_entry_t *current);
-parse_result_t parse_label_reference(tokenlist_entry_t *current);

 /* These are "primitives" with a different name and some extra validation on top
 * for example, register is just an identifier but it only matches a limited set
@@ -27,4 +26,4 @@ parse_result_t parse_label_reference(tokenlist_entry_t *current);
 parse_result_t parse_register(tokenlist_entry_t *current);
 parse_result_t parse_section(tokenlist_entry_t *current);

-#endif // INCLUDE_PARSER_PRIMITIVES_H_
+#endif // INCLUDE_SRC_PARSER_PRIMITIVES_H_
@@ -1,5 +1,5 @@
-#include "util.h"
-#include "../tokenlist.h"
+#include "parser_util.h"
+#include "tokenlist.h"

 error_t *err_parse_no_match =
    &(error_t){.message = "parsing failed to find the correct token sequence"};
@@ -33,24 +33,3 @@ parse_result_t parse_token(tokenlist_entry_t *current,

    return parse_success(node, current->next);
 }
-
-parse_result_t parse_result_wrap(node_id_t id, parse_result_t result) {
-    if (result.err)
-        return result;
-
-    ast_node_t *node;
-    error_t *err = ast_node_alloc(&node);
-    if (err) {
-        ast_node_free(result.node);
-        return parse_error(err);
-    }
-    node->id = id;
-
-    err = ast_node_add_child(node, result.node);
-    if (err) {
-        ast_node_free(result.node);
-        return parse_error(err);
-    }
-
-    return parse_success(node, result.next);
-}
@@ -1,9 +1,9 @@
-#ifndef INCLUDE_PARSER_UTIL_H_
-#define INCLUDE_PARSER_UTIL_H_
+#ifndef INCLUDE_SRC_PARSER_UTIL_H_
+#define INCLUDE_SRC_PARSER_UTIL_H_

-#include "../ast.h"
-#include "../error.h"
-#include "../tokenlist.h"
+#include "ast.h"
+#include "error.h"
+#include "tokenlist.h"

 typedef struct parse_result {
    error_t *err;
@@ -19,8 +19,9 @@ parse_result_t parse_success(ast_node_t *ast, tokenlist_entry_t *next);
 parse_result_t parse_token(tokenlist_entry_t *current,
                           lexer_token_id_t token_id, node_id_t ast_id,
                           token_validator_t is_valid);
-parse_result_t parse_result_wrap(node_id_t id, parse_result_t result);
+
+tokenlist_entry_t *skip_insignificant(tokenlist_entry_t *);

 extern error_t *err_parse_no_match;

-#endif // INCLUDE_PARSER_UTIL_H_
+#endif // INCLUDE_SRC_PARSER_UTIL_H_
@@ -1,17 +1,5 @@
-.section text
-
-; Small valid code snippet that should contain all different AST nodes
-
 _start:
-    mov eax, ebx
-    lea eax, [eax + ebx * 4 + 8]
-    lea eax, [eax + 8]
-    lea eax, [eax + ebx * 8]
-    lea eax, [esp - 24]
-    lea eax, [eax + ebx * 4 - 8]
-    lea eax, [_start]
-    mov eax, _start
-    mov eax, 555
+    mov eax, 555            ; move 555 into eax
    push 0o777
    xor eax, 0xDEADBEEF
    and ecx, 0o770
Author	SHA1	Message	Date
omicron	71f1b0aa64	Add more grammar rules to the parser Validate the build / validate-build (push) Successful in 26s Details	2025-04-01 23:43:05 +02:00
omicron	c3fcb917fc	Add a parser combinator to parse a delimited list	2025-04-01 23:39:48 +02:00
omicron	333991e05e	make parse_success always skip past trivia in the tokenlist	2025-04-01 23:39:01 +02:00
omicron	a1b4cc21f4	TODO: REVIEW ME AND WRITE PROPER MESSAGE Fix lexer issue where consuming n tokens always fails if there are n tokens and always succeeds if they aren't n tokens	2025-04-01 23:36:08 +02:00
omicron	80957326bc	fix operands list grammar rule	2025-04-01 23:22:29 +02:00
omicron	da51d66bb2	Match ast nodes to new grammar	2025-04-01 22:09:36 +02:00
omicron	42445338a4	Update grammar to match implementation	2025-04-01 22:01:33 +02:00
omicron	03fc44f339	Use new validator function for parse_token calls on all primitives Also adds new validated primitives for NODE_SECTION and NODE_REGISTER	2025-04-01 21:54:27 +02:00
omicron	eec02d6237	Fix incorrect error returned in parse_consecutive	2025-04-01 21:53:19 +02:00
omicron	39a4b2b0a7	Fix memory leak in ast. If a node has children the array of children was never freed.	2025-04-01 21:51:48 +02:00
omicron	048b8fcf9d	Extend parse_token to accept an optional validator function	2025-04-01 21:10:19 +02:00
omicron	1b21364939	Expose err_parse_no_match in parser_util.h	2025-04-01 20:57:34 +02:00
omicron	41114d7f9c	Add basic parser combinators	2025-04-01 20:05:35 +02:00
omicron	dfc89a7493	Add "primitive" parsers for all the semantic tokens in the lexer grammar	2025-04-01 20:03:53 +02:00
omicron	43a62095bf	Add basic parser utilities	2025-04-01 20:03:28 +02:00
omicron	ff7d33bf2a	Add functions to skip over trivia in a tokenlist	2025-04-01 19:55:00 +02:00
omicron	208f30ac48	Expand AST node ids to support the lexer tokens and grammar rules	2025-04-01 19:26:54 +02:00
omicron	988b54aee3	Adjust grammar so that it never depends on newline tokens	2025-04-01 19:26:27 +02:00
omicron	ed1491db33	Fix parse_token to add the correct information to a parse node	2025-04-01 17:20:50 +02:00
omicron	0bf4ba3a1b	Fix ast nodes now containing token entry instead of token	2025-04-01 17:20:32 +02:00
omicron	e632764bf2	Partial parser implementation	2025-04-01 17:16:21 +02:00
omicron	a298e99895	Add invalid ast node id	2025-04-01 15:06:42 +02:00
omicron	126905a092	FIXME REORDER COMMIT -- Change main so it can parse the ast FIXME THIS COMMIT NEEDS TO BE REORDERED FIXME THIS COMMIT NEEDS TO BE REORDERED FIXME THIS COMMIT NEEDS TO BE REORDERED FIXME THIS COMMIT NEEDS TO BE REORDERED	2025-04-01 15:06:20 +02:00
omicron	0f6efa8050	Add basic AST functionality Validate the build / validate-build (push) Successful in 24s Details	2025-03-31 18:43:50 +02:00
omicron	36af377ba0	Add a parser grammar Currently this is a subset of the grammar, enough to get reasonable work going.	2025-03-31 18:43:34 +02:00