Compare commits
	
		
			10 Commits
		
	
	
		
			object_for
			...
			d40273b329
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| d40273b329 | |||
| 000756fca9 | |||
| dabd3fd86f | |||
| ccf8f52b6e | |||
| 35c471f8d4 | |||
| 44fab4c678 | |||
| bcc1569b39 | |||
| 5746ef1c5a | |||
| 2cab530eed | |||
| 7ac4eac37f | 
| @@ -1,55 +0,0 @@ | ||||
| # Linker file format | ||||
|  | ||||
| ```C | ||||
|  | ||||
| struct object_file { | ||||
|     uint64_t    magic;   // ".oo-bin" | ||||
|     uint64_t    version; // 1 | ||||
|     uint64_t    architecture; // AMD64(0) | ||||
|     uint64_t    offsets_offset; | ||||
|  | ||||
|     struct offsets { | ||||
|         uint64_t strings; | ||||
|         uint64_t sections; | ||||
|         uint64_t symbols; | ||||
|         uint64_t relocations; | ||||
|     } offsets; | ||||
|  | ||||
|     struct string_table { | ||||
|         uint64_t size; | ||||
|         uint8_t data[static size]; | ||||
|     } strings; | ||||
|  | ||||
|     struct section_table { | ||||
|         uint32_t count; | ||||
|         struct section_entry { | ||||
|             uint32_t name; | ||||
|             uint64_t offset; | ||||
|             uint64_t size_on_disk; | ||||
|             uint64_t size_in_memory; | ||||
|             uint64_t flags; | ||||
|         } sections[static count]; | ||||
|     } sections; | ||||
|  | ||||
|     struct symbol_table { | ||||
|         uint32_t count; | ||||
|         struct symbol_entry { | ||||
|             uint32_t name; | ||||
|             uint8_t  kind;  // IMPORT(0) | EXPORT(1) | LOCAL(2) | ||||
|             uint32_t section; | ||||
|             uint64_t offset; | ||||
|         } symbols[static count]; | ||||
|     } symbols; | ||||
|  | ||||
|     struct relocation_table { | ||||
|         uint32_t count; | ||||
|         struct relocation_entry { | ||||
|             uint32_t section; | ||||
|             uint64_t offset; | ||||
|             uint8_t  size; | ||||
|             uint32_t symbol; | ||||
|             uint8_t  kind;  // ABSOLUTE(0) | RELATIVE(1) | ||||
|         } relocations[static count]; | ||||
|     } relocations; | ||||
| }; | ||||
| ``` | ||||
| @@ -9,8 +9,7 @@ | ||||
| parse_result_t parse_number(tokenlist_entry_t *current) { | ||||
|     parser_t parsers[] = {parse_octal, parse_decimal, parse_hexadecimal, | ||||
|                           parse_binary, nullptr}; | ||||
|     parse_result_t result = parse_any(current, parsers); | ||||
|     return parse_result_wrap(NODE_NUMBER, result); | ||||
|     return parse_any(current, parsers); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_plus_or_minus(tokenlist_entry_t *current) { | ||||
| @@ -21,12 +20,12 @@ parse_result_t parse_plus_or_minus(tokenlist_entry_t *current) { | ||||
| parse_result_t parse_register_index(tokenlist_entry_t *current) { | ||||
|     parser_t parsers[] = {parse_plus, parse_register, parse_asterisk, | ||||
|                           parse_number, nullptr}; | ||||
|     return parse_consecutive(current, NODE_REGISTER_INDEX, parsers); | ||||
|     return parse_consecutive(current, NODE_LABEL, parsers); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_register_offset(tokenlist_entry_t *current) { | ||||
|     parser_t parsers[] = {parse_plus_or_minus, parse_number, nullptr}; | ||||
|     return parse_consecutive(current, NODE_REGISTER_OFFSET, parsers); | ||||
|     return parse_consecutive(current, NODE_LABEL, parsers); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_register_expression(tokenlist_entry_t *current) { | ||||
| @@ -36,7 +35,6 @@ parse_result_t parse_register_expression(tokenlist_entry_t *current) { | ||||
|     error_t *err = ast_node_alloc(&expr); | ||||
|     if (err) | ||||
|         return parse_error(err); | ||||
|     expr->id = NODE_REGISTER_EXPRESSION; | ||||
|  | ||||
|     // <register> | ||||
|     result = parse_register(current); | ||||
| @@ -84,8 +82,7 @@ parse_result_t parse_register_expression(tokenlist_entry_t *current) { | ||||
|  | ||||
| parse_result_t parse_immediate(tokenlist_entry_t *current) { | ||||
|     parser_t parsers[] = {parse_number, parse_identifier, nullptr}; | ||||
|     parse_result_t result = parse_any(current, parsers); | ||||
|     return parse_result_wrap(NODE_IMMEDIATE, result); | ||||
|     return parse_any(current, parsers); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_memory_expression(tokenlist_entry_t *current) { | ||||
| @@ -96,7 +93,7 @@ parse_result_t parse_memory_expression(tokenlist_entry_t *current) { | ||||
| parse_result_t parse_memory(tokenlist_entry_t *current) { | ||||
|     parser_t parsers[] = {parse_lbracket, parse_memory_expression, | ||||
|                           parse_rbracket, nullptr}; | ||||
|     return parse_consecutive(current, NODE_MEMORY, parsers); | ||||
|     return parse_consecutive(current, NODE_LABEL, parsers); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_operand(tokenlist_entry_t *current) { | ||||
|   | ||||
| @@ -62,11 +62,6 @@ parse_result_t parse_dot(tokenlist_entry_t *current) { | ||||
|     return parse_token(current, TOKEN_DOT, NODE_DOT, nullptr); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_label_reference(tokenlist_entry_t *current) { | ||||
|     return parse_token(current, TOKEN_IDENTIFIER, NODE_LABEL_REFERENCE, | ||||
|                        nullptr); | ||||
| } | ||||
|  | ||||
| const char *registers[] = { | ||||
|     // 64-bit registers | ||||
|     "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", | ||||
| @@ -80,7 +75,6 @@ const char *registers[] = { | ||||
|     // 8-bit low registers | ||||
|     "al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", | ||||
|     "r11b", "r12b", "r13b", "r14b", "r15b", nullptr}; | ||||
|  | ||||
| bool is_register_token(lexer_token_t *token) { | ||||
|     for (size_t i = 0; registers[i] != nullptr; ++i) | ||||
|         if (strcmp(token->value, registers[i]) == 0) | ||||
|   | ||||
| @@ -18,7 +18,6 @@ parse_result_t parse_plus(tokenlist_entry_t *current); | ||||
| parse_result_t parse_minus(tokenlist_entry_t *current); | ||||
| parse_result_t parse_asterisk(tokenlist_entry_t *current); | ||||
| parse_result_t parse_dot(tokenlist_entry_t *current); | ||||
| parse_result_t parse_label_reference(tokenlist_entry_t *current); | ||||
|  | ||||
| /* These are "primitives" with a different name and some extra validation on top | ||||
|  * for example, register is just an identifier but it only matches a limited set | ||||
|   | ||||
| @@ -33,24 +33,3 @@ parse_result_t parse_token(tokenlist_entry_t *current, | ||||
|  | ||||
|     return parse_success(node, current->next); | ||||
| } | ||||
|  | ||||
| parse_result_t parse_result_wrap(node_id_t id, parse_result_t result) { | ||||
|     if (result.err) | ||||
|         return result; | ||||
|  | ||||
|     ast_node_t *node; | ||||
|     error_t *err = ast_node_alloc(&node); | ||||
|     if (err) { | ||||
|         ast_node_free(result.node); | ||||
|         return parse_error(err); | ||||
|     } | ||||
|     node->id = id; | ||||
|  | ||||
|     err = ast_node_add_child(node, result.node); | ||||
|     if (err) { | ||||
|         ast_node_free(result.node); | ||||
|         return parse_error(err); | ||||
|     } | ||||
|  | ||||
|     return parse_success(node, result.next); | ||||
| } | ||||
|   | ||||
| @@ -19,7 +19,8 @@ parse_result_t parse_success(ast_node_t *ast, tokenlist_entry_t *next); | ||||
| parse_result_t parse_token(tokenlist_entry_t *current, | ||||
|                            lexer_token_id_t token_id, node_id_t ast_id, | ||||
|                            token_validator_t is_valid); | ||||
| parse_result_t parse_result_wrap(node_id_t id, parse_result_t result); | ||||
|  | ||||
| tokenlist_entry_t *skip_insignificant(tokenlist_entry_t *); | ||||
|  | ||||
| extern error_t *err_parse_no_match; | ||||
|  | ||||
|   | ||||
| @@ -1,17 +1,8 @@ | ||||
| .section text | ||||
|  | ||||
| ; Small valid code snippet that should contain all different AST nodes | ||||
|  | ||||
| _start: | ||||
|     mov eax, ebx | ||||
|     lea eax, [eax + ebx * 4 + 8] | ||||
|     lea eax, [eax + 8] | ||||
|     lea eax, [eax + ebx * 8] | ||||
|     lea eax, [esp - 24] | ||||
|     lea eax, [eax + ebx * 4 - 8] | ||||
|     lea eax, [_start] | ||||
|     mov eax, _start | ||||
|     mov eax, 555 | ||||
|     mov eax, 555            ; move 555 into eax | ||||
|     push 0o777 | ||||
|     xor eax, 0xDEADBEEF | ||||
|     and ecx, 0o770 | ||||
|   | ||||
		Reference in New Issue
	
	Block a user