1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
|
/* Copyright (C) 2023 Aryadev Chavali
* You may distribute and modify this code under the terms of the
* GPLv2 license. You should have received a copy of the GPLv2
* license with this file. If not, please write to:
* aryadev@aryadevchavali.com.
* Created: 2023-10-23
* Author: Aryadev Chavali
* Description: Assembly source code compiler, targeting OVM
*/
#include <lib/darr.h>
#include "./lexer.h"
#include "./parser.h"
/* Print the command-line synopsis of the assembler to `fp`.
 *
 * program_name: name to show as the invoked executable (callers pass argv[0]).
 * fp:           stream that receives the message.
 */
void usage(const char *program_name, FILE *fp)
{
  /* Only the first line needs formatting; the argument descriptions are
   * fixed text and are emitted verbatim. */
  fprintf(fp, "Usage: %s FILE OUT-FILE\n", program_name);
  fputs("\tFILE: Source code to compile\n", fp);
  fputs("\tOUT-FILE: Name of file to store bytecode\n", fp);
}
/* Entry point of the assembler.
 *
 * Reads the source file named by argv[1], tokenises it, parses the token
 * stream into a program and writes that program to the file named by argv[2].
 *
 * Returns:
 *   0                   on success,
 *   1                   on a usage error or when a file cannot be opened or
 *                       closed,
 *   255 - <error code>  when tokenising or parsing reports an error.
 */
int main(int argc, char *argv[])
{
  int ret = 0;

  /* Everything released at `end` is initialised up front.  A `goto end` must
   * never jump over one of these initialisers, otherwise the cleanup code
   * would inspect (and free) an indeterminate pointer. */
  darr_t buffer         = {0};
  token_stream_t tokens = {0};
  prog_t *program       = NULL;

  if (argc < 3)
  {
    usage(argv[0], stderr);
    return 1;
  }

  const char *source_file = argv[1];
  const char *out_file    = argv[2];

#if VERBOSE >= 1
  printf("[%sASSEMBLER%s]: Assembling `%s` to `%s`\n", TERM_YELLOW, TERM_RESET,
         source_file, out_file);
#endif

  FILE *fp = fopen(source_file, "rb");
  if (!fp)
  {
    /* Report the reason (missing file, permissions, ...) rather than handing
     * a NULL stream to the reader. */
    perror(source_file);
    ret = 1;
    goto end;
  }
  buffer = darr_read_file(fp);
  fclose(fp);

  lerr_t lex_error = tokenise_buffer(&buffer, &tokens);
  if (lex_error)
  {
    // Compute the line/column by hand by walking the first buffer.used bytes
    size_t column = 0, line = 1;
    for (size_t i = 0; i < buffer.used; ++i)
    {
      if (buffer.data[i] == '\n')
      {
        column = 0;
        ++line;
      }
      else
        ++column;
    }
    fprintf(stderr, "%s:%zu:%zu: %s\n", source_file, line, column,
            lerr_as_cstr(lex_error));
    ret = 255 - lex_error;
    goto end;
  }

#if VERBOSE >= 1
  printf("\t[%sTOKENISER%s]: %lu bytes -> %lu tokens\n", TERM_GREEN, TERM_RESET,
         buffer.used, tokens.available);
#endif
#if VERBOSE >= 2
  printf("\t[%sTOKENISER%s]: Tokens parsed:\n", TERM_GREEN, TERM_RESET);
  for (size_t i = 0; i < tokens.available; ++i)
  {
    token_t token = TOKEN_STREAM_AT(tokens.data, i);
    printf("\t[%zu]: %s(`%s`)@%lu,%lu\n", i, token_type_as_cstr(token.type),
           token.str, token.line, token.column);
  }
#endif

  /* The raw source bytes are not used past this point; release them early and
   * clear the pointer so the cleanup at `end` does not free them twice. */
  free(buffer.data);
  buffer.data = NULL;

#if VERBOSE >= 2
  printf("\t[%sPARSER%s]: Beginning parse...\n", TERM_YELLOW, TERM_RESET);
#endif

  perr_t parse_error = parse_stream(&tokens, &program);
  if (parse_error)
  {
    /* Use the position of the token at index tokens.used when it is in
     * range; otherwise fall back to 0:0. */
    size_t column = 0;
    size_t line   = 0;
    if (tokens.used < tokens.available)
    {
      token_t t = TOKEN_STREAM_AT(tokens.data, tokens.used);
      column    = t.column;
      line      = t.line;
    }
    fprintf(stderr, "%s:%zu:%zu: %s\n", source_file, line, column,
            perr_as_cstr(parse_error));
    ret = 255 - parse_error;
    goto end;
  }

#if VERBOSE >= 1
  printf("\t[%sPARSER%s]: %lu tokens -> %lu instructions\n", TERM_GREEN,
         TERM_RESET, tokens.available, program->count);
#endif
#if VERBOSE >= 2
  printf("\t[%sPARSER%s]: Instructions parsed:\n", TERM_GREEN, TERM_RESET);
  for (size_t i = 0; i < program->count; ++i)
  {
    printf("\t[%zu]: ", i);
    inst_print(program->instructions[i], stdout);
    printf("\n");
  }
#endif

  fp = fopen(out_file, "wb");
  if (!fp)
  {
    perror(out_file);
    ret = 1;
    goto end;
  }
  prog_write_file(program, fp);
  /* fclose flushes buffered output, so a failure here means the bytecode may
   * not have reached the file. */
  if (fclose(fp) != 0)
  {
    perror(out_file);
    ret = 1;
    goto end;
  }

#if VERBOSE >= 1
  printf("[%sASSEMBLER%s]: Wrote bytecode to `%s`\n", TERM_GREEN, TERM_RESET,
         out_file);
#endif

end:
  /* free(NULL) is a no-op, so plain pointers need no guard. */
  free(buffer.data);
  if (tokens.data)
  {
    /* Each token's string is freed before the stream storage itself. */
    for (size_t i = 0; i < tokens.available; ++i)
      free(TOKEN_STREAM_AT(tokens.data, i).str);
    free(tokens.data);
  }
  free(program);
  return ret;
}
|