1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
|
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include "types.h"
#include "lexer.h"
#include "parser.h"
#include "runtime.h"
// Report the lookahead token without consuming it.
// A NULL parser yields PIT_LEX_TOKEN_ERROR.
static pit_lex_token peek(pit_parser *st) {
    return st ? st->next.token : PIT_LEX_TOKEN_ERROR;
}
// Consume one token: the lookahead becomes the current token and a fresh
// lookahead is pulled from the lexer.
// Returns the token that just became current, or PIT_LEX_TOKEN_ERROR when
// the parser pointer is NULL.
static pit_lex_token advance(pit_parser *st) {
    if (st) {
        // shift lookahead into the current slot
        st->cur = st->next;
        // refill the lookahead; the lexer's start/end are read after
        // pit_lex_next so they describe the token it just produced
        st->next.token = pit_lex_next(st->lexer);
        st->next.start = st->lexer->start;
        st->next.end = st->lexer->end;
        return st->cur.token;
    }
    return PIT_LEX_TOKEN_ERROR;
}
// Consume the lookahead token only if it equals `t`.
// Returns true when a token was consumed, false when the lookahead differs
// (in which case the parser state is left untouched).
static bool match(pit_parser *st, pit_lex_token t) {
    if (peek(st) != t) {
        return false;
    }
    advance(st);
    return true;
}
// Copy the text of the current token into `buf` as a NUL-terminated string.
//
//   st  - parser whose current token (st->cur.start .. st->cur.end, offsets
//         into st->lexer->input) is copied
//   buf - destination buffer
//   len - capacity of `buf` in bytes, including room for the terminator
//
// Text that does not fit is silently truncated to len - 1 bytes.
// Does nothing when `buf` is NULL or `len` is not positive; a negative
// token span is treated as an empty token. Both guards keep a negative
// length from being converted to a huge size_t in memcpy.
static void get_token_string(pit_parser *st, char *buf, i64 len) {
    if (!buf || len <= 0) {
        return;
    }
    i64 diff = st->cur.end - st->cur.start;
    if (diff < 0) {
        diff = 0;
    }
    // leave one byte for the terminator
    i64 tlen = diff >= len ? len - 1 : diff;
    memcpy(buf, st->lexer->input + st->cur.start, (size_t)tlen);
    buf[tlen] = 0;
}
// Create a parser that reads tokens from `lex`.
//
// The parser is allocated with malloc and primed by one advance() call, so
// the first token from the lexer is already sitting in the lookahead slot
// when this returns. The lexer is referenced, not copied.
//
// Returns NULL if `lex` is NULL or the allocation fails.
pit_parser *pit_parser_from_lexer(pit_lexer *lex) {
    if (!lex) {
        return NULL; // advance() would dereference the lexer
    }
    pit_parser *ret = malloc(sizeof(*ret));
    if (!ret) {
        return NULL;
    }
    ret->lexer = lex;
    ret->cur.token = ret->next.token = PIT_LEX_TOKEN_ERROR;
    ret->cur.start = ret->next.start = 0;
    ret->cur.end = ret->next.end = 0;
    // prime the lookahead with the first real token
    advance(ret);
    return ret;
}
// Parse a single expression from the parser's token stream.
//
// Consumes one token with advance() and dispatches on it:
//   - LPAREN:  parses sub-expressions recursively until the matching RPAREN
//              and chains them with pit_cons onto PIT_NIL, in source order
//   - QUOTE:   parses the following expression and wraps it with pit_list as
//              a two-element list headed by the interned symbol "quote"
//   - INTEGER_LITERAL / STRING_LITERAL / SYMBOL: built from the token text
//   - ERROR, EOF, anything else: reported through pit_error
//
// Returns the parsed value, or PIT_NIL after reporting an error.
// NOTE(review): token text goes through a 256-byte buffer, and
// get_token_string truncates to fit, so longer literals and symbols are
// silently cut short.
pit_value pit_parse(pit_runtime *rt, pit_parser *st) {
    char buf[256] = {0};
    pit_lex_token t = advance(st);
    // NOTE(review): looks like leftover debug tracing; kept so that program
    // output is unchanged - confirm whether it can be removed.
    printf("token: %s\n", pit_lex_token_name(t));
    switch (t) {
    case PIT_LEX_TOKEN_ERROR:
        pit_error(rt, "encountered an error token while parsing");
        return PIT_NIL;
    case PIT_LEX_TOKEN_EOF:
        pit_error(rt, "end-of-file while parsing");
        return PIT_NIL;
    case PIT_LEX_TOKEN_LPAREN: {
        // Elements are collected in a temporary growable array, then consed
        // back-to-front so the resulting list keeps source order.
        i64 count = 0;
        i64 args_cap = 32;
        pit_value *args = calloc(args_cap, sizeof(*args));
        if (!args) {
            pit_error(rt, "out of memory while parsing list");
            return PIT_NIL;
        }
        while (!match(st, PIT_LEX_TOKEN_RPAREN)) {
            args[count++] = pit_parse(rt, st);
            if (rt->error != PIT_NIL) {
                // if we hit an error, stop! (and release the scratch array)
                free(args);
                return PIT_NIL;
            }
            if (count >= args_cap) {
                i64 new_cap = args_cap * 2;
                // keep the old pointer until realloc is known to have succeeded
                pit_value *grown = realloc(args, new_cap * sizeof(*args));
                if (!grown) {
                    free(args);
                    pit_error(rt, "out of memory while parsing list");
                    return PIT_NIL;
                }
                args = grown;
                args_cap = new_cap;
            }
        }
        pit_value ret = PIT_NIL;
        for (i64 i = count - 1; i >= 0; --i) {
            ret = pit_cons(rt, args[i], ret);
        }
        free(args);
        return ret;
    }
    case PIT_LEX_TOKEN_QUOTE: {
        // Evaluate in separate statements: both calls take the runtime, and
        // the order of evaluation of function arguments is unspecified in C.
        pit_value quote_sym = pit_intern_cstr(rt, "quote");
        pit_value quoted = pit_parse(rt, st);
        return pit_list(rt, 2, quote_sym, quoted);
    }
    case PIT_LEX_TOKEN_INTEGER_LITERAL:
        get_token_string(st, buf, sizeof(buf));
        // strtoll saturates on out-of-range input, where atoi is undefined
        return pit_integer_new(rt, strtoll(buf, NULL, 10));
    case PIT_LEX_TOKEN_STRING_LITERAL: {
        get_token_string(st, buf, sizeof(buf));
        i64 len = (i64)strlen(buf);
        i64 out = 0;
        // Unescape in place. Index 0 is skipped (the opening quote); the
        // character after a backslash is copied verbatim; an unescaped
        // double quote ends the string.
        for (i64 i = 1; i < len; ++i) {
            if (buf[i] == '\\' && i + 1 < len) {
                buf[out++] = buf[++i];
            } else if (buf[i] != '"') {
                buf[out++] = buf[i];
            } else {
                break;
            }
        }
        return pit_bytes_new(rt, (u8 *) buf, out);
    }
    case PIT_LEX_TOKEN_SYMBOL:
        get_token_string(st, buf, sizeof(buf));
        return pit_intern_cstr(rt, buf);
    default:
        pit_error(rt, "unexpected token: %s", pit_lex_token_name(t));
        return PIT_NIL;
    }
}
|