forked from kanaka/mal
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreader.m
122 lines (114 loc) · 4.16 KB
/
reader.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
% this is just being used as a namespace
classdef reader
    % READER  Static-only parser that turns source text into an AST.
    %
    % The class holds no state; it only groups the parsing functions.
    % Entry point is reader.read_str(str). Tokens are pulled from a
    % Reader object (defined elsewhere) through rdr.peek() / rdr.next().
    % NOTE(review): Reader is assumed to return a non-char sentinel
    % (logical false) once the tokens are exhausted - confirm against
    % the Reader class.

    methods (Static = true)
        function tokens = tokenize(str)
            % Split STR into a 1xN cell array of token strings.
            % Whitespace and commas between tokens are discarded, and so
            % are comment tokens (those starting with ';') and empty
            % tokens (produced by trailing whitespace/commas).
            %
            % The closing quote of a string is optional in the pattern so
            % that an unterminated string arrives in read_atom as a single
            % token and can be reported, instead of being silently split.
            re = '[\s,]*(~@|[\[\]{}()''`~^@]|"(?:\\.|[^\\"])*"?|;[^\n]*|[^\s\[\]{}(''"`,;)]*)';
            matches = regexp(str, re, 'tokens');
            % Unwrap the single capture group of every match. Non-uniform
            % output keeps the result a cell array even with zero matches.
            tokens = cellfun(@(m) m{1}, matches, 'UniformOutput', false);
            if isempty(tokens)
                tokens = {};
                return
            end
            keep = cellfun(@(t) ~isempty(t) && t(1) ~= ';', tokens);
            tokens = tokens(keep);
        end

        function atm = read_atom(rdr)
            % Consume one token from RDR and convert it to a value:
            % integer literal -> double, "..." -> char (unescaped),
            % :name -> types.keyword, nil/true/false -> their values,
            % anything else -> types.Symbol.
            % Raises an error at end of input or on an unterminated string.
            token = rdr.next();
            if reader.at_eof(token)
                error('unexpected EOF');
            end
            if ~isempty(regexp(token, '^-?[0-9]+$', 'match'))
                atm = str2double(token);
            elseif strcmp(token(1), '"')
                % The tokenizer lets a string token end without its
                % closing quote; reject that here.
                if isempty(regexp(token, '^"(?:\\.|[^\\"])*"$', 'once'))
                    error('expected ''"'', got EOF');
                end
                atm = reader.unescape(token(2:end-1));
            elseif strcmp(token(1), ':')
                atm = types.keyword(token);
            elseif strcmp(token, 'nil')
                atm = types.nil;
            elseif strcmp(token, 'true')
                atm = true;
            elseif strcmp(token, 'false')
                atm = false;
            else
                atm = types.Symbol(token);
            end
        end

        function seq = read_seq(rdr, start, last)
            % Read forms delimited by START and LAST (e.g. '(' and ')')
            % and return them as a cell array. Both delimiters are
            % consumed. Raises an error if the next token is not START or
            % if the input ends before LAST is seen.
            seq = {};
            token = rdr.next();
            if ~strcmp(token, start)
                error('expected ''%s''', start);
            end
            token = rdr.peek();
            while ~strcmp(token, last)
                if reader.at_eof(token)
                    error('expected ''%s''', last);
                end
                seq{end+1} = reader.read_form(rdr);
                token = rdr.peek();
            end
            rdr.next();  % consume the closing delimiter
        end

        function lst = read_list(rdr)
            % Read a '(' ... ')' sequence into a types.List.
            seq = reader.read_seq(rdr, '(', ')');
            lst = types.List(seq{:});
        end

        function vec = read_vector(rdr)
            % Read a '[' ... ']' sequence into a types.Vector.
            seq = reader.read_seq(rdr, '[', ']');
            vec = types.Vector(seq{:});
        end

        function map = read_hash_map(rdr)
            % Read a '{' ... '}' sequence into a types.HashMap.
            seq = reader.read_seq(rdr, '{', '}');
            map = types.HashMap(seq{:});
        end

        function ast = read_form(rdr)
            % Read one complete form from RDR, dispatching on the next
            % token: reader macros (' ` ~ ~@ ^ @) expand to the matching
            % list form, opening brackets start a collection, a stray
            % closing bracket is an error, anything else is an atom.
            token = rdr.peek();
            if reader.at_eof(token)
                error('unexpected EOF');
            end
            switch token
                case ''''
                    ast = reader.read_prefixed(rdr, 'quote');
                case '`'
                    ast = reader.read_prefixed(rdr, 'quasiquote');
                case '~'
                    ast = reader.read_prefixed(rdr, 'unquote');
                case '~@'
                    ast = reader.read_prefixed(rdr, 'splice-unquote');
                case '@'
                    ast = reader.read_prefixed(rdr, 'deref');
                case '^'
                    % ^meta form  ->  (with-meta form meta): the metadata
                    % is read first but placed last in the result.
                    rdr.next();
                    meta = reader.read_form(rdr);
                    ast = types.List(types.Symbol('with-meta'), ...
                                     reader.read_form(rdr), meta);
                case ')'
                    error('unexpected '')''');
                case '('
                    ast = reader.read_list(rdr);
                case ']'
                    error('unexpected '']''');
                case '['
                    ast = reader.read_vector(rdr);
                case '}'
                    error('unexpected ''}''');
                case '{'
                    ast = reader.read_hash_map(rdr);
                otherwise
                    ast = reader.read_atom(rdr);
            end
        end

        function ast = read_str(str)
            % Tokenize STR and parse the first form it contains.
            tokens = reader.tokenize(str);
            rdr = Reader(tokens);
            ast = reader.read_form(rdr);
        end
    end

    methods (Static = true, Access = private)
        function tf = at_eof(token)
            % True when TOKEN is not a usable token: a non-text sentinel
            % (logical/numeric) or an empty string.
            tf = islogical(token) || isnumeric(token) || isempty(token);
        end

        function ast = read_prefixed(rdr, symbol_name)
            % Consume a one-token reader macro and wrap the following form
            % as (SYMBOL_NAME form).
            rdr.next();
            ast = types.List(types.Symbol(symbol_name), ...
                             reader.read_form(rdr));
        end

        function out = unescape(body)
            % Translate the escapes \\ , \" and \n in BODY (string token
            % contents without the surrounding quotes) in one
            % left-to-right pass, so an escaped backslash followed by 'n'
            % stays a backslash and an 'n'. Any other backslash sequence
            % is copied through unchanged.
            out = body;  % the result is never longer than the input
            n = length(body);
            src = 1;
            dst = 0;
            while src <= n
                c = body(src);
                replacement = '';
                if c == '\' && src < n
                    switch body(src + 1)
                        case '\'
                            replacement = '\';
                        case '"'
                            replacement = '"';
                        case 'n'
                            replacement = char(10);
                    end
                end
                dst = dst + 1;
                if isempty(replacement)
                    out(dst) = c;
                    src = src + 1;
                else
                    out(dst) = replacement;
                    src = src + 2;
                end
            end
            out = out(1:dst);
        end
    end
end