-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathparser.mly
209 lines (177 loc) · 8.23 KB
/
parser.mly
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
%{
open Utils
open Ast
let loc startpos endpos = Some(startpos, endpos)
(* Parse applications: either set/map/list magic functions,
* or a regular nesting of curryfied applications. *)
let app loc f args =
let collection k list = EColl(loc, k, args) in
match f with
| EId(_, "list") -> collection CList args
| EId(_, "map") -> collection CMap args
| EId(_, "set") -> collection CSet args
| f -> eapp (f::args)
(* TODO catch formulae like "f+1", which are applications but might have
* been intented to be nat additions. The offset difference between
* end of f and beginning of args shall be used. *)
let data_collection ?(loc=noloc) constr_name args =
if not (List.mem constr_name ["list";"set";"map"]) then
failwith "Not a data constructor";
app loc (EId(noloc, constr_name)) args
%}
%token <int> NAT
%token <int> INT
%token <int> TEZ
%token <string> STRING
%token <string> TIMESTAMP
%token <string> SIGNATURE
%token <string> KEY
%token <string> ID
%token <string> TAG
%token LPAREN RPAREN
%token LAMBDA ARROW DOUBLE_ARROW FORALL TYPE_ANNOT
%token COMMA COLON SEMICOLON LEFT_ARROW
%token <int> TUPLE_GET
%token <string> PRODUCT_GET
%token LBRACE RBRACE
%token BAR STORE
%token EQ NEQ LE LT GE GT CONCAT
%token OR AND XOR PLUS MINUS STAR DIV LSR LSL
%token TYPE LET IF CASE ELSE NOT END
%token EOF
%start <Ast.contract> contract
%start <(string*Ast.expr) list> data_store
%start <Ast.expr> data_parameter
%right ARROW
%left OR XOR
%left AND
%nonassoc EQ NEQ
%nonassoc LE LT GE GT
%nonassoc LSR LSL
%left PLUS MINUS
%left STAR DIV
%nonassoc NOT
%%
contract: d=etype_decl* s=store_decl* e=expr EOF {d, s, e}
etype:
| arg=etype ARROW res=etype {let loc = loc $startpos $endpos in TLambda(loc, arg, res, true)}
| arg=etype DOUBLE_ARROW res=etype {let loc = loc $startpos $endpos in TLambda(loc, arg, res, false)}
| id=ID args=etype_arg* {if args=[] then TId(loc $startpos $endpos, id) else TApp(loc $startpos $endpos, id, args)}
| t=etype_tuple {t}
etype_arg: id=ID {TId(loc $startpos $endpos, id)} | t=etype_tuple {t}
etype_tuple: LPAREN types=separated_nonempty_list(STAR, etype) RPAREN {match types with [t]->t | _ ->TTuple(loc $startpos $endpos, types)}
scheme:
| FORALL vars=ID* COLON t=etype {vars, t}
| t=etype {[], t}
etype_decl: TYPE name=ID params=ID* EQ r=composite_decl_rhs {r name params}
composite_decl_rhs:
| t=etype {fun name params -> if name="primitive" && params=[] then DPrim(loc $startpos $endpos, name, params) else DAlias(loc $startpos $endpos, name, params, t)}
| p0=composite_decl_pair STAR pp=separated_list(STAR, composite_decl_pair) {fun name params -> DProduct(loc $startpos $endpos, name, params, p0::pp)}
| p0=composite_decl_pair PLUS pp=separated_list(PLUS, composite_decl_pair) {fun name params -> DSum(loc $startpos $endpos, name, params, p0::pp)}
composite_decl_pair: tag=TAG COLON? t=etype {(tag, t)}
store_decl:
| STORE name=store_tag TYPE_ANNOT t=etype EQ v=data SEMICOLON? {(name, t, Some v)}
| STORE name=store_tag TYPE_ANNOT t=etype SEMICOLON? {(name, t, None)}
atomic_constant:
| n=INT {LInt(loc $startpos $endpos, n)}
| n=NAT {LNat(loc $startpos $endpos, n)}
| n=TEZ {LTez(loc $startpos $endpos, n)}
| n=TIMESTAMP {LTime(loc $startpos $endpos, n)}
| s=SIGNATURE {LSig(loc $startpos $endpos, s)}
| s=STRING {LString(loc $startpos $endpos, s)}
| s=KEY {LKey(loc $startpos $endpos, s)}
data:
| c=atomic_constant {ELit(loc $startpos $endpos, c)}
| LAMBDA p=parameter+ COLON e=expr {not_impl "lambda data"}
| LPAREN p=separated_list(COMMA, data) RPAREN {etuple ~loc:(loc $startpos $endpos) p}
| LPAREN constr=ID args=data* RPAREN {data_collection ~loc:(loc $startpos $endpos) constr args}
| LBRACE p=separated_list(COMMA, data_product_pair) RBRACE {EProduct(loc $startpos $endpos, p);}
| tag=TAG e=data? {match e with Some e -> ESum(loc $startpos $endpos, tag, e) | None -> ESum(loc $startpos $endpos, tag, eunit)}
data_product_pair: tag=TAG COLON? data=data {tag, data}
data_store_item: STORE? i=store_tag EQ d=data {i, d}
data_store: x=data_store_item* EOF {x}
data_parameter: d=data EOF {d}
expr0:
| c=atomic_constant {ELit(loc $startpos $endpos, c)}
| s=ID {EId(loc $startpos $endpos, s)}
| LAMBDA p=separated_nonempty_list(COMMA, parameter) opt_type_annot COLON res=expr_sequence {
let loc = loc $startpos $endpos in
let p_prm, t_prm = match p with
| [] -> assert false
| [p, t] -> p, t
| _ -> PTuple(List.map fst p), ttuple(List.map snd p) in
elambda ~loc p_prm t_prm res
}
| LPAREN RPAREN {eunit_loc (loc $startpos $endpos)}
| LPAREN e=expr RPAREN {e}
| LPAREN e0=expr COMMA rest=separated_nonempty_list(COMMA, expr) RPAREN {
let loc = loc $startpos $endpos in
etuple ~loc (e0::rest) }
| LPAREN e0=expr SEMICOLON rest=separated_nonempty_list(SEMICOLON, expr) RPAREN {
let loc = loc $startpos $endpos in
esequence ~loc (e0::rest) }
| CASE e=expr BAR c=separated_list(BAR, sum_case) END {ESumCase(loc $startpos $endpos, e, c)}
| IF BAR? c=separated_list(BAR, if_case) END {let loc=loc $startpos $endpos in eif ~loc c}
| LBRACE p=separated_list(COMMA, product_pair) RBRACE {EProduct(loc $startpos $endpos, p);}
| LET p=parameter opt_scheme_annot EQ e0=expr SEMICOLON e1=expr {ELet(loc $startpos $endpos, fst p, ([], snd p), e0, e1)} (* TODO keep annotation if present *)
| e=expr0 tag=PRODUCT_GET {EProductGet(loc $startpos $endpos, e, tag)}
| e0=expr0 LEFT_ARROW tag=TAG COLON e1=expr {EProductSet(loc $startpos $endpos, e0, tag, e1)}
| e=expr0 n=TUPLE_GET {ETupleGet(loc $startpos $endpos, e, n)}
| STORE s=store_tag {EProductGet(loc $startpos $endpos, EId(loc $startpos $endpos, "@"), s)}
| STORE s=store_tag LEFT_ARROW e0=expr SEMICOLON e1=expr {EStoreSet(loc $startpos $endpos, s, e0, e1)}
opt_type_annot: TYPE_ANNOT t=etype {t} | {fresh_tvar()}
opt_scheme_annot: TYPE_ANNOT s=scheme {s} | {[], fresh_tvar()}
expr:
| f=expr0 args=expr_arg* { app (loc $startpos $endpos) f args }
| tag=TAG e=expr0? {
let loc=loc $startpos $endpos in
let arg = match e with Some e -> [e] | None -> [] in
esum ~loc tag arg}
| e=expr TYPE_ANNOT t=etype {ETypeAnnot(loc $startpos $endpos, e, t)}
(* TODO can put infix operators in a separate rule if it's inlined, to preserve precedences. *)
| a=expr EQ b=expr {EBinOp(loc $startpos $endpos, a, BEq, b)}
| a=expr NEQ b=expr {EBinOp(loc $startpos $endpos, a, BNeq, b)}
| a=expr LE b=expr {EBinOp(loc $startpos $endpos, a, BLe, b)}
| a=expr LT b=expr {EBinOp(loc $startpos $endpos, a, BLt, b)}
| a=expr GE b=expr {EBinOp(loc $startpos $endpos, a, BGe, b)}
| a=expr GT b=expr {EBinOp(loc $startpos $endpos, a, BGt, b)}
| a=expr CONCAT b=expr {EBinOp(loc $startpos $endpos, a, BConcat, b)}
| a=expr OR b=expr {EBinOp(loc $startpos $endpos, a, BOr, b)}
| a=expr AND b=expr {EBinOp(loc $startpos $endpos, a, BAnd, b)}
| a=expr XOR b=expr {EBinOp(loc $startpos $endpos, a, BXor, b)}
| a=expr PLUS b=expr {EBinOp(loc $startpos $endpos, a, BAdd, b)}
| a=expr MINUS b=expr {EBinOp(loc $startpos $endpos, a, BSub, b)}
| a=expr STAR b=expr {EBinOp(loc $startpos $endpos, a, BMul, b)}
| a=expr DIV b=expr {EBinOp(loc $startpos $endpos, a, BDiv, b)}
| a=expr LSR b=expr {EBinOp(loc $startpos $endpos, a, BLsr, b)}
| a=expr LSL b=expr {EBinOp(loc $startpos $endpos, a, BLsl, b)}
| MINUS a=expr {EUnOp(loc $startpos $endpos, UNeg, a)}
| NOT a=expr {EUnOp(loc $startpos $endpos, UNot, a)}
expr_arg:
| e=expr0 {e}
| tag=TAG {esum ~loc:(loc $startpos $endpos) tag []}
/* Why did I put this?! | LPAREN e=expr RPAREN {e} */
expr_sequence: l=separated_nonempty_list(SEMICOLON, expr) {
match l with
| [e] -> e
| _ -> let loc =loc $startpos $endpos in esequence ~loc l
}
store_tag: t=TAG {"@"^t} | v=ID {"@"^String.capitalize_ascii v}
sum_case:
| tag=TAG COLON expr=expr_sequence {(tag, (PAny, expr))}
| tag=TAG p=pattern COLON? expr=expr_sequence {(tag, (p, expr))}
if_case:
| cond=expr COLON body=expr_sequence {(cond, body)}
| ELSE COLON? body=expr_sequence {(esum "True" [], body)}
product_pair: tag=TAG COLON? expr=expr {tag, expr}
parameter:
/* | id=ID {PId id, ([], fresh_tvar ~prefix:id ())} */
| p=pattern {p, fresh_tvar()}
| p=pattern TYPE_ANNOT t=etype {p, t}
/* TODO allow schemes in lets, not in lambdas */
pattern:
| id=ID { PId id}
| LPAREN p=separated_list(COMMA, pattern) RPAREN {PTuple p}
| LBRACE p=separated_list(COMMA, product_pattern_list) RBRACE {PProduct p}
product_pattern_list:
| t=TAG COLON p=pattern {t, p}