types and locations
[ccc.git] / ast.c
1 #include <stdlib.h>
2 #include <stdio.h>
3 #include <string.h>
4
5 #include "util.h"
6 #include "ast.h"
7 #include "y.tab.h"
8
9 static const char *binop_str[] = {
10 [binor] = "||", [binand] = "&&", [eq] = "==", [neq] = "!=",
11 [leq] = "<=", [le] = "<", [geq] = ">=", [ge] = ">", [cons] = ":",
12 [plus] = "+", [minus] = "-", [times] = "*", [divide] = "/",
13 [modulo] = "%", [power] = "^",
14 };
15 static const char *fieldspec_str[] = {
16 [fst] = "fst", [snd] = "snd", [hd] = "hd", [tl] = "tl"};
17 static const char *unop_str[] = { [inverse] = "!", [negate] = "-", };
18 static const char *basictype_str[] = {
19 [btbool] = "Bool", [btchar] = "Char", [btint] = "Int",
20 [btvoid] = "Void",
21 };
22
23 struct ast *ast(struct list *decls)
24 {
25 struct ast *res = safe_malloc(sizeof(struct ast));
26 res->decls = (struct decl **)list_to_array(decls, &res->ndecls, true);
27 return res;
28 }
29
30 struct vardecl *vardecl(struct type *type, char *ident, struct expr *expr)
31 {
32 struct vardecl *res = safe_malloc(sizeof(struct vardecl));
33 res->type = type;
34 res->ident = ident;
35 res->expr = expr;
36 return res;
37 }
38
39 struct decl *decl_fun(char *ident, struct list *args, struct list *atypes,
40 struct type *rtype, struct list *vars, struct list *body)
41 {
42 struct decl *res = safe_malloc(sizeof(struct decl));
43 res->type = dfundecl;
44 res->data.dfun.ident = ident;
45 res->data.dfun.args = (char **)
46 list_to_array(args, &res->data.dfun.nargs, true);
47 res->data.dfun.atypes = (struct type **)
48 list_to_array(atypes, &res->data.dfun.natypes, true);
49 res->data.dfun.rtype = rtype;
50 res->data.dfun.vars = (struct vardecl **)
51 list_to_array(vars, &res->data.dfun.nvar, true);
52 res->data.dfun.body = (struct stmt **)
53 list_to_array(body, &res->data.dfun.nbody, true);
54 return res;
55 }
56
57 struct decl *decl_var(struct vardecl *vardecl)
58 {
59 struct decl *res = safe_malloc(sizeof(struct decl));
60 res->type = dvardecl;
61 res->data.dvar = vardecl;
62 return res;
63 }
64
65 struct stmt *stmt_assign(char *ident, struct expr *expr)
66 {
67 struct stmt *res = safe_malloc(sizeof(struct stmt));
68 res->type = sassign;
69 res->data.sassign.ident = ident;
70 res->data.sassign.expr = expr;
71 return res;
72 }
73
74 struct stmt *stmt_if(struct expr *pred, struct list *then, struct list *els)
75 {
76 struct stmt *res = safe_malloc(sizeof(struct stmt));
77 res->type = sif;
78 res->data.sif.pred = pred;
79 res->data.sif.then = (struct stmt **)
80 list_to_array(then, &res->data.sif.nthen, true);
81 res->data.sif.els = (struct stmt **)
82 list_to_array(els, &res->data.sif.nels, true);
83 return res;
84 }
85
86 struct stmt *stmt_return(struct expr *rtrn)
87 {
88 struct stmt *res = safe_malloc(sizeof(struct stmt));
89 res->type = sreturn;
90 res->data.sreturn = rtrn;
91 return res;
92 }
93
94 struct stmt *stmt_expr(struct expr *expr)
95 {
96 struct stmt *res = safe_malloc(sizeof(struct stmt));
97 res->type = sexpr;
98 res->data.sexpr = expr;
99 return res;
100 }
101
102 struct stmt *stmt_while(struct expr *pred, struct list *body)
103 {
104 struct stmt *res = safe_malloc(sizeof(struct stmt));
105 res->type = swhile;
106 res->data.swhile.pred = pred;
107 res->data.swhile.body = (struct stmt **)
108 list_to_array(body, &res->data.swhile.nbody, true);
109 return res;
110 }
111
112 struct expr *expr_binop(struct expr *l, enum binop op, struct expr *r)
113 {
114 struct expr *res = safe_malloc(sizeof(struct expr));
115 res->type = ebinop;
116 res->data.ebinop.l = l;
117 res->data.ebinop.op = op;
118 res->data.ebinop.r = r;
119 return res;
120 }
121
122 struct expr *expr_bool(bool b)
123 {
124 struct expr *res = safe_malloc(sizeof(struct expr));
125 res->type = ebool;
126 res->data.ebool = b;
127 return res;
128 }
/*
 * Convert one hexadecimal digit to its numeric value.
 *
 * Accepts '0'-'9', 'a'-'f' and 'A'-'F'.
 * Returns 0..15 for a valid digit and -1 for any other character.
 */
int fromHex(char c)
{
	int value = -1;

	if ('0' <= c && c <= '9')
		value = c - '0';
	else if ('a' <= c && c <= 'f')
		value = 10 + (c - 'a');
	else if ('A' <= c && c <= 'F')
		value = 10 + (c - 'A');
	return value;
}
139
140 struct expr *expr_char(const char *c)
141 {
142 struct expr *res = safe_malloc(sizeof(struct expr));
143 res->type = echar;
144 //regular char
145 if (strlen(c) == 3)
146 res->data.echar = c[1];
147 //escape
148 if (strlen(c) == 4)
149 switch(c[2]) {
150 case '0': res->data.echar = '\0'; break;
151 case 'a': res->data.echar = '\a'; break;
152 case 'b': res->data.echar = '\b'; break;
153 case 't': res->data.echar = '\t'; break;
154 case 'v': res->data.echar = '\v'; break;
155 case 'f': res->data.echar = '\f'; break;
156 case 'r': res->data.echar = '\r'; break;
157 }
158 //hex escape
159 if (strlen(c) == 6)
160 res->data.echar = (fromHex(c[3])<<4)+fromHex(c[4]);
161 return res;
162 }
163
164 struct expr *expr_funcall(char *ident, struct list *args)
165 {
166 struct expr *res = safe_malloc(sizeof(struct expr));
167 res->type = efuncall;
168 res->data.efuncall.ident = ident;
169 res->data.efuncall.args = (struct expr **)
170 list_to_array(args, &res->data.efuncall.nargs, true);
171 return res;
172 }
173
174 struct expr *expr_int(int integer)
175 {
176 struct expr *res = safe_malloc(sizeof(struct expr));
177 res->type = eint;
178 res->data.eint = integer;
179 return res;
180 }
181
182 struct expr *expr_ident(char *ident, struct list *fields)
183 {
184 struct expr *res = safe_malloc(sizeof(struct expr));
185 res->type = eident;
186 res->data.eident.ident = ident;
187
188 void **els = list_to_array(fields, &res->data.eident.nfields, true);
189 res->data.eident.fields = (enum fieldspec *)safe_malloc(
190 res->data.eident.nfields*sizeof(enum fieldspec));
191 for (int i = 0; i<res->data.eident.nfields; i++) {
192 char *t = els[i];
193 if (strcmp(t, "fst") == 0)
194 res->data.eident.fields[i] = fst;
195 else if (strcmp(t, "snd") == 0)
196 res->data.eident.fields[i] = snd;
197 else if (strcmp(t, "hd") == 0)
198 res->data.eident.fields[i] = hd;
199 else if (strcmp(t, "tl") == 0)
200 res->data.eident.fields[i] = tl;
201 free(t);
202 }
203 free(els);
204 return res;
205 }
206
207 struct expr *expr_nil()
208 {
209 struct expr *res = safe_malloc(sizeof(struct expr));
210 res->type = enil;
211 return res;
212 }
213
214 struct expr *expr_tuple(struct expr *left, struct expr *right)
215 {
216 struct expr *res = safe_malloc(sizeof(struct expr));
217 res->type = etuple;
218 res->data.etuple.left = left;
219 res->data.etuple.right = right;
220 return res;
221 }
222
223 struct expr *expr_unop(enum unop op, struct expr *l)
224 {
225 struct expr *res = safe_malloc(sizeof(struct expr));
226 res->type = eunop;
227 res->data.eunop.op = op;
228 res->data.eunop.l = l;
229 return res;
230 }
231
232 struct type *type_list(struct type *type)
233 {
234 struct type *res = safe_malloc(sizeof(struct type));
235 res->type = tlist;
236 res->data.tlist = type;
237 return res;
238 }
239
240 struct type *type_tuple(struct type *l, struct type *r)
241 {
242 struct type *res = safe_malloc(sizeof(struct type));
243 res->type = ttuple;
244 res->data.ttuple.l = l;
245 res->data.ttuple.r = r;
246 return res;
247 }
248
249 struct type *type_var(char *ident)
250 {
251 struct type *res = safe_malloc(sizeof(struct type));
252 if (strcmp(ident, "Int") == 0) {
253 res->type = tbasic;
254 res->data.tbasic = btint;
255 free(ident);
256 } else if (strcmp(ident, "Char") == 0) {
257 res->type = tbasic;
258 res->data.tbasic = btchar;
259 free(ident);
260 } else if (strcmp(ident, "Bool") == 0) {
261 res->type = tbasic;
262 res->data.tbasic = btbool;
263 free(ident);
264 } else if (strcmp(ident, "Void") == 0) {
265 res->type = tbasic;
266 res->data.tbasic = btvoid;
267 free(ident);
268 } else {
269 res->type = tvar;
270 res->data.tvar = ident;
271 }
272 return res;
273 }
274
275
/*
 * Escaped spelling of the non-printable characters, indexed by character
 * code. Entries exist for codes 0..31 and 127 only; every index in between
 * is NULL. expr_print consults this table for character literals.
 */
const char *cescapes[] = {
	/*  0.. 3 */ "\\0",   "\\x01", "\\x02", "\\x03",
	/*  4.. 7 */ "\\x04", "\\x05", "\\x06", "\\a",
	/*  8..11 */ "\\b",   "\\t",   "\\n",   "\\v",
	/* 12..15 */ "\\f",   "\\r",   "\\x0E", "\\x0F",
	/* 16..19 */ "\\x10", "\\x11", "\\x12", "\\x13",
	/* 20..23 */ "\\x14", "\\x15", "\\x16", "\\x17",
	/* 24..27 */ "\\x18", "\\x19", "\\x1A", "\\x1B",
	/* 28..31 */ "\\x1C", "\\x1D", "\\x1E", "\\x1F",
	[127] = "\\x7F"
};
287
288 void ast_print(struct ast *ast, FILE *out)
289 {
290 if (ast == NULL)
291 return;
292 for (int i = 0; i<ast->ndecls; i++)
293 decl_print(ast->decls[i], 0, out);
294 }
295
296 void vardecl_print(struct vardecl *decl, int indent, FILE *out)
297 {
298 pindent(indent, out);
299 if (decl->type == NULL)
300 safe_fprintf(out, "var");
301 else
302 type_print(decl->type, out);
303 safe_fprintf(out, " %s = ", decl->ident);
304 expr_print(decl->expr, out);
305 safe_fprintf(out, ";\n");
306 }
307
308 void decl_print(struct decl *decl, int indent, FILE *out)
309 {
310 if (decl == NULL)
311 return;
312 switch(decl->type) {
313 case dfundecl:
314 pindent(indent, out);
315 safe_fprintf(out, "%s (", decl->data.dfun.ident);
316 for (int i = 0; i<decl->data.dfun.nargs; i++) {
317 safe_fprintf(out, "%s", decl->data.dfun.args[i]);
318 if (i < decl->data.dfun.nargs - 1)
319 safe_fprintf(out, ", ");
320 }
321 safe_fprintf(out, ")");
322 if (decl->data.dfun.rtype != NULL) {
323 safe_fprintf(out, " :: ");
324 for (int i = 0; i<decl->data.dfun.natypes; i++) {
325 type_print(decl->data.dfun.atypes[i], out);
326 safe_fprintf(out, " ");
327 }
328 safe_fprintf(out, "-> ");
329 type_print(decl->data.dfun.rtype, out);
330 }
331 safe_fprintf(out, " {\n");
332 for (int i = 0; i<decl->data.dfun.nvar; i++)
333 vardecl_print(decl->data.dfun.vars[i], indent+1, out);
334 for (int i = 0; i<decl->data.dfun.nbody; i++)
335 stmt_print(decl->data.dfun.body[i], indent+1, out);
336 pindent(indent, out);
337 safe_fprintf(out, "}\n");
338 break;
339 case dvardecl:
340 vardecl_print(decl->data.dvar, indent, out);
341 break;
342 default:
343 die("Unsupported decl node\n");
344 }
345 }
346
347 void stmt_print(struct stmt *stmt, int indent, FILE *out)
348 {
349 if (stmt == NULL)
350 return;
351 switch(stmt->type) {
352 case sassign:
353 pindent(indent, out);
354 fprintf(out, "%s", stmt->data.sassign.ident);
355 safe_fprintf(out, " = ");
356 expr_print(stmt->data.sassign.expr, out);
357 safe_fprintf(out, ";\n");
358 break;
359 case sif:
360 pindent(indent, out);
361 safe_fprintf(out, "if (");
362 expr_print(stmt->data.sif.pred, out);
363 safe_fprintf(out, ") {\n");
364 for (int i = 0; i<stmt->data.sif.nthen; i++)
365 stmt_print(stmt->data.sif.then[i], indent+1, out);
366 pindent(indent, out);
367 safe_fprintf(out, "} else {\n");
368 for (int i = 0; i<stmt->data.sif.nels; i++)
369 stmt_print(stmt->data.sif.els[i], indent+1, out);
370 pindent(indent, out);
371 safe_fprintf(out, "}\n");
372 break;
373 case sreturn:
374 pindent(indent, out);
375 safe_fprintf(out, "return ");
376 expr_print(stmt->data.sreturn, out);
377 safe_fprintf(out, ";\n");
378 break;
379 case sexpr:
380 pindent(indent, out);
381 expr_print(stmt->data.sexpr, out);
382 safe_fprintf(out, ";\n");
383 break;
384 case swhile:
385 pindent(indent, out);
386 safe_fprintf(out, "while (");
387 expr_print(stmt->data.swhile.pred, out);
388 safe_fprintf(out, ") {\n");
389 for (int i = 0; i<stmt->data.swhile.nbody; i++) {
390 stmt_print(stmt->data.swhile.body[i], indent+1, out);
391 }
392 pindent(indent, out);
393 safe_fprintf(out, "}\n");
394 break;
395 default:
396 die("Unsupported stmt node\n");
397 }
398 }
399
400 void expr_print(struct expr *expr, FILE *out)
401 {
402 if (expr == NULL)
403 return;
404 switch(expr->type) {
405 case ebinop:
406 safe_fprintf(out, "(");
407 expr_print(expr->data.ebinop.l, out);
408 safe_fprintf(out, "%s", binop_str[expr->data.ebinop.op]);
409 expr_print(expr->data.ebinop.r, out);
410 safe_fprintf(out, ")");
411 break;
412 case ebool:
413 safe_fprintf(out, "%s", expr->data.ebool ? "true" : "false");
414 break;
415 case echar:
416 if (expr->data.echar < 0)
417 safe_fprintf(out, "'?'");
418 if (expr->data.echar < ' ' || expr->data.echar == 127)
419 safe_fprintf(out, "'%s'",
420 cescapes[(int)expr->data.echar]);
421 else
422 safe_fprintf(out, "'%c'", expr->data.echar);
423 break;
424 case efuncall:
425 safe_fprintf(out, "%s(", expr->data.efuncall.ident);
426 for(int i = 0; i<expr->data.efuncall.nargs; i++) {
427 expr_print(expr->data.efuncall.args[i], out);
428 if (i+1 < expr->data.efuncall.nargs)
429 safe_fprintf(out, ", ");
430 }
431 safe_fprintf(out, ")");
432 break;
433 case eint:
434 safe_fprintf(out, "%d", expr->data.eint);
435 break;
436 case eident:
437 fprintf(out, "%s", expr->data.eident.ident);
438 for (int i = 0; i<expr->data.eident.nfields; i++)
439 fprintf(out, ".%s",
440 fieldspec_str[expr->data.eident.fields[i]]);
441 break;
442 case enil:
443 safe_fprintf(out, "[]");
444 break;
445 case etuple:
446 safe_fprintf(out, "(");
447 expr_print(expr->data.etuple.left, out);
448 safe_fprintf(out, ", ");
449 expr_print(expr->data.etuple.right, out);
450 safe_fprintf(out, ")");
451 break;
452 case eunop:
453 safe_fprintf(out, "(%s", unop_str[expr->data.eunop.op]);
454 expr_print(expr->data.eunop.l, out);
455 safe_fprintf(out, ")");
456 break;
457 default:
458 die("Unsupported expr node\n");
459 }
460 }
461
462 void type_print(struct type *type, FILE *out)
463 {
464 if (type == NULL)
465 return;
466 switch (type->type) {
467 case tbasic:
468 safe_fprintf(out, "%s", basictype_str[type->data.tbasic]);
469 break;
470 case tlist:
471 safe_fprintf(out, "[");
472 type_print(type->data.tlist, out);
473 safe_fprintf(out, "]");
474 break;
475 case ttuple:
476 safe_fprintf(out, "(");
477 type_print(type->data.ttuple.l, out);
478 safe_fprintf(out, ",");
479 type_print(type->data.ttuple.r, out);
480 safe_fprintf(out, ")");
481 break;
482 case tvar:
483 safe_fprintf(out, "%s", type->data.tvar);
484 break;
485 default:
486 die("Unsupported type node\n");
487 }
488 }
489
490 void ast_free(struct ast *ast)
491 {
492 if (ast == NULL)
493 return;
494 for (int i = 0; i<ast->ndecls; i++)
495 decl_free(ast->decls[i]);
496 free(ast->decls);
497 free(ast);
498 }
499
500 void vardecl_free(struct vardecl *decl)
501 {
502 type_free(decl->type);
503 free(decl->ident);
504 expr_free(decl->expr);
505 free(decl);
506 }
507
508 void decl_free(struct decl *decl)
509 {
510 if (decl == NULL)
511 return;
512 switch(decl->type) {
513 case dfundecl:
514 free(decl->data.dfun.ident);
515 for (int i = 0; i<decl->data.dfun.nargs; i++)
516 free(decl->data.dfun.args[i]);
517 free(decl->data.dfun.args);
518 for (int i = 0; i<decl->data.dfun.natypes; i++)
519 type_free(decl->data.dfun.atypes[i]);
520 free(decl->data.dfun.atypes);
521 type_free(decl->data.dfun.rtype);
522 for (int i = 0; i<decl->data.dfun.nvar; i++)
523 vardecl_free(decl->data.dfun.vars[i]);
524 free(decl->data.dfun.vars);
525 for (int i = 0; i<decl->data.dfun.nbody; i++)
526 stmt_free(decl->data.dfun.body[i]);
527 free(decl->data.dfun.body);
528 break;
529 case dvardecl:
530 vardecl_free(decl->data.dvar);
531 break;
532 default:
533 die("Unsupported decl node\n");
534 }
535 free(decl);
536 }
537
538 void stmt_free(struct stmt *stmt)
539 {
540 if (stmt == NULL)
541 return;
542 switch(stmt->type) {
543 case sassign:
544 free(stmt->data.sassign.ident);
545 expr_free(stmt->data.sassign.expr);
546 break;
547 case sif:
548 expr_free(stmt->data.sif.pred);
549 for (int i = 0; i<stmt->data.sif.nthen; i++)
550 stmt_free(stmt->data.sif.then[i]);
551 free(stmt->data.sif.then);
552 for (int i = 0; i<stmt->data.sif.nels; i++)
553 stmt_free(stmt->data.sif.els[i]);
554 free(stmt->data.sif.els);
555 break;
556 case sreturn:
557 expr_free(stmt->data.sreturn);
558 break;
559 case sexpr:
560 expr_free(stmt->data.sexpr);
561 break;
562 case swhile:
563 expr_free(stmt->data.swhile.pred);
564 for (int i = 0; i<stmt->data.swhile.nbody; i++)
565 stmt_free(stmt->data.swhile.body[i]);
566 free(stmt->data.swhile.body);
567 break;
568 default:
569 die("Unsupported stmt node\n");
570 }
571 free(stmt);
572 }
573
574 void expr_free(struct expr *expr)
575 {
576 if (expr == NULL)
577 return;
578 switch(expr->type) {
579 case ebinop:
580 expr_free(expr->data.ebinop.l);
581 expr_free(expr->data.ebinop.r);
582 break;
583 case ebool:
584 break;
585 case echar:
586 break;
587 case efuncall:
588 free(expr->data.efuncall.ident);
589 for (int i = 0; i<expr->data.efuncall.nargs; i++)
590 expr_free(expr->data.efuncall.args[i]);
591 free(expr->data.efuncall.args);
592 break;
593 case eint:
594 break;
595 case eident:
596 free(expr->data.eident.ident);
597 free(expr->data.eident.fields);
598 break;
599 case enil:
600 break;
601 case etuple:
602 expr_free(expr->data.etuple.left);
603 expr_free(expr->data.etuple.right);
604 break;
605 case eunop:
606 expr_free(expr->data.eunop.l);
607 break;
608 default:
609 die("Unsupported expr node\n");
610 }
611 free(expr);
612 }
613
614 void type_free(struct type *type)
615 {
616 if (type == NULL)
617 return;
618 switch (type->type) {
619 case tbasic:
620 break;
621 case tlist:
622 type_free(type->data.tlist);
623 break;
624 case ttuple:
625 type_free(type->data.ttuple.l);
626 type_free(type->data.ttuple.r);
627 break;
628 case tvar:
629 free(type->data.tvar);
630 break;
631 default:
632 die("Unsupported type node\n");
633 }
634 free(type);
635 }