add parsing of asm statements, avoid some statement casts
[cparser] / ast.c
1 #include <config.h>
2
3 #include "ast_t.h"
4 #include "type_t.h"
5
6 #include <assert.h>
7 #include <stdio.h>
8 #include <stdlib.h>
9 #include <ctype.h>
10
11 #include "adt/error.h"
12
/* Obstack owned by this module: initialised in init_ast(), freed in exit_ast(). */
struct obstack ast_obstack;

/* Stream every print_* function in this file writes to; set by ast_set_output(). */
static FILE *out;
/* Current indentation depth, i.e. the number of tabs print_indent() emits. */
static int   indent;

/* Forward declaration: the statement printers below recurse into it. */
static void print_statement(const statement_t *statement);
19
/**
 * Adjusts the current indentation depth by @p delta (which may be negative).
 * The resulting depth must not drop below zero; this is checked by an assert.
 */
void change_indent(int delta)
{
        indent += delta;
        assert(indent >= 0);
}
25
26 void print_indent(void)
27 {
28         for(int i = 0; i < indent; ++i)
29                 fprintf(out, "\t");
30 }
31
32 static void print_const(const const_expression_t *cnst)
33 {
34         if(cnst->expression.datatype == NULL)
35                 return;
36
37         if(is_type_integer(cnst->expression.datatype)) {
38                 fprintf(out, "%lld", cnst->v.int_value);
39         } else if(is_type_floating(cnst->expression.datatype)) {
40                 fprintf(out, "%Lf", cnst->v.float_value);
41         }
42 }
43
44 static void print_quoted_string(const char *string)
45 {
46         fputc('"', out);
47         for(const char *c = string; *c != '\0'; ++c) {
48                 switch(*c) {
49                 case '\"':  fputs("\\\"", out); break;
50                 case '\\':  fputs("\\\\", out); break;
51                 case '\a':  fputs("\\a", out); break;
52                 case '\b':  fputs("\\b", out); break;
53                 case '\f':  fputs("\\f", out); break;
54                 case '\n':  fputs("\\n", out); break;
55                 case '\r':  fputs("\\r", out); break;
56                 case '\t':  fputs("\\t", out); break;
57                 case '\v':  fputs("\\v", out); break;
58                 case '\?':  fputs("\\?", out); break;
59                 default:
60                         if(!isprint(*c)) {
61                                 fprintf(out, "\\x%x", *c);
62                                 break;
63                         }
64                         fputc(*c, out);
65                         break;
66                 }
67         }
68         fputc('"', out);
69 }
70
/**
 * Prints the value of a string literal expression as a quoted, escaped
 * string.
 */
static void print_string_literal(
                const string_literal_expression_t *string_literal)
{
        print_quoted_string(string_literal->value);
}
76
77 static void print_call_expression(const call_expression_t *call)
78 {
79         print_expression(call->function);
80         fprintf(out, "(");
81         call_argument_t *argument = call->arguments;
82         int              first    = 1;
83         while(argument != NULL) {
84                 if(!first) {
85                         fprintf(out, ", ");
86                 } else {
87                         first = 0;
88                 }
89                 print_expression(argument->expression);
90
91                 argument = argument->next;
92         }
93         fprintf(out, ")");
94 }
95
96 static void print_binary_expression(const binary_expression_t *binexpr)
97 {
98         fprintf(out, "(");
99         print_expression(binexpr->left);
100         fprintf(out, " ");
101         switch(binexpr->type) {
102         case BINEXPR_INVALID:            fputs("INVOP", out); break;
103         case BINEXPR_COMMA:              fputs(",", out);     break;
104         case BINEXPR_ASSIGN:             fputs("=", out);     break;
105         case BINEXPR_ADD:                fputs("+", out);     break;
106         case BINEXPR_SUB:                fputs("-", out);     break;
107         case BINEXPR_MUL:                fputs("*", out);     break;
108         case BINEXPR_MOD:                fputs("%", out);     break;
109         case BINEXPR_DIV:                fputs("/", out);     break;
110         case BINEXPR_BITWISE_OR:         fputs("|", out);     break;
111         case BINEXPR_BITWISE_AND:        fputs("&", out);     break;
112         case BINEXPR_BITWISE_XOR:        fputs("^", out);     break;
113         case BINEXPR_LOGICAL_OR:         fputs("||", out);    break;
114         case BINEXPR_LOGICAL_AND:        fputs("&&", out);    break;
115         case BINEXPR_NOTEQUAL:           fputs("!=", out);    break;
116         case BINEXPR_EQUAL:              fputs("==", out);    break;
117         case BINEXPR_LESS:               fputs("<", out);     break;
118         case BINEXPR_LESSEQUAL:          fputs("<=", out);    break;
119         case BINEXPR_GREATER:            fputs(">", out);     break;
120         case BINEXPR_GREATEREQUAL:       fputs(">=", out);    break;
121         case BINEXPR_SHIFTLEFT:          fputs("<<", out);    break;
122         case BINEXPR_SHIFTRIGHT:         fputs(">>", out);    break;
123
124         case BINEXPR_ADD_ASSIGN:         fputs("+=", out);    break;
125         case BINEXPR_SUB_ASSIGN:         fputs("-=", out);    break;
126         case BINEXPR_MUL_ASSIGN:         fputs("*=", out);    break;
127         case BINEXPR_MOD_ASSIGN:         fputs("%=", out);    break;
128         case BINEXPR_DIV_ASSIGN:         fputs("/=", out);    break;
129         case BINEXPR_BITWISE_OR_ASSIGN:  fputs("|=", out);    break;
130         case BINEXPR_BITWISE_AND_ASSIGN: fputs("&=", out);    break;
131         case BINEXPR_BITWISE_XOR_ASSIGN: fputs("^=", out);    break;
132         case BINEXPR_SHIFTLEFT_ASSIGN:   fputs("<<=", out);   break;
133         case BINEXPR_SHIFTRIGHT_ASSIGN:  fputs(">>=", out);   break;
134         }
135         fprintf(out, " ");
136         print_expression(binexpr->right);
137         fprintf(out, ")");
138 }
139
140 static void print_unary_expression(const unary_expression_t *unexpr)
141 {
142         switch(unexpr->type) {
143         case UNEXPR_NEGATE:           fputs("-", out);  break;
144         case UNEXPR_PLUS:             fputs("+", out);  break;
145         case UNEXPR_NOT:              fputs("!", out);  break;
146         case UNEXPR_BITWISE_NEGATE:   fputs("~", out);  break;
147         case UNEXPR_PREFIX_INCREMENT: fputs("++", out); break;
148         case UNEXPR_PREFIX_DECREMENT: fputs("--", out); break;
149         case UNEXPR_DEREFERENCE:      fputs("*", out);  break;
150         case UNEXPR_TAKE_ADDRESS:     fputs("&", out);  break;
151
152         case UNEXPR_POSTFIX_INCREMENT:
153                 fputs("(", out);
154                 print_expression(unexpr->value);
155                 fputs(")", out);
156                 fputs("++", out);
157                 return;
158         case UNEXPR_POSTFIX_DECREMENT:
159                 fputs("(", out);
160                 print_expression(unexpr->value);
161                 fputs(")", out);
162                 fputs("--", out);
163                 return;
164         case UNEXPR_CAST:
165                 fputs("(", out);
166                 print_type(unexpr->expression.datatype);
167                 fputs(")", out);
168                 break;
169         case UNEXPR_INVALID:
170                 fprintf(out, "unop%d", (int) unexpr->type);
171                 break;
172         }
173         fputs("(", out);
174         print_expression(unexpr->value);
175         fputs(")", out);
176 }
177
178 static void print_reference_expression(const reference_expression_t *ref)
179 {
180         fprintf(out, "%s", ref->declaration->symbol->string);
181 }
182
183 static void print_array_expression(const array_access_expression_t *expression)
184 {
185         if(!expression->flipped) {
186                 fputs("(", out);
187                 print_expression(expression->array_ref);
188                 fputs(")[", out);
189                 print_expression(expression->index);
190                 fputs("]", out);
191         } else {
192                 fputs("(", out);
193                 print_expression(expression->index);
194                 fputs(")[", out);
195                 print_expression(expression->array_ref);
196                 fputs("]", out);
197         }
198 }
199
200 static void print_sizeof_expression(const sizeof_expression_t *expression)
201 {
202         fputs("sizeof", out);
203         if(expression->size_expression != NULL) {
204                 fputc('(', out);
205                 print_expression(expression->size_expression);
206                 fputc(')', out);
207         } else {
208                 fputc('(', out);
209                 print_type(expression->type);
210                 fputc(')', out);
211         }
212 }
213
/**
 * Prints a builtin symbol expression as the name of its symbol.
 */
static void print_builtin_symbol(const builtin_symbol_expression_t *expression)
{
        fputs(expression->symbol->string, out);
}
218
219 static void print_conditional(const conditional_expression_t *expression)
220 {
221         fputs("(", out);
222         print_expression(expression->condition);
223         fputs(" ? ", out);
224         print_expression(expression->true_expression);
225         fputs(" : ", out);
226         print_expression(expression->false_expression);
227         fputs(")", out);
228 }
229
230 static void print_va_arg(const va_arg_expression_t *expression)
231 {
232         fputs("__builtin_va_arg(", out);
233         print_expression(expression->arg);
234         fputs(", ", out);
235         print_type(expression->expression.datatype);
236         fputs(")", out);
237 }
238
239 static void print_select(const select_expression_t *expression)
240 {
241         print_expression(expression->compound);
242         if(expression->compound->base.datatype == NULL ||
243                         expression->compound->base.datatype->type == TYPE_POINTER) {
244                 fputs("->", out);
245         } else {
246                 fputc('.', out);
247         }
248         fputs(expression->symbol->string, out);
249 }
250
251 static void print_classify_type_expression(
252         const classify_type_expression_t *const expr)
253 {
254         fputs("__builtin_classify_type(", out);
255         print_expression(expr->type_expression);
256         fputc(')', out);
257 }
258
/**
 * Prints an expression to the current output stream by dispatching on the
 * expression kind to the matching print_* helper.
 *
 * @param expression  the expression to print (must not be NULL)
 */
void print_expression(const expression_t *expression)
{
        switch(expression->type) {
        case EXPR_UNKNOWN:
        case EXPR_INVALID:
                fprintf(out, "*invalid expression*");
                break;
        case EXPR_CONST:
                print_const(&expression->conste);
                break;
        /* function name expressions are printed like string literals */
        case EXPR_FUNCTION:
        case EXPR_PRETTY_FUNCTION:
        case EXPR_STRING_LITERAL:
                print_string_literal(&expression->string);
                break;
        case EXPR_CALL:
                print_call_expression(&expression->call);
                break;
        case EXPR_BINARY:
                print_binary_expression(&expression->binary);
                break;
        case EXPR_REFERENCE:
                print_reference_expression(&expression->reference);
                break;
        case EXPR_ARRAY_ACCESS:
                print_array_expression(&expression->array_access);
                break;
        case EXPR_UNARY:
                print_unary_expression(&expression->unary);
                break;
        case EXPR_SIZEOF:
                print_sizeof_expression(&expression->sizeofe);
                break;
        case EXPR_BUILTIN_SYMBOL:
                print_builtin_symbol(&expression->builtin_symbol);
                break;
        case EXPR_CONDITIONAL:
                print_conditional(&expression->conditional);
                break;
        case EXPR_VA_ARG:
                print_va_arg(&expression->va_arge);
                break;
        case EXPR_SELECT:
                print_select(&expression->select);
                break;
        case EXPR_CLASSIFY_TYPE:
                print_classify_type_expression(&expression->classify_type);
                break;

        /* no dedicated printer yet: only the numeric kind is shown */
        case EXPR_OFFSETOF:
        case EXPR_STATEMENT:
                /* TODO */
                fprintf(out, "some expression of type %d", (int) expression->type);
                break;
        }
}
315
316 static void print_compound_statement(const compound_statement_t *block)
317 {
318         fputs("{\n", out);
319         indent++;
320
321         statement_t *statement = block->statements;
322         while(statement != NULL) {
323                 print_indent();
324                 print_statement(statement);
325
326                 statement = statement->base.next;
327         }
328         indent--;
329         print_indent();
330         fputs("}\n", out);
331 }
332
333 static void print_return_statement(const return_statement_t *statement)
334 {
335         fprintf(out, "return ");
336         if(statement->return_value != NULL)
337                 print_expression(statement->return_value);
338         fputs(";\n", out);
339 }
340
341 static void print_expression_statement(const expression_statement_t *statement)
342 {
343         print_expression(statement->expression);
344         fputs(";\n", out);
345 }
346
347 static void print_goto_statement(const goto_statement_t *statement)
348 {
349         fprintf(out, "goto ");
350         fputs(statement->label->symbol->string, out);
351         fprintf(stderr, "(%p)", (void*) statement->label);
352         fputs(";\n", out);
353 }
354
355 static void print_label_statement(const label_statement_t *statement)
356 {
357         fprintf(stderr, "(%p)", (void*) statement->label);
358         fprintf(out, "%s:\n", statement->label->symbol->string);
359         if(statement->label_statement != NULL) {
360                 print_statement(statement->label_statement);
361         }
362 }
363
364 static void print_if_statement(const if_statement_t *statement)
365 {
366         fputs("if(", out);
367         print_expression(statement->condition);
368         fputs(") ", out);
369         if(statement->true_statement != NULL) {
370                 print_statement(statement->true_statement);
371         }
372
373         if(statement->false_statement != NULL) {
374                 print_indent();
375                 fputs("else ", out);
376                 print_statement(statement->false_statement);
377         }
378 }
379
380 static void print_switch_statement(const switch_statement_t *statement)
381 {
382         fputs("switch(", out);
383         print_expression(statement->expression);
384         fputs(") ", out);
385         print_statement(statement->body);
386 }
387
388 static void print_case_label(const case_label_statement_t *statement)
389 {
390         if(statement->expression == NULL) {
391                 fputs("default:\n", out);
392         } else {
393                 fputs("case ", out);
394                 print_expression(statement->expression);
395                 fputs(":\n", out);
396         }
397         print_statement(statement->label_statement);
398 }
399
400 static void print_declaration_statement(
401                 const declaration_statement_t *statement)
402 {
403         int first = 1;
404         declaration_t *declaration = statement->declarations_begin;
405         for( ; declaration != statement->declarations_end->next;
406                declaration = declaration->next) {
407                 if(!first) {
408                         print_indent();
409                 } else {
410                         first = 0;
411                 }
412                 print_declaration(declaration);
413                 fputc('\n', out);
414         }
415 }
416
417 static void print_while_statement(const while_statement_t *statement)
418 {
419         fputs("while(", out);
420         print_expression(statement->condition);
421         fputs(") ", out);
422         print_statement(statement->body);
423 }
424
425 static void print_do_while_statement(const do_while_statement_t *statement)
426 {
427         fputs("do ", out);
428         print_statement(statement->body);
429         print_indent();
430         fputs("while(", out);
431         print_expression(statement->condition);
432         fputs(");\n", out);
433 }
434
435 static void print_for_statement(const for_statement_t *statement)
436 {
437         fputs("for(", out);
438         if(statement->context.declarations != NULL) {
439                 assert(statement->initialisation == NULL);
440                 print_declaration(statement->context.declarations);
441                 if(statement->context.declarations->next != NULL) {
442                         panic("multiple declarations in for statement not supported yet");
443                 }
444                 fputc(' ', out);
445         } else {
446                 if(statement->initialisation) {
447                         print_expression(statement->initialisation);
448                 }
449                 fputs("; ", out);
450         }
451         if(statement->condition != NULL) {
452                 print_expression(statement->condition);
453         }
454         fputs("; ", out);
455         if(statement->step != NULL) {
456                 print_expression(statement->step);
457         }
458         fputs(")", out);
459         print_statement(statement->body);
460 }
461
462 static void print_asm_constraints(asm_constraint_t *constraints)
463 {
464         asm_constraint_t *constraint = constraints;
465         for( ; constraint != NULL; constraint = constraint->next) {
466                 if(constraint != constraints)
467                         fputs(", ", out);
468
469                 if(constraint->symbol) {
470                         fprintf(out, "[%s] ", constraint->symbol->string);
471                 }
472                 print_quoted_string(constraint->constraints);
473                 fputs(" (", out);
474                 print_expression(constraint->expression);
475                 fputs(")", out);
476         }
477 }
478
479 static void print_asm_clobbers(asm_clobber_t *clobbers)
480 {
481         asm_clobber_t *clobber = clobbers;
482         for( ; clobber != NULL; clobber = clobber->next) {
483                 if(clobber != clobbers)
484                         fputs(", ", out);
485
486                 print_quoted_string(clobber->clobber);
487         }
488 }
489
490 static void print_asm_statement(const asm_statement_t *statement)
491 {
492         fputs("asm", out);
493         if(statement->is_volatile) {
494                 fputs(" volatile", out);
495         }
496         fputs("(", out);
497         print_quoted_string(statement->asm_text);
498         if(statement->inputs == NULL && statement->outputs == NULL
499                         && statement->clobbers == NULL)
500                 goto end_of_print_asm_statement;
501
502         fputs(" : ", out);
503         print_asm_constraints(statement->inputs);
504         if(statement->outputs == NULL && statement->clobbers == NULL)
505                 goto end_of_print_asm_statement;
506
507         fputs(": ", out);
508         print_asm_constraints(statement->outputs);
509         if(statement->clobbers == NULL)
510                 goto end_of_print_asm_statement;
511
512         fputs(": ", out);
513         print_asm_clobbers(statement->clobbers);
514
515 end_of_print_asm_statement:
516         fputs(");\n", out);
517 }
518
/**
 * Prints a statement to the current output stream by dispatching on the
 * statement kind to the matching print_* helper. continue and break are
 * printed directly.
 *
 * @param statement  the statement to print (must not be NULL)
 */
void print_statement(const statement_t *statement)
{
        switch(statement->type) {
        case STATEMENT_COMPOUND:
                print_compound_statement(&statement->compound);
                break;
        case STATEMENT_RETURN:
                print_return_statement(&statement->returns);
                break;
        case STATEMENT_EXPRESSION:
                print_expression_statement(&statement->expression);
                break;
        case STATEMENT_LABEL:
                print_label_statement(&statement->label);
                break;
        case STATEMENT_GOTO:
                print_goto_statement(&statement->gotos);
                break;
        case STATEMENT_CONTINUE:
                fputs("continue;\n", out);
                break;
        case STATEMENT_BREAK:
                fputs("break;\n", out);
                break;
        case STATEMENT_IF:
                print_if_statement(&statement->ifs);
                break;
        case STATEMENT_SWITCH:
                print_switch_statement(&statement->switchs);
                break;
        case STATEMENT_CASE_LABEL:
                print_case_label(&statement->case_label);
                break;
        case STATEMENT_DECLARATION:
                print_declaration_statement(&statement->declaration);
                break;
        case STATEMENT_WHILE:
                print_while_statement(&statement->whiles);
                break;
        case STATEMENT_DO_WHILE:
                print_do_while_statement(&statement->do_while);
                break;
        case STATEMENT_FOR:
                print_for_statement(&statement->fors);
                break;
        case STATEMENT_ASM:
                print_asm_statement(&statement->asms);
                break;
        case STATEMENT_INVALID:
                /* note: unlike the other cases no newline is emitted here */
                fprintf(out, "*invalid statement*");
                break;
        }
}
572
573 static void print_storage_class(unsigned storage_class)
574 {
575         switch((storage_class_tag_t) storage_class) {
576         case STORAGE_CLASS_ENUM_ENTRY:
577         case STORAGE_CLASS_NONE:
578                 break;
579         case STORAGE_CLASS_TYPEDEF:       fputs("typedef ",        out); break;
580         case STORAGE_CLASS_EXTERN:        fputs("extern ",         out); break;
581         case STORAGE_CLASS_STATIC:        fputs("static ",         out); break;
582         case STORAGE_CLASS_AUTO:          fputs("auto ",           out); break;
583         case STORAGE_CLASS_REGISTER:      fputs("register ",       out); break;
584         case STORAGE_CLASS_THREAD:        fputs("__thread",        out); break;
585         case STORAGE_CLASS_THREAD_EXTERN: fputs("extern __thread", out); break;
586         case STORAGE_CLASS_THREAD_STATIC: fputs("static __thread", out); break;
587         }
588 }
589
590 void print_initializer(const initializer_t *initializer)
591 {
592         if(initializer->type == INITIALIZER_VALUE) {
593                 const initializer_value_t *value = &initializer->value;
594                 print_expression(value->value);
595                 return;
596         }
597
598         assert(initializer->type == INITIALIZER_LIST);
599         fputs("{ ", out);
600         const initializer_list_t *list = &initializer->list;
601
602         for(size_t i = 0 ; i < list->len; ++i) {
603                 if(i > 0) {
604                         fputs(", ", out);
605                 }
606                 print_initializer(list->initializers[i]);
607         }
608         fputs("}", out);
609 }
610
611 static void print_normal_declaration(const declaration_t *declaration)
612 {
613         print_storage_class(declaration->storage_class);
614         if(declaration->is_inline) {
615                 fputs("inline ", out);
616         }
617         print_type_ext(declaration->type, declaration->symbol,
618                        &declaration->context);
619
620         if(declaration->type->type == TYPE_FUNCTION) {
621                 if(declaration->init.statement != NULL) {
622                         fputs("\n", out);
623                         print_statement(declaration->init.statement);
624                         return;
625                 }
626         } else if(declaration->init.initializer != NULL) {
627                 fputs(" = ", out);
628                 print_initializer(declaration->init.initializer);
629         }
630         fputc(';', out);
631 }
632
633 void print_declaration(const declaration_t *declaration)
634 {
635         if(declaration->namespc != NAMESPACE_NORMAL &&
636                         declaration->symbol == NULL)
637                 return;
638
639         switch(declaration->namespc) {
640         case NAMESPACE_NORMAL:
641                 print_normal_declaration(declaration);
642                 break;
643         case NAMESPACE_STRUCT:
644                 fputs("struct ", out);
645                 fputs(declaration->symbol->string, out);
646                 fputc(' ', out);
647                 print_compound_definition(declaration);
648                 fputc(';', out);
649                 break;
650         case NAMESPACE_UNION:
651                 fputs("union ", out);
652                 fputs(declaration->symbol->string, out);
653                 fputc(' ', out);
654                 print_compound_definition(declaration);
655                 fputc(';', out);
656                 break;
657         case NAMESPACE_ENUM:
658                 fputs("enum ", out);
659                 fputs(declaration->symbol->string, out);
660                 fputc(' ', out);
661                 print_enum_definition(declaration);
662                 fputc(';', out);
663                 break;
664         }
665 }
666
667 void print_ast(const translation_unit_t *unit)
668 {
669         inc_type_visited();
670
671         declaration_t *declaration = unit->context.declarations;
672         for( ; declaration != NULL; declaration = declaration->next) {
673                 if(declaration->storage_class == STORAGE_CLASS_ENUM_ENTRY)
674                         continue;
675                 if(declaration->namespc != NAMESPACE_NORMAL &&
676                                 declaration->symbol == NULL)
677                         continue;
678
679                 print_indent();
680                 print_declaration(declaration);
681                 fputc('\n', out);
682         }
683 }
684
/**
 * Initialises the module by setting up the AST obstack.
 */
void init_ast(void)
{
        obstack_init(&ast_obstack);
}
689
/**
 * Shuts the module down by freeing the AST obstack.
 */
void exit_ast(void)
{
        obstack_free(&ast_obstack, NULL);
}
694
/**
 * Sets the stream the AST printing functions write to and forwards the same
 * stream to the type printer via type_set_output().
 */
void ast_set_output(FILE *stream)
{
        out = stream;
        type_set_output(stream);
}
700
/**
 * Out-of-line entry point that forwards to _allocate_ast().
 *
 * NOTE(review): the parentheses around the function name suppress expansion
 * of a function-like macro of the same name; presumably a header defines
 * allocate_ast as such a macro - confirm.
 */
void* (allocate_ast) (size_t size)
{
        return _allocate_ast(size);
}