10 #include "type_hash.h"
12 #include "adt/bitfiddle.h"
13 #include "adt/error.h"
14 #include "adt/array.h"
/* One saved binding on the environment stack. Only part of the struct is
 * visible in this excerpt; environment_push() also writes a `symbol` member. */
18 struct environment_entry_t {
20 environment_entry_t *old_entry; /* symbol->thing before the push; restored on pop */
21 declaration_t *declaration; /* filled in by parse_declarator() after the push */
22 unsigned short old_symbol_ID; /* symbol->ID as it was before the declaration changed it */
/* File-scope parser state. */
26 static struct obstack environment_obstack; /* backing storage for environment_entry_t objects */
27 static environment_entry_t **environment_stack = NULL; /* array created and deleted in parse() */
28 static translation_unit_t *translation_unit = NULL; /* set while parse_translation_unit() runs, NULL otherwise */
29 static block_statement_t *context = NULL; /* only asserted to be NULL in the visible code */
/* Prototypes for parser entry points that are defined further down in this
 * file. */
32 statement_t *parse_compound_statement(void);
34 statement_t *parse_statement(void);
37 expression_t *parse_sub_expression(unsigned precedence);
39 expression_t *parse_expression(void);
/* Obtains `size` bytes from allocate_ast(). The name suggests the block is
 * zero-filled before it is returned, but the clearing and the return statement
 * are on lines not shown here — TODO confirm. */
42 void *allocate_ast_zero(size_t size)
44 void *res = allocate_ast(size);
/* Obtains `size` bytes from the type obstack `type_obst`. The name suggests the
 * block is zero-filled before it is returned, but the clearing and the return
 * statement are on lines not shown here — TODO confirm. */
50 void *allocate_type_zero(size_t size)
52 void *res = obstack_alloc(type_obst, size);
58 * pushes an environment_entry on the environment stack and links the
59 * corresponding symbol to the new entry
/* Creates a zeroed entry on environment_obstack, appends it to
 * environment_stack and makes it the symbol's current `thing`, keeping the
 * previous `thing` in old_entry so it can be restored later. The return
 * statement is on a line not shown; parse_declarator() uses the result as the
 * new entry. */
62 environment_entry_t *environment_push(symbol_t *symbol)
64 environment_entry_t *entry
65 = obstack_alloc(&environment_obstack, sizeof(entry[0]));
66 memset(entry, 0, sizeof(entry[0]));
/* append: grow the stack array by one slot and store the entry in it */
68 int top = ARR_LEN(environment_stack);
69 ARR_RESIZE(environment_stack, top + 1);
70 environment_stack[top] = entry;
/* splice the entry in front of whatever the symbol was bound to before */
72 entry->old_entry = symbol->thing;
73 entry->symbol = symbol;
74 symbol->thing = entry;
80 * pops symbols from the environment stack until @p new_top is the top element
/* Unwinds the environment stack down to `new_top` entries and restores, for
 * every entry visited, the symbol binding that was saved when it was pushed.
 * The declaration, initialisation and stepping of the index `i` are on lines
 * not shown in this excerpt. */
83 void environment_pop_to(size_t new_top)
85 environment_entry_t *entry = NULL;
86 size_t top = ARR_LEN(environment_stack);
/* strictly smaller: new_top == top must not reach this point */
92 assert(new_top < top);
95 entry = environment_stack[i - 1];
97 symbol_t *symbol = entry->symbol;
/* NOTE(review): the next five lines use `entry->type`, `entry->e` and `env`,
 * none of which is declared in the visible code — presumably they are disabled
 * by a preprocessor guard that is not shown; TODO confirm. */
100 if(entry->type == ENTRY_LOCAL_VARIABLE
101 && entry->e.variable->refs == 0) {
102 variable_declaration_statement_t *variable = entry->e.variable;
103 print_warning_prefix(env, variable->statement.source_position);
104 fprintf(stderr, "variable '%s' was declared but never read\n",
/* A typedef changed the symbol's token ID; put the saved ID back (the fprintf
 * is a trace to stderr).
 * NOTE(review): parse_declarator() also overwrites symbol->ID for non-typedef
 * declarations, yet in the visible code the saved ID is only restored for
 * typedefs — a variable that shadows a typedef name may leave the ID changed
 * after its scope ends; confirm against the lines not shown. */
109 if(entry->declaration->storage_class == STORAGE_CLASS_TYPEDEF) {
110 fprintf(stderr, "pop typename '%s'\n", entry->symbol->string);
111 symbol->ID = entry->old_symbol_ID;
/* the entry being removed must be the symbol's current binding */
114 assert(symbol->thing == entry);
115 symbol->thing = entry->old_entry;
118 } while(i != new_top);
/* `entry` is the last entry the loop visited; GNU obstack_free() releases that
 * object together with everything allocated in the obstack after it */
119 obstack_free(&environment_obstack, entry);
121 ARR_SHRINKLEN(environment_stack, (int) new_top);
125 * returns the top element of the environment stack
/* Returns the current number of entries on environment_stack.
 * parse_compound_statement() records this value and later hands it to
 * environment_pop_to(). */
128 size_t environment_top()
130 return ARR_LEN(environment_stack);
/* Reads the next token from the lexer into the file-level `token`. The two
 * lines after the lexer call dump the token to stderr; whether they are
 * conditionally compiled cannot be seen from this excerpt. */
136 void next_token(void)
138 lexer_next_token(&token);
141 print_token(stderr, &token);
142 fprintf(stderr, "\n");
/* Asserts that the current token has type `type`. Presumably it then advances
 * to the next token — that line is not shown; TODO confirm. */
147 void eat(token_type_t type)
149 assert(token.type == type);
/* Writes the diagnostic prefix to stderr: the input name and line number taken
 * from the file-level `source_position`, followed by ": error: ". The separator
 * between name and number is on a line not shown. */
153 void parser_print_error_prefix(void)
155 fputs(source_position.input_name, stderr);
157 fprintf(stderr, "%d", source_position.linenr);
158 fputs(": error: ", stderr);
/* Prints `message` to stderr as a diagnostic. The output is the standard
 * prefix (which already ends in ": error: ") followed by "parse error: " and
 * the message. */
162 void parse_error(const char *message)
164 parser_print_error_prefix();
165 fprintf(stderr, "parse error: %s\n", message);
/* Reports an unexpected token on stderr.
 *
 * message  optional context line; when non-NULL it is printed first with its
 *          own error prefix.
 * ...      the acceptable token types, read as token_type_t and terminated by
 *          a 0 argument.
 *
 * The second line has the form "Parse error: got <token>, expected <types>".
 * The declaration of `args`, the condition guarding the ", " separator and the
 * va_end() call are on lines not shown in this excerpt. */
169 void parse_error_expected(const char *message, ...)
174 if(message != NULL) {
175 parser_print_error_prefix();
176 fprintf(stderr, "%s\n", message);
178 parser_print_error_prefix();
179 fputs("Parse error: got ", stderr);
180 print_token(stderr, &token);
181 fputs(", expected ", stderr);
/* walk the 0-terminated list of expected token types */
183 va_start(args, message);
184 token_type_t token_type = va_arg(args, token_type_t);
185 while(token_type != 0) {
189 fprintf(stderr, ", ");
191 print_token_type(stderr, token_type);
192 token_type = va_arg(args, token_type_t);
195 fprintf(stderr, "\n");
/* Error recovery helper: loops while the current token is not ';' and checks
 * for T_EOF inside the loop. The statements that advance the token and react
 * to end of input are on lines not shown. */
199 void eat_until_semi(void)
201 while(token.type != ';') {
203 if(token.type == T_EOF)
/* expect(tok) / expect_void(tok): if the current token is not `tok`, report it
 * through parse_error_expected() with `tok` as the only acceptable type. The
 * remainder of both macros (recovery and the action on success) is on lines
 * not shown; the two names suggest variants for value-returning and void
 * functions — TODO confirm. */
209 #define expect(expected) \
210 if(UNLIKELY(token.type != (expected))) { \
211 parse_error_expected(NULL, (expected), 0); \
217 #define expect_void(expected) \
218 if(UNLIKELY(token.type != (expected))) { \
219 parse_error_expected(NULL, (expected), 0); \
/* Parses a constant expression. For now this simply forwards to
 * parse_expression(), as the TODO below says. */
225 static expression_t *parse_constant_expression(void)
227 /* TODO: not correct yet */
228 return parse_expression();
/* declared early because the struct/union specifier parsers below call it */
231 static compound_entry_t *parse_compound_type_entries(void);
/* Result of parse_declaration_specifiers(). Only the storage class member is
 * visible here; the parser also stores the resolved type in a `type` member. */
233 typedef struct declaration_specifiers_t declaration_specifiers_t;
234 struct declaration_specifiers_t {
235 storage_class_t storage_class;
/* Parses a struct specifier into a freshly allocated compound_type_t tagged
 * TYPE_COMPOUND_STRUCT and returns it as a type_t*. Accepted forms in the
 * visible code: an identifier optionally followed by a '{' member list, or a
 * '{' member list on its own; anything else goes to parse_error_expected().
 * NOTE(review): the visible calls discard the value returned by
 * parse_compound_type_entries(). */
239 static type_t *parse_struct_specifier(void)
243 compound_type_t *struct_type = allocate_type_zero(sizeof(struct_type[0]));
244 struct_type->type.type = TYPE_COMPOUND_STRUCT;
245 struct_type->source_position = source_position;
247 if(token.type == T_IDENTIFIER) {
250 if(token.type == '{') {
251 parse_compound_type_entries();
253 } else if(token.type == '{') {
254 parse_compound_type_entries();
256 parse_error_expected("problem while parsing struct type specifiers",
261 return (type_t*) struct_type;
/* Parses a union specifier into a freshly allocated compound_type_t tagged
 * TYPE_COMPOUND_UNION and returns it as a type_t*. Accepted forms in the
 * visible code: an identifier optionally followed by a '{' member list, or a
 * '{' member list on its own; anything else goes to parse_error_expected().
 * NOTE(review): the visible calls discard the value returned by
 * parse_compound_type_entries(). */
264 static type_t *parse_union_specifier(void)
268 compound_type_t *union_type = allocate_type_zero(sizeof(union_type[0]));
269 union_type->type.type = TYPE_COMPOUND_UNION;
270 union_type->source_position = source_position;
272 if(token.type == T_IDENTIFIER) {
275 if(token.type == '{') {
276 parse_compound_type_entries();
278 } else if(token.type == '{') {
279 parse_compound_type_entries();
281 parse_error_expected("problem while parsing union type specifiers",
285 return (type_t*) union_type;
/* One bit per type-specifier keyword. parse_declaration_specifiers() ORs these
 * into `type_specifiers` and then matches the combined value in a switch. */
289 SPECIFIER_SIGNED = 1 << 0,
290 SPECIFIER_UNSIGNED = 1 << 1,
291 SPECIFIER_LONG = 1 << 2,
292 SPECIFIER_INT = 1 << 3,
293 SPECIFIER_DOUBLE = 1 << 4,
294 SPECIFIER_CHAR = 1 << 5,
295 SPECIFIER_SHORT = 1 << 6,
296 SPECIFIER_LONG_LONG = 1 << 7, /* set when `long` is seen a second time */
297 SPECIFIER_FLOAT = 1 << 8,
298 SPECIFIER_BOOL = 1 << 9,
299 SPECIFIER_VOID = 1 << 10,
300 #ifdef PROVIDE_COMPLEX
301 SPECIFIER_COMPLEX = 1 << 11,
303 #ifdef PROVIDE_IMAGINARY
304 SPECIFIER_IMAGINARY = 1 << 12,
/* Macros that expand to lists of `case` labels (the visible tail of
 * TYPE_QUALIFIERS is `case T___extension__:` / `case T___attribute__:`),
 * presumably for switch statements that need to recognise every token that
 * can start a declaration — their use is not visible here. The second
 * definition of COMPLEX_SPECIFIERS and of IMAGINARY_SPECIFIERS is empty;
 * presumably it is the fallback when the corresponding PROVIDE_* macro is not
 * defined (the #else lines are not shown). */
308 #define STORAGE_CLASSES \
315 #define TYPE_QUALIFIERS \
320 case T___extension__: \
321 case T___attribute__:
323 #ifdef PROVIDE_COMPLEX
324 #define COMPLEX_SPECIFIERS \
327 #define COMPLEX_SPECIFIERS
330 #ifdef PROVIDE_IMAGINARY
331 #define IMAGINARY_SPECIFIERS \
334 #define IMAGINARY_SPECIFIERS
337 #define TYPE_SPECIFIERS \
/* Parses the declaration-specifier part of a declaration (storage class, type
 * qualifiers, type specifiers, struct/union specifiers, typedef names) and
 * stores the storage class and the resulting type in `*specifiers`.
 *
 * Basic types are collected as SPECIFIER_* bits in `type_specifiers` and then
 * mapped to an atomic type; qualifiers are collected in `type_qualifiers`.
 * The surrounding loop, the switch over token.type and most case labels are on
 * lines not shown in this excerpt. */
358 void parse_declaration_specifiers(declaration_specifiers_t *specifiers)
361 unsigned type_qualifiers = 0;
362 unsigned type_specifiers = 0;
/* storage classes: a second storage class in one declaration is an error */
368 #define MATCH_STORAGE_CLASS(token, class) \
370 if(specifiers->storage_class != STORAGE_CLASS_NONE) { \
371 parse_error("multiple storage classes in declaration " \
374 specifiers->storage_class = class; \
378 MATCH_STORAGE_CLASS(T_typedef, STORAGE_CLASS_TYPEDEF)
379 MATCH_STORAGE_CLASS(T_extern, STORAGE_CLASS_EXTERN)
380 MATCH_STORAGE_CLASS(T_static, STORAGE_CLASS_STATIC)
381 MATCH_STORAGE_CLASS(T_auto, STORAGE_CLASS_AUTO)
382 MATCH_STORAGE_CLASS(T_register, STORAGE_CLASS_REGISTER)
384 /* type qualifiers */
385 #define MATCH_TYPE_QUALIFIER(token, qualifier) \
387 type_qualifiers |= qualifier; \
391 MATCH_TYPE_QUALIFIER(T_const, TYPE_QUALIFIER_CONST);
392 MATCH_TYPE_QUALIFIER(T_restrict, TYPE_QUALIFIER_RESTRICT);
393 MATCH_TYPE_QUALIFIER(T_volatile, TYPE_QUALIFIER_VOLATILE);
394 MATCH_TYPE_QUALIFIER(T_inline, TYPE_QUALIFIER_INLINE);
396 case T___extension__:
401 case T___attribute__:
402 fprintf(stderr, "TODO: __attribute__ not handled yet\n");
406 /* type specifiers */
407 #define MATCH_SPECIFIER(token, specifier, name) \
410 if(type_specifiers & specifier) { \
411 parse_error("multiple " name " type specifiers given"); \
413 type_specifiers |= specifier; \
417 MATCH_SPECIFIER(T_void, SPECIFIER_VOID, "void")
418 MATCH_SPECIFIER(T_char, SPECIFIER_CHAR, "char")
419 MATCH_SPECIFIER(T_short, SPECIFIER_SHORT, "short")
420 MATCH_SPECIFIER(T_int, SPECIFIER_INT, "int")
421 MATCH_SPECIFIER(T_float, SPECIFIER_FLOAT, "float")
422 MATCH_SPECIFIER(T_double, SPECIFIER_DOUBLE, "double")
423 MATCH_SPECIFIER(T_signed, SPECIFIER_SIGNED, "signed")
424 MATCH_SPECIFIER(T_unsigned, SPECIFIER_UNSIGNED, "unsigned")
425 MATCH_SPECIFIER(T__Bool, SPECIFIER_BOOL, "_Bool")
426 #ifdef PROVIDE_COMPLEX
427 MATCH_SPECIFIER(T__Complex, SPECIFIER_COMPLEX, "_Complex")
429 #ifdef PROVIDE_IMAGINARY
430 MATCH_SPECIFIER(T__Imaginary, SPECIFIER_IMAGINARY, "_Imaginary")
/* `long` (presumably; the case label is not shown) may occur twice: the first
 * occurrence sets LONG, the second adds LONG_LONG, a third is an error */
434 if(type_specifiers & SPECIFIER_LONG_LONG) {
435 parse_error("multiple type specifiers given");
436 } else if(type_specifiers & SPECIFIER_LONG) {
437 type_specifiers |= SPECIFIER_LONG_LONG;
439 type_specifiers |= SPECIFIER_LONG;
445 if(type_specifiers & SPECIFIER_LONG_LONG ||
446 type_specifiers & SPECIFIER_LONG) {
447 parse_error("multiple type specifiers given");
449 type_specifiers |= specifier;
456 type = parse_struct_specifier();
459 type = parse_union_specifier();
/* once a type or a basic specifier has been seen, the following lines stop
 * collecting specifiers instead of performing the lookup below */
467 if(type != NULL || type_specifiers != 0) {
468 goto finish_specifiers;
/* the type is the one recorded in the declaration the symbol is bound to */
471 type = token.v.symbol->thing->declaration->type;
472 assert(type != NULL);
476 /* function specifier */
478 goto finish_specifiers;
485 atomic_type_type_t atomic_type;
487 /* match valid basic types */
/* every accepted combination of specifier bits is spelled out as its own
 * case label; anything else ends up in the error handling further down */
488 switch(type_specifiers) {
490 atomic_type = ATOMIC_TYPE_VOID;
493 atomic_type = ATOMIC_TYPE_CHAR;
495 case SPECIFIER_SIGNED | SPECIFIER_CHAR:
496 atomic_type = ATOMIC_TYPE_SCHAR;
498 case SPECIFIER_UNSIGNED | SPECIFIER_CHAR:
499 atomic_type = ATOMIC_TYPE_UCHAR;
501 case SPECIFIER_SHORT:
502 case SPECIFIER_SIGNED | SPECIFIER_SHORT:
503 case SPECIFIER_SHORT | SPECIFIER_INT:
504 case SPECIFIER_SIGNED | SPECIFIER_SHORT | SPECIFIER_INT:
505 atomic_type = ATOMIC_TYPE_SHORT;
507 case SPECIFIER_UNSIGNED | SPECIFIER_SHORT:
508 case SPECIFIER_UNSIGNED | SPECIFIER_SHORT | SPECIFIER_INT:
509 atomic_type = ATOMIC_TYPE_USHORT;
512 case SPECIFIER_SIGNED:
513 case SPECIFIER_SIGNED | SPECIFIER_INT:
514 atomic_type = ATOMIC_TYPE_INT;
516 case SPECIFIER_UNSIGNED:
517 case SPECIFIER_UNSIGNED | SPECIFIER_INT:
518 atomic_type = ATOMIC_TYPE_UINT;
521 case SPECIFIER_SIGNED | SPECIFIER_LONG:
522 case SPECIFIER_LONG | SPECIFIER_INT:
523 case SPECIFIER_SIGNED | SPECIFIER_LONG | SPECIFIER_INT:
524 atomic_type = ATOMIC_TYPE_LONG;
526 case SPECIFIER_UNSIGNED | SPECIFIER_LONG:
527 case SPECIFIER_UNSIGNED | SPECIFIER_LONG | SPECIFIER_INT:
528 atomic_type = ATOMIC_TYPE_ULONG;
530 case SPECIFIER_LONG_LONG:
531 case SPECIFIER_SIGNED | SPECIFIER_LONG_LONG:
532 case SPECIFIER_LONG_LONG | SPECIFIER_INT:
533 case SPECIFIER_SIGNED | SPECIFIER_LONG_LONG | SPECIFIER_INT:
534 atomic_type = ATOMIC_TYPE_LONGLONG;
536 case SPECIFIER_UNSIGNED | SPECIFIER_LONG_LONG:
537 case SPECIFIER_UNSIGNED | SPECIFIER_LONG_LONG | SPECIFIER_INT:
538 atomic_type = ATOMIC_TYPE_ULONGLONG;
540 case SPECIFIER_FLOAT:
541 atomic_type = ATOMIC_TYPE_FLOAT;
543 case SPECIFIER_DOUBLE:
544 atomic_type = ATOMIC_TYPE_DOUBLE;
546 case SPECIFIER_LONG | SPECIFIER_DOUBLE:
547 atomic_type = ATOMIC_TYPE_LONG_DOUBLE;
550 atomic_type = ATOMIC_TYPE_BOOL;
552 #ifdef PROVIDE_COMPLEX
553 case SPECIFIER_FLOAT | SPECIFIER_COMPLEX:
554 atomic_type = ATOMIC_TYPE_FLOAT_COMPLEX;
556 case SPECIFIER_DOUBLE | SPECIFIER_COMPLEX:
557 atomic_type = ATOMIC_TYPE_DOUBLE_COMPLEX;
559 case SPECIFIER_LONG | SPECIFIER_DOUBLE | SPECIFIER_COMPLEX:
560 atomic_type = ATOMIC_TYPE_LONG_DOUBLE_COMPLEX;
563 #ifdef PROVIDE_IMAGINARY
564 case SPECIFIER_FLOAT | SPECIFIER_IMAGINARY:
565 atomic_type = ATOMIC_TYPE_FLOAT_IMAGINARY;
567 case SPECIFIER_DOUBLE | SPECIFIER_IMAGINARY:
568 atomic_type = ATOMIC_TYPE_DOUBLE_IMAGINARY;
570 case SPECIFIER_LONG | SPECIFIER_DOUBLE | SPECIFIER_IMAGINARY:
571 atomic_type = ATOMIC_TYPE_LONG_DOUBLE_IMAGINARY;
575 /* invalid specifier combination, give an error message */
576 if(type_specifiers == 0) {
577 parse_error("no type specifiers given in declaration");
578 } else if((type_specifiers & SPECIFIER_SIGNED) &&
579 (type_specifiers & SPECIFIER_UNSIGNED)) {
/* NOTE(review): "gives" in the message below looks like a typo for "given" */
580 parse_error("signed and unsigned specifiers gives");
581 } else if(type_specifiers & (SPECIFIER_SIGNED | SPECIFIER_UNSIGNED)) {
582 parse_error("only integer types can be signed or unsigned");
584 parse_error("multiple datatypes in declaration");
586 atomic_type = ATOMIC_TYPE_INVALID;
/* wrap the chosen atomic kind in a freshly allocated type object */
589 atomic_type_t *atype = allocate_type_zero(sizeof(atype[0]));
590 atype->type.type = TYPE_ATOMIC;
591 atype->atype = atomic_type;
593 type = (type_t*) atype;
/* presumably the branch taken when a struct/union/typedef type was already
 * chosen: extra basic specifiers are then an error */
595 if(type_specifiers != 0) {
596 parse_error("multiple datatypes in declaration");
/* NOTE(review): `type` may be the object taken from an existing declaration
 * in the typedef lookup above; writing qualifiers into it would then modify
 * that shared type as well — confirm against the lines not shown. */
600 type->qualifiers = type_qualifiers;
/* presumably typehash_insert() returns the canonical instance of the type;
 * when that is a different object the local one is released again */
602 type_t *result = typehash_insert(type);
603 if(result != (type_t*) type) {
604 obstack_free(type_obst, type);
607 specifiers->type = result;
/* trace of the resulting type on stderr */
609 fprintf(stderr, "Specifiers type: ");
610 print_type(stderr, result);
611 fprintf(stderr, "\n");
/* Collects type qualifier keywords into a bit set of TYPE_QUALIFIER_* values
 * and returns it. Reuses the MATCH_TYPE_QUALIFIER macro defined inside
 * parse_declaration_specifiers(); the enclosing loop and switch are on lines
 * not shown. */
615 unsigned parse_type_qualifiers()
617 unsigned type_qualifiers = 0;
621 /* type qualifiers */
622 MATCH_TYPE_QUALIFIER(T_const, TYPE_QUALIFIER_CONST);
623 MATCH_TYPE_QUALIFIER(T_restrict, TYPE_QUALIFIER_RESTRICT);
624 MATCH_TYPE_QUALIFIER(T_volatile, TYPE_QUALIFIER_VOLATILE);
625 MATCH_TYPE_QUALIFIER(T_inline, TYPE_QUALIFIER_INLINE);
628 return type_qualifiers;
/* Parses one declarator and fills in `declaration` (storage class, type,
 * symbol), then binds the symbol to the declaration on the environment stack.
 * The third parameter is on a line not shown; the recursive call below passes
 * `type` in that position. The branches selecting between an identifier, a
 * nested declarator and the error case are also not shown. */
634 void parse_declarator(declaration_t *declaration, storage_class_t storage_class,
637 while(token.type == '*') {
/* each '*' wraps the current type in a pointer type carrying its own
 * qualifiers */
641 pointer_type_t *pointer_type
642 = allocate_type_zero(sizeof(pointer_type[0]));
643 pointer_type->type.type = TYPE_POINTER;
644 pointer_type->points_to = type;
646 pointer_type->type.qualifiers = parse_type_qualifiers();
/* presumably typehash_insert() returns the canonical instance; a different
 * result means the fresh object is released again */
648 type_t *result = typehash_insert((type_t*) pointer_type);
649 if(result != (type_t*) pointer_type) {
650 obstack_free(type_obst, pointer_type);
655 declaration->storage_class = storage_class;
656 declaration->type = type;
661 declaration->symbol = token.v.symbol;
666 parse_declarator(declaration, storage_class, type);
670 parse_error("problem while parsing declarator");
/* declarator suffixes; only the TODO comments of both branches are visible */
673 if(token.type == '(') {
676 /* parse parameter-type-list or identifier-list */
679 } else if(token.type == '[') {
682 /* multiple type qualifiers, and static */
684 /* assignment_expression or '*' or nothing */
/* trace of the declarator's type on stderr */
689 fprintf(stderr, "Declarator type: ");
690 print_type(stderr, type);
691 fprintf(stderr, "\n");
693 symbol_t *symbol = declaration->symbol;
/* bind the symbol and remember its previous token ID for the pop */
695 environment_entry_t *entry = environment_push(symbol);
696 entry->declaration = declaration;
697 entry->old_symbol_ID = symbol->ID;
/* typedef names get the token ID T_TYPENAME, everything else T_IDENTIFIER */
699 if(storage_class == STORAGE_CLASS_TYPEDEF) {
700 symbol->ID = T_TYPENAME;
702 symbol->ID = T_IDENTIFIER;
/* Parses the declarators that follow the declaration specifiers. Each one gets
 * its own zeroed declaration_t from the AST allocator. A '=' introduces an
 * initializer (not implemented, see TODO); a '{' is parsed as a compound
 * statement, i.e. a function body. The check for ',' decides whether another
 * declarator follows; the loop itself is on lines not shown. */
707 void parse_init_declarators(const declaration_specifiers_t *specifiers)
710 declaration_t *declaration = allocate_ast_zero(sizeof(declaration[0]));
712 parse_declarator(declaration, specifiers->storage_class,
714 if(token.type == '=') {
716 // parse_initializer TODO
717 } else if(token.type == '{') {
718 parse_compound_statement();
722 if(token.type != ',')
/* Parses the declarators of one struct/union member declaration, including
 * bit-field widths introduced by ':' (with or without a declarator in front).
 * The check for ',' decides whether another declarator follows; the loop
 * itself is on lines not shown.
 *
 * NOTE(review): `declaration` is an uninitialised automatic object whose
 * address is handed to parse_declarator(); that function stores the pointer in
 * the environment entry it pushes (entry->declaration = declaration), so the
 * entry can outlive this stack frame — confirm and consider allocating it
 * like parse_init_declarators() does. `entry` is allocated but not used by any
 * visible line. */
730 void parse_struct_declarators(const declaration_specifiers_t *specifiers)
733 declaration_t declaration;
734 compound_entry_t *entry = allocate_ast_zero(sizeof(entry[0]));
/* anonymous bit-field: ':' width without a declarator */
736 if(token.type == ':') {
738 parse_constant_expression();
741 parse_declarator(&declaration, specifiers->storage_class,
/* named bit-field: declarator followed by ':' width */
744 if(token.type == ':') {
746 parse_constant_expression();
751 if(token.type != ',')
/* Parses the member declarations of a struct/union body until '}' or end of
 * input. Each iteration parses declaration specifiers into a zeroed local and
 * then the member declarators. `entries` starts as NULL and no visible line
 * assigns to it; the return statement is not shown. */
758 static compound_entry_t *parse_compound_type_entries(void)
762 compound_entry_t *entries = NULL;
764 while(token.type != '}' && token.type != T_EOF) {
765 declaration_specifiers_t specifiers;
766 memset(&specifiers, 0, sizeof(specifiers));
767 /* TODO not correct as this allows storage class stuff... but only
768 * specifiers and qualifiers should be allowed here */
769 parse_declaration_specifiers(&specifiers);
771 parse_struct_declarators(&specifiers);
/* Parses one declaration: declaration specifiers into a zeroed local, then
 * either a bare ';' (specifiers without declarators) or the init-declarator
 * list. What happens in the ';' branch is on lines not shown. */
778 void parse_declaration(void)
780 declaration_specifiers_t specifiers;
781 memset(&specifiers, 0, sizeof(specifiers));
782 parse_declaration_specifiers(&specifiers);
784 if(token.type == ';') {
788 parse_init_declarators(&specifiers);
/* Signature of a prefix/primary expression parser. */
793 typedef expression_t* (*parse_expression_function) (unsigned precedence);
/* Signature of an infix/postfix parser; the second parameter (on a line not
 * shown) is the already parsed left operand, judging by the call in
 * parse_sub_expression(). */
794 typedef expression_t* (*parse_expression_infix_function) (unsigned precedence,
/* Per-token parser table entry. A `precedence` member for the prefix parser is
 * used elsewhere in this file but declared on a line not shown. */
797 typedef struct expression_parser_function_t expression_parser_function_t;
798 struct expression_parser_function_t {
800 parse_expression_function parser; /* prefix parser, or NULL */
801 unsigned infix_precedence; /* binding strength of the infix parser */
802 parse_expression_infix_function infix_parser; /* infix parser, or NULL */
/* table indexed by token type */
805 expression_parser_function_t expression_parsers[T_LAST_TOKEN];
/* Reports "expected expression, got token <token>" on stderr and builds an
 * expression node of type EXPR_INVALID as a placeholder. The statements after
 * the node is set up (including the return) are on lines not shown. */
808 expression_t *expected_expression_error(void)
810 parser_print_error_prefix();
811 fprintf(stderr, "expected expression, got token ");
812 print_token(stderr, & token);
813 fprintf(stderr, "\n");
815 expression_t *expression = allocate_ast_zero(sizeof(expression[0]));
816 expression->type = EXPR_INVALID;
/* Builds an EXPR_STRING_LITERAL node whose value is the current token's string
 * payload. Presumably the token is consumed before returning — not shown. */
823 expression_t *parse_string_const(void)
825 string_literal_t *cnst = allocate_ast_zero(sizeof(cnst[0]));
827 cnst->expression.type = EXPR_STRING_LITERAL;
828 cnst->value = token.v.string;
832 return (expression_t*) cnst;
/* Builds an EXPR_CONST node whose value is the current token's integer
 * payload. Presumably the token is consumed before returning — not shown. */
836 expression_t *parse_int_const(void)
838 const_t *cnst = allocate_ast_zero(sizeof(cnst[0]));
840 cnst->expression.type = EXPR_CONST;
841 cnst->value = token.v.intvalue;
845 return (expression_t*) cnst;
/* Builds an EXPR_REFERENCE node that refers to the current token's symbol.
 * Presumably the token is consumed before returning — not shown. */
849 expression_t *parse_reference(void)
851 reference_expression_t *ref = allocate_ast_zero(sizeof(ref[0]));
853 ref->expression.type = EXPR_REFERENCE;
854 ref->symbol = token.v.symbol;
858 return (expression_t*) ref;
/* Parses a bracketed sub-expression by delegating to parse_expression(). The
 * handling of the opening and closing delimiters and the return are on lines
 * not shown. */
862 expression_t *parse_brace_expression(void)
866 expression_t *result = parse_expression();
/* Dispatches on the current token to the matching primary-expression parser
 * (integer constant, string literal, reference, bracketed expression). Most
 * case labels and the fallback path are on lines not shown. */
873 expression_t *parse_primary_expression(void)
877 return parse_int_const();
878 case T_STRING_LITERAL:
879 return parse_string_const();
881 return parse_reference();
883 return parse_brace_expression();
886 /* TODO: error message */
/* Infix parser registered for '[': builds an EXPR_ARRAY_ACCESS node from the
 * already parsed `array_ref` and an index parsed with parse_expression(). A
 * missing ']' is reported through parse_error_expected(). */
891 expression_t *parse_array_expression(unsigned precedence,
892 expression_t *array_ref)
898 array_access_expression_t *array_access
899 = allocate_ast_zero(sizeof(array_access[0]));
901 array_access->expression.type = EXPR_ARRAY_ACCESS;
902 array_access->array_ref = array_ref;
903 array_access->index = parse_expression();
905 if(token.type != ']') {
906 parse_error_expected("Problem while parsing array access", ']', 0);
911 return (expression_t*) array_access;
/* Prefix parser registered for T_sizeof in init_expression_parsers(); its body
 * is not part of this excerpt. */
915 expression_t *parse_sizeof(unsigned precedence)
/* Infix parser registered for '.' and T_SELECT: builds an EXPR_SELECT node
 * from the already parsed `compound` and the member symbol that follows the
 * operator. A token other than an identifier is reported through
 * parse_error_expected(). */
925 expression_t *parse_select_expression(unsigned precedence,
926 expression_t *compound)
930 assert(token.type == '.' || token.type == T_SELECT);
933 select_expression_t *select = allocate_ast_zero(sizeof(select[0]));
935 select->expression.type = EXPR_SELECT;
936 select->compound = compound;
938 if(token.type != T_IDENTIFIER) {
939 parse_error_expected("Problem while parsing compound select",
943 select->symbol = token.v.symbol;
946 return (expression_t*) select;
/* Infix parser registered for '(': builds an EXPR_CALL node whose callee is
 * the already parsed `expression` and whose arguments form a singly linked
 * list in source order. The loop around the argument parsing and the handling
 * of the parentheses are on lines not shown. */
950 expression_t *parse_call_expression(unsigned precedence,
951 expression_t *expression)
954 call_expression_t *call = allocate_ast_zero(sizeof(call[0]));
956 call->expression.type = EXPR_CALL;
957 call->method = expression;
959 /* parse arguments */
962 if(token.type != ')') {
963 call_argument_t *last_argument = NULL;
966 call_argument_t *argument = allocate_ast_zero(sizeof(argument[0]));
968 argument->expression = parse_expression();
/* append to the list: the first argument becomes the head, later ones are
 * linked behind the previous argument */
969 if(last_argument == NULL) {
970 call->arguments = argument;
972 last_argument->next = argument;
974 last_argument = argument;
/* no ',' means the argument list is finished */
976 if(token.type != ',')
983 return (expression_t*) call;
/* Generates a prefix parser named parse_<unexpression_type>. The generated
 * function builds an EXPR_UNARY node of the given unary type whose operand is
 * parsed with parse_sub_expression(precedence). How `token_type` is used is on
 * macro lines not shown — presumably it is the token the parser consumes.
 * The instantiations after the macro create one parser per prefix operator. */
986 #define CREATE_UNARY_EXPRESSION_PARSER(token_type, unexpression_type) \
988 expression_t *parse_##unexpression_type(unsigned precedence) \
992 unary_expression_t *unary_expression \
993 = allocate_ast_zero(sizeof(unary_expression[0])); \
994 unary_expression->expression.type = EXPR_UNARY; \
995 unary_expression->type = unexpression_type; \
996 unary_expression->value = parse_sub_expression(precedence); \
998 return (expression_t*) unary_expression; \
1001 CREATE_UNARY_EXPRESSION_PARSER('-', UNEXPR_NEGATE)
1002 CREATE_UNARY_EXPRESSION_PARSER('+', UNEXPR_PLUS)
1003 CREATE_UNARY_EXPRESSION_PARSER('!', UNEXPR_NOT)
1004 CREATE_UNARY_EXPRESSION_PARSER('*', UNEXPR_DEREFERENCE)
1005 CREATE_UNARY_EXPRESSION_PARSER('&', UNEXPR_TAKE_ADDRESS)
1006 CREATE_UNARY_EXPRESSION_PARSER('~', UNEXPR_BITWISE_NEGATE)
1007 CREATE_UNARY_EXPRESSION_PARSER(T_PLUSPLUS, UNEXPR_PREFIX_INCREMENT)
1008 CREATE_UNARY_EXPRESSION_PARSER(T_MINUSMINUS, UNEXPR_PREFIX_DECREMENT)
/* Generates a postfix parser named parse_<unexpression_type> with the infix
 * signature. The generated function ignores `precedence` and builds an
 * EXPR_UNARY node of the given unary type whose operand is the already parsed
 * `left`. How `token_type` is used is on macro lines not shown — presumably it
 * is the token the parser consumes. The instantiations after the macro create
 * the postfix increment and decrement parsers. */
1010 #define CREATE_UNARY_POSTFIX_EXPRESSION_PARSER(token_type, unexpression_type) \
1012 expression_t *parse_##unexpression_type(unsigned precedence, \
1013 expression_t *left) \
1015 (void) precedence; \
1018 unary_expression_t *unary_expression \
1019 = allocate_ast_zero(sizeof(unary_expression[0])); \
1020 unary_expression->expression.type = EXPR_UNARY; \
1021 unary_expression->type = unexpression_type; \
1022 unary_expression->value = left; \
1024 return (expression_t*) unary_expression; \
1027 CREATE_UNARY_POSTFIX_EXPRESSION_PARSER(T_PLUSPLUS, UNEXPR_POSTFIX_INCREMENT)
1028 CREATE_UNARY_POSTFIX_EXPRESSION_PARSER(T_MINUSMINUS, UNEXPR_POSTFIX_DECREMENT)
/* Generates an infix parser named parse_<binexpression_type>. The generated
 * function parses the right operand with parse_sub_expression(precedence) and
 * builds an EXPR_BINARY node of the given binary type from `left` and that
 * right operand. How `token_type` is used is on macro lines not shown —
 * presumably it is the operator token the parser consumes. */
1030 #define CREATE_BINEXPR_PARSER(token_type, binexpression_type) \
1032 expression_t *parse_##binexpression_type(unsigned precedence, \
1033 expression_t *left) \
1037 expression_t *right = parse_sub_expression(precedence); \
1039 binary_expression_t *binexpr \
1040 = allocate_ast_zero(sizeof(binexpr[0])); \
1041 binexpr->expression.type = EXPR_BINARY; \
1042 binexpr->type = binexpression_type; \
1043 binexpr->left = left; \
1044 binexpr->right = right; \
1046 return (expression_t*) binexpr; \
1049 CREATE_BINEXPR_PARSER('*', BINEXPR_MUL)
/* One generated infix parser per binary operator: the first macro argument is
 * the operator's token, the second the node type stored in the resulting
 * binary expression (and the suffix of the generated function name). */
1050 CREATE_BINEXPR_PARSER('/', BINEXPR_DIV)
1051 CREATE_BINEXPR_PARSER('+', BINEXPR_ADD)
1052 CREATE_BINEXPR_PARSER('-', BINEXPR_SUB)
1053 CREATE_BINEXPR_PARSER('<', BINEXPR_LESS)
1054 CREATE_BINEXPR_PARSER('>', BINEXPR_GREATER)
1055 CREATE_BINEXPR_PARSER('=', BINEXPR_ASSIGN)
1056 CREATE_BINEXPR_PARSER(T_EQUALEQUAL, BINEXPR_EQUAL)
/* The not-equal parser must be generated for the `!=` token: it is registered
 * for T_EXCLAMATIONMARKEQUAL in init_expression_parsers(), and eat() asserts
 * that the token it is given is the current one. It was generated for
 * T_SLASHEQUAL (`/=`) before, which did not match its registration. */
1057 CREATE_BINEXPR_PARSER(T_EXCLAMATIONMARKEQUAL, BINEXPR_NOTEQUAL)
1058 CREATE_BINEXPR_PARSER(T_LESSEQUAL, BINEXPR_LESSEQUAL)
1059 CREATE_BINEXPR_PARSER(T_GREATEREQUAL, BINEXPR_GREATEREQUAL)
1060 CREATE_BINEXPR_PARSER('&', BINEXPR_BITWISE_AND)
1061 CREATE_BINEXPR_PARSER('|', BINEXPR_BITWISE_OR)
1062 CREATE_BINEXPR_PARSER('^', BINEXPR_BITWISE_XOR)
1063 CREATE_BINEXPR_PARSER(T_LESSLESS, BINEXPR_SHIFTLEFT)
1064 CREATE_BINEXPR_PARSER(T_GREATERGREATER, BINEXPR_SHIFTRIGHT)
/* Core expression parser. It first parses a prefix/primary expression (through
 * the prefix parser registered for the current token, or
 * parse_primary_expression() when none is registered) and then keeps applying
 * infix parsers to the result. The visible checks leave the infix phase when
 * the current token has no infix parser or its infix precedence is lower than
 * `precedence`. The loop header, the `else`, the declaration of `left` and the
 * final return are on lines not shown.
 *
 * Only negative token types are rejected in the visible code before indexing
 * expression_parsers[]; an upper bound check is not visible. */
1067 expression_t *parse_sub_expression(unsigned precedence)
1069 if(token.type < 0) {
1070 return expected_expression_error();
1073 expression_parser_function_t *parser
1074 = &expression_parsers[token.type];
/* NOTE(review): this local is initialised from itself. In C a declared name is
 * already in scope inside its own initialiser, so the file-level
 * `source_position` (the one parser_print_error_prefix() reads) is NOT what is
 * copied here and the value is indeterminate. Giving the local a different
 * name would fix it. */
1075 source_position_t source_position = source_position;
1078 if(parser->parser != NULL) {
1079 left = parser->parser(parser->precedence);
1081 left = parse_primary_expression();
1084 left->source_position = source_position;
1087 if(token.type < 0) {
1088 return expected_expression_error();
1091 parser = &expression_parsers[token.type];
1092 if(parser->infix_parser == NULL)
1094 if(parser->infix_precedence < precedence)
/* the infix parser receives the expression parsed so far as its left operand
 * and its result becomes the new left operand */
1097 left = parser->infix_parser(parser->infix_precedence, left);
1099 left->source_position = source_position;
/* Parses a full expression: parse_sub_expression() with the minimum
 * precedence 1. */
1106 expression_t *parse_expression(void)
1108 return parse_sub_expression(1);
/* Registers `parser` as the prefix parser for `token_type` with the given
 * precedence. Registering a second prefix parser for the same token prints the
 * token type and calls panic(). `token_type` indexes expression_parsers[]
 * directly; no range check is visible. */
1113 void register_expression_parser(parse_expression_function parser,
1114 int token_type, unsigned precedence)
1116 expression_parser_function_t *entry = &expression_parsers[token_type];
1118 if(entry->parser != NULL) {
1119 fprintf(stderr, "for token ");
1120 print_token_type(stderr, token_type);
1121 fprintf(stderr, "\n");
1122 panic("trying to register multiple expression parsers for a token");
1124 entry->parser = parser;
1125 entry->precedence = precedence;
/* Registers `parser` as the infix parser for `token_type` with the given
 * precedence. Registering a second infix parser for the same token prints the
 * token type and calls panic(). `token_type` indexes expression_parsers[]
 * directly; no range check is visible. */
1128 void register_expression_infix_parser(parse_expression_infix_function parser,
1129 int token_type, unsigned precedence)
1131 expression_parser_function_t *entry = &expression_parsers[token_type];
1133 if(entry->infix_parser != NULL) {
1134 fprintf(stderr, "for token ");
1135 print_token_type(stderr, token_type);
1136 fprintf(stderr, "\n");
1137 panic("trying to register multiple infix expression parsers for a "
1140 entry->infix_parser = parser;
1141 entry->infix_precedence = precedence;
/* Clears the parser table and registers every infix, postfix and prefix
 * parser together with its precedence. parse_sub_expression() stops at an
 * infix operator whose precedence is lower than the requested one, so larger
 * numbers bind more tightly. */
1145 void init_expression_parsers(void)
1147 memset(&expression_parsers, 0, sizeof(expression_parsers));
/* binary operators
 * NOTE(review): the shift operators get 16, the same as '*' and '/', and
 * therefore bind tighter than '+' and '-' (15); in C shifts bind less tightly
 * than the additive operators — confirm this is intended. */
1149 register_expression_infix_parser(parse_BINEXPR_MUL, '*', 16);
1150 register_expression_infix_parser(parse_BINEXPR_DIV, '/', 16);
1151 register_expression_infix_parser(parse_BINEXPR_SHIFTLEFT,
1153 register_expression_infix_parser(parse_BINEXPR_SHIFTRIGHT,
1154 T_GREATERGREATER, 16);
1155 register_expression_infix_parser(parse_BINEXPR_ADD, '+', 15);
1156 register_expression_infix_parser(parse_BINEXPR_SUB, '-', 15);
1157 register_expression_infix_parser(parse_BINEXPR_LESS, '<', 14);
1158 register_expression_infix_parser(parse_BINEXPR_GREATER, '>', 14);
1159 register_expression_infix_parser(parse_BINEXPR_LESSEQUAL, T_LESSEQUAL, 14);
1160 register_expression_infix_parser(parse_BINEXPR_GREATEREQUAL,
1161 T_GREATEREQUAL, 14);
1162 register_expression_infix_parser(parse_BINEXPR_EQUAL, T_EQUALEQUAL, 13);
1163 register_expression_infix_parser(parse_BINEXPR_NOTEQUAL,
1164 T_EXCLAMATIONMARKEQUAL, 13);
1165 register_expression_infix_parser(parse_BINEXPR_BITWISE_AND, '&', 12);
1166 register_expression_infix_parser(parse_BINEXPR_BITWISE_XOR, '^', 11);
1167 register_expression_infix_parser(parse_BINEXPR_BITWISE_OR, '|', 10);
/* NOTE(review): assignment is registered under T_EQUAL while
 * parse_init_declarators() compares the token type against '=' — confirm that
 * both denote the same token value. */
1168 register_expression_infix_parser(parse_BINEXPR_ASSIGN, T_EQUAL, 2);
/* postfix forms: subscript, call, member selection, postfix ++ and -- */
1170 register_expression_infix_parser(parse_array_expression, '[', 30);
1171 register_expression_infix_parser(parse_call_expression, '(', 30);
1172 register_expression_infix_parser(parse_select_expression, '.', 30);
1173 register_expression_infix_parser(parse_select_expression, T_SELECT, 30);
1174 register_expression_infix_parser(parse_UNEXPR_POSTFIX_INCREMENT,
1176 register_expression_infix_parser(parse_UNEXPR_POSTFIX_DECREMENT,
/* prefix operators */
1179 register_expression_parser(parse_UNEXPR_NEGATE, '-', 25);
1180 register_expression_parser(parse_UNEXPR_PLUS, '+', 25);
1181 register_expression_parser(parse_UNEXPR_NOT, '!', 25);
1182 register_expression_parser(parse_UNEXPR_BITWISE_NEGATE, '~', 25);
1183 register_expression_parser(parse_UNEXPR_DEREFERENCE, '*', 25);
1184 register_expression_parser(parse_UNEXPR_TAKE_ADDRESS, '&', 25);
1185 register_expression_parser(parse_UNEXPR_PREFIX_INCREMENT, T_PLUSPLUS, 25);
1186 register_expression_parser(parse_UNEXPR_PREFIX_DECREMENT, T_MINUSMINUS, 25);
1187 register_expression_parser(parse_sizeof, T_sizeof, 25);
/* Statement parsers called from parse_statement() for `case`, `default` and
 * label statements (judging by their names); their bodies are not part of this
 * excerpt. */
1192 statement_t *parse_case_statement(void)
1203 statement_t *parse_default_statement(void)
1213 statement_t *parse_label_statement(void)
/* Parses an if statement; the only visible line tests for an optional `else`
 * part. The remainder of the body is not part of this excerpt. */
1223 statement_t *parse_if(void)
1231 if(token.type == T_else) {
/* Statement parsers called from parse_statement() for `switch`, `while` and
 * `do` statements (judging by their names); their bodies are not part of this
 * excerpt. */
1240 statement_t *parse_switch(void)
1252 statement_t *parse_while(void)
1264 statement_t *parse_do(void)
/* Parses a for statement. The three visible tests check whether each of the
 * three header clauses is present: the first two end at ';', the last at ')'.
 * What is parsed inside each clause is on lines not shown. */
1277 statement_t *parse_for(void)
1281 if(token.type != ';') {
1282 /* TODO not correct... this could also be a declaration */
1286 if(token.type != ';') {
1290 if(token.type != ')') {
/* Parses a goto statement; the visible line requires an identifier (the label)
 * via the expect() macro. The remainder is not part of this excerpt. */
1300 statement_t *parse_goto(void)
1303 expect(T_IDENTIFIER);
/* Statement parsers called from parse_statement() for `continue`, `break` and
 * `return` (judging by their names); their bodies are not part of this
 * excerpt. */
1310 statement_t *parse_continue(void)
1319 statement_t *parse_break(void)
1328 statement_t *parse_return(void)
/* Parses a declaration that appears in statement position by delegating to
 * parse_declaration(). The value returned is on a line not shown. */
1338 statement_t *parse_declaration_statement(void)
1340 parse_declaration();
/* Parses one statement or declaration by switching on the current token and
 * delegating to the matching parse_* function. The case labels, the default
 * path and the return are on lines not shown in this excerpt. */
1345 statement_t *parse_statement(void)
1347 statement_t *statement = NULL;
1349 /* declaration or statement */
1350 switch(token.type) {
1352 statement = parse_case_statement();
1356 statement = parse_default_statement();
1360 statement = parse_label_statement();
1364 statement = parse_compound_statement();
1368 statement = parse_if();
1372 statement = parse_switch();
1376 statement = parse_while();
1380 statement = parse_do();
1384 statement = parse_for();
1388 statement = parse_goto();
1392 statement = parse_continue();
1396 statement = parse_break();
1400 statement = parse_return();
1410 statement = parse_declaration_statement();
/* Parses a block up to its closing '}'. The environment stack height is
 * recorded on entry and restored afterwards, so bindings introduced inside the
 * block end with it. The loop body and the return are on lines not shown.
 * NOTE(review): environment_top() returns size_t but the value is kept in an
 * int before being passed to environment_pop_to(size_t). */
1418 statement_t *parse_compound_statement(void)
1422 int top = environment_top();
1424 while(token.type != '}') {
1428 environment_pop_to(top);
/* Parses declarations until end of input into a freshly allocated
 * translation_unit_t. The file-level `translation_unit` pointer is set for the
 * duration of the parse and reset to NULL afterwards; the asserts check that
 * no parse is already in progress. The return is on a line not shown. */
1436 translation_unit_t *parse_translation_unit(void)
1438 translation_unit_t *unit = allocate_ast_zero(sizeof(unit[0]));
1440 assert(translation_unit == NULL);
1441 assert(context == NULL);
1442 translation_unit = unit;
1444 while(token.type != T_EOF) {
1445 parse_declaration();
1448 translation_unit = NULL;
/* Top-level entry point: sets up the environment obstack and stack, parses the
 * translation unit and tears the environment down again. Passing NULL to GNU
 * obstack_free() releases everything in the obstack. The line(s) between setup
 * and the parse call, and the return, are not shown. */
1452 translation_unit_t *parse(void)
1454 obstack_init(&environment_obstack);
1455 environment_stack = NEW_ARR_F(environment_entry_t*, 0);
1458 translation_unit_t *unit = parse_translation_unit();
1460 DEL_ARR_F(environment_stack);
1461 obstack_free(&environment_obstack, NULL);
/* One-time parser setup: fills the expression parser table. */
1466 void init_parser(void)
1468 init_expression_parsers();
/* Counterpart of init_parser(); its body is not part of this excerpt. */
1471 void exit_parser(void)