X-Git-Url: http://nsz.repo.hu/git/?a=blobdiff_plain;f=parser.c;h=d35396f2cebd706bbe9bd1d83c7c78f3c496b629;hb=a337ecba4682dce4b7ac695cccce0399bbdaaa47;hp=3f73c1d316d8c07bdc337af52ed0935a515df1c2;hpb=5f726e137fc98e9f545df84f390876a4578a2bf4;p=cparser diff --git a/parser.c b/parser.c index 3f73c1d..d35396f 100644 --- a/parser.c +++ b/parser.c @@ -42,9 +42,10 @@ static type_t *type_uint = NULL; static type_t *type_long_double = NULL; static type_t *type_double = NULL; static type_t *type_float = NULL; -static type_t *type_const_char = NULL; +static type_t *type_char = NULL; static type_t *type_string = NULL; static type_t *type_void = NULL; +static type_t *type_void_ptr = NULL; static type_t *type_size_t = NULL; static type_t *type_ptrdiff_t = NULL; @@ -71,14 +72,10 @@ static type_t *parse_typename(void); #ifdef PROVIDE_COMPLEX #define COMPLEX_SPECIFIERS \ case T__Complex: -#else -#define COMPLEX_SPECIFIERS -#endif - -#ifdef PROVIDE_IMAGINARY #define IMAGINARY_SPECIFIERS \ case T__Imaginary: #else +#define COMPLEX_SPECIFIERS #define IMAGINARY_SPECIFIERS #endif @@ -123,6 +120,26 @@ static inline void *allocate_type_zero(size_t size) return res; } +static inline size_t get_initializer_size(initializer_type_t type) +{ + static const size_t size[] = { + [INITIALIZER_VALUE] = sizeof(initializer_value_t), + [INITIALIZER_STRING] = sizeof(initializer_string_t), + [INITIALIZER_LIST] = sizeof(initializer_list_t) + }; + assert(type < INITIALIZER_COUNT); + assert(size[type] != 0); + return size[type]; +} + +static inline initializer_t *allocate_initializer(initializer_type_t type) +{ + initializer_t *result = allocate_ast_zero(get_initializer_size(type)); + result->type = type; + + return result; +} + static inline void free_type(void *type) { obstack_free(type_obst, type); @@ -657,57 +674,62 @@ static expression_t *create_implicit_cast(expression_t *expression, if(source_type == dest_type) return expression; - if(dest_type->type == TYPE_ATOMIC) { - if(source_type->type != TYPE_ATOMIC) - panic("casting of non-atomic types not implemented yet"); + switch (dest_type->type) { + case TYPE_ENUM: + /* TODO warning for implicitly converting to enum */ + case TYPE_ATOMIC: + if (source_type->type != TYPE_ATOMIC && + source_type->type != TYPE_ENUM) { + panic("casting of non-atomic types not implemented yet"); + } - if(is_type_floating(dest_type) && !is_type_scalar(source_type)) { - type_error_incompatible("can't cast types", - expression->source_position, - source_type, dest_type); - return expression; - } + if(is_type_floating(dest_type) && !is_type_scalar(source_type)) { + type_error_incompatible("can't cast types", + expression->source_position, source_type, dest_type); + return expression; + } - return create_cast_expression(expression, dest_type); - } - if(dest_type->type == TYPE_POINTER) { - pointer_type_t *pointer_type - = (pointer_type_t*) dest_type; - switch (source_type->type) { - case TYPE_ATOMIC: - if (is_null_expression(expression)) { - return create_cast_expression(expression, dest_type); - } - break; + return create_cast_expression(expression, dest_type); - case TYPE_POINTER: - if (pointers_compatible(source_type, dest_type)) { - return create_cast_expression(expression, dest_type); - } - break; + case TYPE_POINTER: + switch (source_type->type) { + case TYPE_ATOMIC: + if (is_null_expression(expression)) { + return create_cast_expression(expression, dest_type); + } + break; + + case TYPE_POINTER: + if (pointers_compatible(source_type, dest_type)) { + return create_cast_expression(expression, dest_type); + } + break; - case TYPE_ARRAY: { - array_type_t *const array_type = (array_type_t*) source_type; - if (types_compatible(array_type->element_type, - pointer_type->points_to)) { - return create_cast_expression(expression, dest_type); + case TYPE_ARRAY: { + array_type_t *array_type = (array_type_t*) source_type; + pointer_type_t *pointer_type + = (pointer_type_t*) dest_type; + if (types_compatible(array_type->element_type, + pointer_type->points_to)) { + return create_cast_expression(expression, dest_type); + } + break; } - break; + + default: + panic("casting of non-atomic types not implemented yet"); } - default: - panic("casting of non-atomic types not implemented yet"); - } + type_error_incompatible("can't implicitly cast types", + expression->source_position, source_type, dest_type); + return expression; - type_error_incompatible("can't implicitly cast types", - expression->source_position, - source_type, dest_type); - return expression; + default: + panic("casting of non-atomic types not implemented yet"); } - - panic("casting of non-atomic types not implemented yet"); } +/** Implements the rules from § 6.5.16.1 */ static void semantic_assign(type_t *orig_type_left, expression_t **right, const char *context) { @@ -719,40 +741,55 @@ static void semantic_assign(type_t *orig_type_left, expression_t **right, type_t *const type_left = skip_typeref(orig_type_left); type_t *const type_right = skip_typeref(orig_type_right); - if (type_left == type_right) { - return; - } - if ((is_type_arithmetic(type_left) && is_type_arithmetic(type_right)) || - (type_left->type == TYPE_POINTER && is_null_expression(*right)) || - (type_left->type == TYPE_POINTER && type_right->type == TYPE_POINTER)) { + (is_type_pointer(type_left) && is_null_expression(*right)) || + (is_type_atomic(type_left, ATOMIC_TYPE_BOOL) + && is_type_pointer(type_right))) { *right = create_implicit_cast(*right, type_left); return; } - if (type_left->type == TYPE_POINTER) { - switch (type_right->type) { - case TYPE_FUNCTION: { - pointer_type_t *const ptr_type = (pointer_type_t*)type_left; - if (ptr_type->points_to == type_right) { - return; - } - break; - } + if (is_type_pointer(type_left) && is_type_pointer(type_right)) { + pointer_type_t *pointer_type_left = (pointer_type_t*) type_left; + pointer_type_t *pointer_type_right = (pointer_type_t*) type_right; + type_t *points_to_left = pointer_type_left->points_to; + type_t *points_to_right = pointer_type_right->points_to; - case TYPE_ARRAY: { - pointer_type_t *const ptr_type = (pointer_type_t*)type_left; - array_type_t *const arr_type = (array_type_t*)type_right; - if (ptr_type->points_to == arr_type->element_type) { - return; - } - break; - } + points_to_left = skip_typeref(points_to_left); + points_to_right = skip_typeref(points_to_right); + + if(!is_type_atomic(points_to_left, ATOMIC_TYPE_VOID) + && !is_type_atomic(points_to_right, ATOMIC_TYPE_VOID) + && !types_compatible(points_to_left, points_to_right)) { + goto incompatible_assign_types; + } - default: break; + /* the left type has all qualifiers from the right type */ + unsigned missing_qualifiers + = points_to_right->qualifiers & ~points_to_left->qualifiers; + if(missing_qualifiers != 0) { + parser_print_error_prefix(); + fprintf(stderr, "destination type "); + print_type_quoted(type_left); + fprintf(stderr, " in %s from type ", context); + print_type_quoted(type_right); + fprintf(stderr, " lacks qualifiers '"); + print_type_qualifiers(missing_qualifiers); + fprintf(stderr, "' in pointed-to type\n"); + return; } + + *right = create_implicit_cast(*right, type_left); + return; + } + + if (is_type_compound(type_left) + && types_compatible(type_left, type_right)) { + *right = create_implicit_cast(*right, type_left); + return; } +incompatible_assign_types: /* TODO: improve error message */ parser_print_error_prefix(); fprintf(stderr, "incompatible types in %s\n", context); @@ -897,11 +934,21 @@ static designator_t *parse_designation(void) } #endif +static initializer_t *initializer_from_string(array_type_t *type, + const char *string) +{ + /* TODO: check len vs. size of array type */ + (void) type; + + initializer_t *initializer = allocate_initializer(INITIALIZER_STRING); + initializer->string.string = string; + + return initializer; +} + static initializer_t *initializer_from_expression(type_t *type, expression_t *expression) { - initializer_value_t *result = allocate_ast_zero(sizeof(result[0])); - /* TODO check that expression is a constant expression */ /* § 6.7.8.14/15 char array may be initialized by string literals */ @@ -917,19 +964,19 @@ static initializer_t *initializer_from_expression(type_t *type, if(atype == ATOMIC_TYPE_CHAR || atype == ATOMIC_TYPE_SCHAR || atype == ATOMIC_TYPE_UCHAR) { - /* it's fine TODO: check for length of string array... */ - goto initializer_from_expression_finished; + + string_literal_t *literal = (string_literal_t*) expression; + return initializer_from_string(array_type, literal->value); } } } semantic_assign(type, &expression, "initializer"); -initializer_from_expression_finished: - result->initializer.type = INITIALIZER_VALUE; - result->value = expression; + initializer_t *result = allocate_initializer(INITIALIZER_VALUE); + result->value.value = expression; - return (initializer_t*) result; + return result; } static initializer_t *parse_sub_initializer(type_t *type, @@ -980,13 +1027,12 @@ static initializer_t *parse_sub_initializer(type_t *type, /* TODO: ignore qualifiers, comparing pointers is probably * not correct */ if(expression != NULL && expression_type == type) { - initializer_t *result = allocate_ast_zero(sizeof(result[0])); - result->type = INITIALIZER_VALUE; + initializer_t *result = allocate_initializer(INITIALIZER_VALUE); if(type != NULL) { semantic_assign(type, &expression, "initializer"); } - //result->v.value = expression; + result->value.value = expression; return result; } @@ -998,14 +1044,48 @@ static initializer_t *parse_sub_initializer(type_t *type, } /* descend into subtype */ - initializer_t *result = NULL; + initializer_t *result = NULL; + initializer_t **elems; if(type->type == TYPE_ARRAY) { array_type_t *array_type = (array_type_t*) type; type_t *element_type = array_type->element_type; element_type = skip_typeref(element_type); - result - = parse_sub_initializer(element_type, expression, expression_type); + initializer_t *sub; + had_initializer_brace_warning = false; + if(expression == NULL) { + sub = parse_sub_initializer_elem(element_type); + } else { + sub = parse_sub_initializer(element_type, expression, + expression_type); + } + + /* didn't match the subtypes -> try the parent type */ + if(sub == NULL) { + assert(!read_paren); + return NULL; + } + + elems = NEW_ARR_F(initializer_t*, 0); + ARR_APP1(initializer_t*, elems, sub); + + while(true) { + if(token.type == '}') + break; + expect_block(','); + if(token.type == '}') + break; + + initializer_t *sub + = parse_sub_initializer(element_type, NULL, NULL); + if(sub == NULL) { + /* TODO error, do nicer cleanup */ + parse_error("member initializer didn't match"); + DEL_ARR_F(elems); + return NULL; + } + ARR_APP1(initializer_t*, elems, sub); + } } else { assert(type->type == TYPE_COMPOUND_STRUCT || type->type == TYPE_COMPOUND_UNION); @@ -1032,7 +1112,7 @@ static initializer_t *parse_sub_initializer(type_t *type, return NULL; } - initializer_t **elems = NEW_ARR_F(initializer_t*, 0); + elems = NEW_ARR_F(initializer_t*, 0); ARR_APP1(initializer_t*, elems, sub); declaration_t *iter = first->next; @@ -1045,11 +1125,12 @@ static initializer_t *parse_sub_initializer(type_t *type, if(token.type == '}') break; expect_block(','); + if(token.type == '}') + break; type_t *iter_type = iter->type; iter_type = skip_typeref(iter_type); - /* read next token */ initializer_t *sub = parse_sub_initializer(iter_type, NULL, NULL); if(sub == NULL) { /* TODO error, do nicer cleanup*/ @@ -1059,20 +1140,19 @@ static initializer_t *parse_sub_initializer(type_t *type, } ARR_APP1(initializer_t*, elems, sub); } + } - int len = ARR_LEN(elems); - size_t elems_size = sizeof(initializer_t*) * len; + int len = ARR_LEN(elems); + size_t elems_size = sizeof(initializer_t*) * len; - initializer_list_t *init - = allocate_ast_zero(sizeof(init[0]) + elems_size); + initializer_list_t *init = allocate_ast_zero(sizeof(init[0]) + elems_size); - init->initializer.type = INITIALIZER_LIST; - init->len = len; - memcpy(init->initializers, elems, elems_size); - DEL_ARR_F(elems); + init->initializer.type = INITIALIZER_LIST; + init->len = len; + memcpy(init->initializers, elems, elems_size); + DEL_ARR_F(elems); - result = (initializer_t*) init; - } + result = (initializer_t*) init; if(read_paren) { if(token.type == ',') @@ -1189,7 +1269,7 @@ static declaration_t *parse_compound_type_specifier(bool is_struct) return declaration; } -static void parse_enum_entries(void) +static void parse_enum_entries(enum_type_t *const enum_type) { eat('{'); @@ -1208,13 +1288,16 @@ static void parse_enum_entries(void) return; } entry->storage_class = STORAGE_CLASS_ENUM_ENTRY; + entry->type = (type_t*) enum_type; entry->symbol = token.v.symbol; entry->source_position = token.source_position; next_token(); if(token.type == '=') { next_token(); - entry->init.initializer = parse_initializer(type_int); + entry->init.enum_value = parse_constant_expression(); + + /* TODO semantic */ } record_declaration(entry); @@ -1227,7 +1310,7 @@ static void parse_enum_entries(void) expect_void('}'); } -static declaration_t *parse_enum_specifier(void) +static type_t *parse_enum_specifier(void) { eat(T_enum); @@ -1256,6 +1339,10 @@ static declaration_t *parse_enum_specifier(void) declaration->symbol = symbol; } + enum_type_t *const enum_type = allocate_type_zero(sizeof(enum_type[0])); + enum_type->type.type = TYPE_ENUM; + enum_type->declaration = declaration; + if(token.type == '{') { if(declaration->init.is_defined) { parser_print_error_prefix(); @@ -1265,11 +1352,11 @@ static declaration_t *parse_enum_specifier(void) record_declaration(declaration); declaration->init.is_defined = 1; - parse_enum_entries(); + parse_enum_entries(enum_type); parse_attributes(); } - return declaration; + return (type_t*) enum_type; } /** @@ -1347,8 +1434,6 @@ typedef enum { SPECIFIER_VOID = 1 << 10, #ifdef PROVIDE_COMPLEX SPECIFIER_COMPLEX = 1 << 11, -#endif -#ifdef PROVIDE_IMAGINARY SPECIFIER_IMAGINARY = 1 << 12, #endif } specifiers_t; @@ -1443,8 +1528,6 @@ static void parse_declaration_specifiers(declaration_specifiers_t *specifiers) MATCH_SPECIFIER(T__Bool, SPECIFIER_BOOL, "_Bool") #ifdef PROVIDE_COMPLEX MATCH_SPECIFIER(T__Complex, SPECIFIER_COMPLEX, "_Complex") -#endif -#ifdef PROVIDE_IMAGINARY MATCH_SPECIFIER(T__Imaginary, SPECIFIER_IMAGINARY, "_Imaginary") #endif case T_inline: @@ -1466,31 +1549,24 @@ static void parse_declaration_specifiers(declaration_specifiers_t *specifiers) /* TODO: if type != NULL for the following rules should issue * an error */ case T_struct: { - compound_type_t *compound_type - = allocate_type_zero(sizeof(compound_type[0])); - compound_type->type.type = TYPE_COMPOUND_STRUCT; - compound_type->declaration = parse_compound_type_specifier(true); + type = allocate_type_zero(sizeof(struct compound_type_t)); - type = (type_t*) compound_type; + compound_type_t *compound_type = (compound_type_t*) type; + compound_type->type.type = TYPE_COMPOUND_STRUCT; + compound_type->declaration = parse_compound_type_specifier(true); break; } case T_union: { - compound_type_t *compound_type - = allocate_type_zero(sizeof(compound_type[0])); - compound_type->type.type = TYPE_COMPOUND_UNION; - compound_type->declaration = parse_compound_type_specifier(false); + type = allocate_type_zero(sizeof(compound_type_t)); - type = (type_t*) compound_type; + compound_type_t *compound_type = (compound_type_t*) type; + compound_type->type.type = TYPE_COMPOUND_UNION; + compound_type->declaration = parse_compound_type_specifier(false); break; } - case T_enum: { - enum_type_t *enum_type = allocate_type_zero(sizeof(enum_type[0])); - enum_type->type.type = TYPE_ENUM; - enum_type->declaration = parse_enum_specifier(); - - type = (type_t*) enum_type; + case T_enum: + type = parse_enum_specifier(); break; - } case T___typeof__: type = parse_typeof(); break; @@ -1603,8 +1679,6 @@ finish_specifiers: case SPECIFIER_LONG | SPECIFIER_DOUBLE | SPECIFIER_COMPLEX: atomic_type = ATOMIC_TYPE_LONG_DOUBLE_COMPLEX; break; -#endif -#ifdef PROVIDE_IMAGINARY case SPECIFIER_FLOAT | SPECIFIER_IMAGINARY: atomic_type = ATOMIC_TYPE_FLOAT_IMAGINARY; break; @@ -1658,9 +1732,9 @@ finish_specifiers: specifiers->type = result; } -static unsigned parse_type_qualifiers(void) +static type_qualifiers_t parse_type_qualifiers(void) { - unsigned type_qualifiers = TYPE_QUALIFIER_NONE; + type_qualifiers_t type_qualifiers = TYPE_QUALIFIER_NONE; while(true) { switch(token.type) { @@ -1710,8 +1784,8 @@ static declaration_t *parse_parameter(void) if (declaration->type->type == TYPE_ARRAY) { const array_type_t *const arr_type = (const array_type_t*)declaration->type; - declaration->type = - make_pointer_type(arr_type->element_type, TYPE_QUALIFIER_NONE); + type_t *element_type = arr_type->element_type; + declaration->type = make_pointer_type(element_type, TYPE_QUALIFIER_NONE); } return declaration; @@ -1722,7 +1796,7 @@ static declaration_t *parse_parameters(function_type_t *type) if(token.type == T_IDENTIFIER) { symbol_t *symbol = token.v.symbol; if(!is_typedef_symbol(symbol)) { - /* TODO */ + /* TODO: K&R style C parameters */ parse_identifier_list(); return NULL; } @@ -1794,7 +1868,7 @@ struct construct_type_t { typedef struct parsed_pointer_t parsed_pointer_t; struct parsed_pointer_t { construct_type_t construct_type; - type_qualifier_t type_qualifiers; + type_qualifiers_t type_qualifiers; }; typedef struct construct_function_type_t construct_function_type_t; @@ -1806,7 +1880,7 @@ struct construct_function_type_t { typedef struct parsed_array_t parsed_array_t; struct parsed_array_t { construct_type_t construct_type; - type_qualifier_t type_qualifiers; + type_qualifiers_t type_qualifiers; bool is_static; bool is_variable; expression_t *size; @@ -1843,7 +1917,7 @@ static construct_type_t *parse_array_declarator(void) next_token(); } - type_qualifier_t type_qualifiers = parse_type_qualifiers(); + type_qualifiers_t type_qualifiers = parse_type_qualifiers(); if(type_qualifiers != 0) { if(token.type == T_static) { array->is_static = true; @@ -1888,19 +1962,24 @@ static construct_type_t *parse_function_declarator(declaration_t *declaration) } static construct_type_t *parse_inner_declarator(declaration_t *declaration, - int may_be_abstract) + bool may_be_abstract) { - construct_type_t *result = NULL; - construct_type_t *last = NULL; + /* construct a single linked list of construct_type_t's which describe + * how to construct the final declarator type */ + construct_type_t *first = NULL; + construct_type_t *last = NULL; + /* pointers */ while(token.type == '*') { construct_type_t *type = parse_pointer_declarator(); - if(last != NULL) { - last->next = type; + + if(last == NULL) { + first = type; + last = type; } else { - result = type; + last->next = type; + last = type; } - last = type; } /* TODO: find out if this is correct */ @@ -1937,6 +2016,8 @@ static construct_type_t *parse_inner_declarator(declaration_t *declaration, return NULL; } + construct_type_t *p = last; + while(true) { construct_type_t *type; switch(token.type) { @@ -1950,27 +2031,32 @@ static construct_type_t *parse_inner_declarator(declaration_t *declaration, goto declarator_finished; } - if(last != NULL) { - last->next = type; + /* insert in the middle of the list (behind p) */ + if(p != NULL) { + type->next = p->next; + p->next = type; } else { - result = type; + type->next = first; + first = type; + } + if(last == p) { + last = type; } - last = type; } declarator_finished: parse_attributes(); - if(inner_types != NULL) { - if(last != NULL) { - last->next = inner_types; - } else { - result = inner_types; - } - last = inner_types; + /* append inner_types at the end of the list, we don't to set last anymore + * as it's not needed anymore */ + if(last == NULL) { + assert(first == NULL); + first = inner_types; + } else { + last->next = inner_types; } - return result; + return first; } static type_t *construct_declarator_type(construct_type_t *construct_list, @@ -2022,7 +2108,11 @@ static type_t *construct_declarator_type(construct_type_t *construct_list, type_t *hashed_type = typehash_insert((type_t*) type); if(hashed_type != type) { - free_type(type); + /* the function type was constructed earlier freeing it here will + * destroy other types... */ + if(iter->type != CONSTRUCT_FUNCTION) { + free_type(type); + } type = hashed_type; } } @@ -2102,7 +2192,8 @@ static void parse_init_declarators(const declaration_specifiers_t *specifiers) declaration_t *declaration = record_declaration(ndeclaration); - type_t *type = declaration->type; + type_t *orig_type = declaration->type; + type_t *type = skip_typeref(orig_type); if(type->type != TYPE_FUNCTION && declaration->is_inline) { parser_print_warning_prefix_pos(declaration->source_position); fprintf(stderr, "variable '%s' declared 'inline'\n", @@ -2118,13 +2209,38 @@ static void parse_init_declarators(const declaration_specifiers_t *specifiers) parser_error_multiple_definition(declaration, ndeclaration); } - ndeclaration->init.initializer = parse_initializer(declaration->type); + initializer_t *initializer = parse_initializer(type); + + if(type->type == TYPE_ARRAY && initializer != NULL) { + array_type_t *array_type = (array_type_t*) type; + + if(array_type->size == NULL) { + const_t *cnst = allocate_ast_zero(sizeof(cnst[0])); + + cnst->expression.type = EXPR_CONST; + cnst->expression.datatype = type_size_t; + + if(initializer->type == INITIALIZER_LIST) { + initializer_list_t *list = &initializer->list; + cnst->v.int_value = list->len; + } else { + assert(initializer->type == INITIALIZER_STRING); + initializer_string_t *string = &initializer->string; + cnst->v.int_value = strlen(string->string) + 1; + } + + array_type->size = (expression_t*) cnst; + } + } + + + ndeclaration->init.initializer = initializer; } else if(token.type == '{') { - if(declaration->type->type != TYPE_FUNCTION) { + if(type->type != TYPE_FUNCTION) { parser_print_error_prefix(); - fprintf(stderr, "Declarator "); - print_type_ext(declaration->type, declaration->symbol, NULL); - fprintf(stderr, " has a body but is not a function type.\n"); + fprintf(stderr, "declarator '"); + print_type_ext(orig_type, declaration->symbol, NULL); + fprintf(stderr, "' has a body but is not a function type.\n"); eat_block(); continue; } @@ -2333,7 +2449,7 @@ static expression_t *parse_int_const(void) const_t *cnst = allocate_ast_zero(sizeof(cnst[0])); cnst->expression.type = EXPR_CONST; - cnst->expression.datatype = type_int; + cnst->expression.datatype = token.datatype; cnst->v.int_value = token.v.intvalue; next_token(); @@ -2346,7 +2462,7 @@ static expression_t *parse_float_const(void) const_t *cnst = allocate_ast_zero(sizeof(cnst[0])); cnst->expression.type = EXPR_CONST; - cnst->expression.datatype = type_double; + cnst->expression.datatype = token.datatype; cnst->v.float_value = token.v.floatvalue; next_token(); @@ -2393,6 +2509,110 @@ static declaration_t *create_implicit_function(symbol_t *symbol, return declaration; } +static type_t *make_function_1_type(type_t *result_type, type_t *argument_type) +{ + function_parameter_t *parameter = allocate_type_zero(sizeof(parameter[0])); + parameter->type = argument_type; + + function_type_t *type = allocate_type_zero(sizeof(type[0])); + type->type.type = TYPE_FUNCTION; + type->result_type = result_type; + type->parameters = parameter; + + type_t *result = typehash_insert((type_t*) type); + if(result != (type_t*) type) { + free_type(type); + } + + return result; +} + +static type_t *get_builtin_symbol_type(symbol_t *symbol) +{ + switch(symbol->ID) { + case T___builtin_alloca: + return make_function_1_type(type_void_ptr, type_size_t); + default: + panic("not implemented builtin symbol found"); + } +} + +/** + * performs automatic type cast as described in § 6.3.2.1 + */ +static type_t *automatic_type_conversion(type_t *type) +{ + if(type == NULL) + return NULL; + + if(type->type == TYPE_ARRAY) { + array_type_t *array_type = (array_type_t*) type; + type_t *element_type = array_type->element_type; + unsigned qualifiers = array_type->type.qualifiers; + + return make_pointer_type(element_type, qualifiers); + } + + if(type->type == TYPE_FUNCTION) { + return make_pointer_type(type, TYPE_QUALIFIER_NONE); + } + + return type; +} + +/** + * reverts the automatic casts of array to pointer types and function + * to function-pointer types as defined § 6.3.2.1 + */ +type_t *revert_automatic_type_conversion(const expression_t *expression) +{ + if(expression->datatype == NULL) + return NULL; + + switch(expression->type) { + case EXPR_REFERENCE: { + const reference_expression_t *ref + = (const reference_expression_t*) expression; + return ref->declaration->type; + } + case EXPR_SELECT: { + const select_expression_t *select + = (const select_expression_t*) expression; + return select->compound_entry->type; + } + case EXPR_UNARY: { + const unary_expression_t *unary + = (const unary_expression_t*) expression; + if(unary->type == UNEXPR_DEREFERENCE) { + expression_t *value = unary->value; + type_t *type = skip_typeref(value->datatype); + pointer_type_t *pointer_type = (pointer_type_t*) type; + + return pointer_type->points_to; + } + break; + } + case EXPR_BUILTIN_SYMBOL: { + const builtin_symbol_expression_t *builtin + = (const builtin_symbol_expression_t*) expression; + return get_builtin_symbol_type(builtin->symbol); + } + case EXPR_ARRAY_ACCESS: { + const array_access_expression_t *array_access + = (const array_access_expression_t*) expression; + type_t *type_left = skip_typeref(array_access->array_ref->datatype); + assert(is_type_pointer(type_left)); + pointer_type_t *pointer_type = (pointer_type_t*) type_left; + return pointer_type->points_to; + } + + default: + break; + } + + return expression->datatype; +} + static expression_t *parse_reference(void) { reference_expression_t *ref = allocate_ast_zero(sizeof(ref[0])); @@ -2424,8 +2644,13 @@ static expression_t *parse_reference(void) } } + type_t *type = declaration->type; + /* we always do the auto-type conversions; the & and sizeof parser contains + * code to revert this! */ + type = automatic_type_conversion(type); + ref->declaration = declaration; - ref->expression.datatype = declaration->type; + ref->expression.datatype = type; return (expression_t*) ref; } @@ -2641,12 +2866,13 @@ static expression_t *parse_builtin_symbol(void) = allocate_ast_zero(sizeof(expression[0])); expression->expression.type = EXPR_BUILTIN_SYMBOL; - /* TODO: set datatype */ - expression->symbol = token.v.symbol; - next_token(); + type_t *type = get_builtin_symbol_type(expression->symbol); + type = automatic_type_conversion(type); + + expression->expression.datatype = type; return (expression_t*) expression; } @@ -2670,6 +2896,7 @@ static expression_t *parse_primary_expression(void) return parse_offsetof(); case T___builtin_va_arg: return parse_va_arg(); + case T___builtin_alloca: case T___builtin_expect: case T___builtin_va_start: case T___builtin_va_end: @@ -2689,33 +2916,46 @@ static expression_t *parse_primary_expression(void) } static expression_t *parse_array_expression(unsigned precedence, - expression_t *array_ref) + expression_t *left) { (void) precedence; eat('['); + expression_t *inside = parse_expression(); + array_access_expression_t *array_access = allocate_ast_zero(sizeof(array_access[0])); - array_access->expression.type = EXPR_ARRAY_ACCESS; - array_access->array_ref = array_ref; - array_access->index = parse_expression(); - - type_t *type = array_ref->datatype; - if(type != NULL) { - if(type->type == TYPE_POINTER) { - pointer_type_t *pointer = (pointer_type_t*) type; - array_access->expression.datatype = pointer->points_to; - } else if(type->type == TYPE_ARRAY) { - array_type_t *array_type = (array_type_t*) type; - array_access->expression.datatype = array_type->element_type; + array_access->expression.type = EXPR_ARRAY_ACCESS; + + type_t *type_left = skip_typeref(left->datatype); + type_t *type_inside = skip_typeref(inside->datatype); + type_t *result_type; + + if(type_left != NULL && type_inside != NULL) { + if(is_type_pointer(type_left)) { + pointer_type_t *pointer = (pointer_type_t*) type_left; + result_type = pointer->points_to; + array_access->array_ref = left; + array_access->index = inside; + } else if(is_type_pointer(type_inside)) { + pointer_type_t *pointer = (pointer_type_t*) type_inside; + result_type = pointer->points_to; + array_access->array_ref = inside; + array_access->index = left; + array_access->flipped = true; } else { parser_print_error_prefix(); - fprintf(stderr, "array access on object with non-pointer type "); - print_type_quoted(type); + fprintf(stderr, "array access on object with non-pointer types "); + print_type_quoted(type_left); + fprintf(stderr, ", "); + print_type_quoted(type_inside); fprintf(stderr, "\n"); } + } else { + array_access->array_ref = left; + array_access->index = inside; } if(token.type != ']') { @@ -2724,6 +2964,9 @@ static expression_t *parse_array_expression(unsigned precedence, } next_token(); + result_type = automatic_type_conversion(result_type); + array_access->expression.datatype = result_type; + return (expression_t*) array_access; } @@ -2760,7 +3003,9 @@ static expression_t *parse_sizeof(unsigned precedence) sizeof_expression->type = parse_typename(); expect(')'); } else { - expression_t *expression = parse_sub_expression(precedence); + expression_t *expression = parse_sub_expression(precedence); + expression->datatype = revert_automatic_type_conversion(expression); + sizeof_expression->type = expression->datatype; sizeof_expression->size_expression = expression; } @@ -2790,16 +3035,18 @@ static expression_t *parse_select_expression(unsigned precedence, select->symbol = symbol; next_token(); - type_t *type = compound->datatype; - if(type == NULL) + type_t *orig_type = compound->datatype; + if(orig_type == NULL) return make_invalid_expression(); + type_t *type = skip_typeref(orig_type); + type_t *type_left = type; if(is_pointer) { if(type->type != TYPE_POINTER) { parser_print_error_prefix(); fprintf(stderr, "left hand side of '->' is not a pointer, but "); - print_type_quoted(type); + print_type_quoted(orig_type); fputc('\n', stderr); return make_invalid_expression(); } @@ -2843,8 +3090,12 @@ static expression_t *parse_select_expression(unsigned precedence, return make_invalid_expression(); } + /* we always do the auto-type conversions; the & and sizeof parser contains + * code to revert this! */ + type_t *expression_type = automatic_type_conversion(iter->type); + select->compound_entry = iter; - select->expression.datatype = iter->type; + select->expression.datatype = expression_type; return (expression_t*) select; } @@ -2857,25 +3108,32 @@ static expression_t *parse_call_expression(unsigned precedence, call->function = expression; function_type_t *function_type; - type_t *type = expression->datatype; - if (type->type == TYPE_FUNCTION) { - function_type = (function_type_t*) type; - call->expression.datatype = function_type->result_type; - } else if (type->type == TYPE_POINTER && - ((pointer_type_t*)type)->points_to->type == TYPE_FUNCTION) { - pointer_type_t *const ptr_type = (pointer_type_t*)type; - function_type = (function_type_t*)ptr_type->points_to; - call->expression.datatype = function_type->result_type; - } else { - parser_print_error_prefix(); - fputs("called object '", stderr); - print_expression(expression); - fputs("' (type ", stderr); - print_type_quoted(type); - fputs(") is not a function\n", stderr); + type_t *orig_type = expression->datatype; + if(orig_type != NULL) { + function_type = NULL; + type_t *type = skip_typeref(orig_type); + + if(is_type_pointer(type)) { + pointer_type_t *pointer_type = (pointer_type_t*) type; + + type = skip_typeref(pointer_type->points_to); + + if (type->type == TYPE_FUNCTION) { + function_type = (function_type_t*) type; + call->expression.datatype = function_type->result_type; + } + } + if(function_type == NULL) { + parser_print_error_prefix(); + fputs("called object '", stderr); + print_expression(expression); + fputs("' (type ", stderr); + print_type_quoted(orig_type); + fputs(") is not a pointer to a function\n", stderr); - function_type = NULL; - call->expression.datatype = NULL; + function_type = NULL; + call->expression.datatype = NULL; + } } /* parse arguments */ @@ -2959,14 +3217,16 @@ static expression_t *parse_conditional_expression(unsigned precedence, conditional_expression_t *conditional = allocate_ast_zero(sizeof(conditional[0])); conditional->expression.type = EXPR_CONDITIONAL; - conditional->condition = expression; + conditional->condition = expression; /* 6.5.15.2 */ type_t *condition_type_orig = conditional->condition->datatype; - type_t *condition_type = skip_typeref(condition_type_orig); - if(condition_type != NULL && !is_type_scalar(condition_type)) { - type_error("expected a scalar type", expression->source_position, - condition_type_orig); + if(condition_type_orig != NULL) { + type_t *condition_type = skip_typeref(condition_type_orig); + if(condition_type != NULL && !is_type_scalar(condition_type)) { + type_error("expected a scalar type", expression->source_position, + condition_type_orig); + } } expression_t *const t_expr = parse_expression(); @@ -3112,35 +3372,30 @@ static void semantic_dereference(unary_expression_t *expression) return; type_t *type = skip_typeref(orig_type); - switch (type->type) { - case TYPE_ARRAY: { - array_type_t *const array_type = (array_type_t*)type; - expression->expression.datatype = array_type->element_type; - break; - } + if(!is_type_pointer(type)) { + parser_print_error_prefix(); + fputs("'Unary *' needs pointer or arrray type, but type ", stderr); + print_type_quoted(orig_type); + fputs(" given.\n", stderr); + return; + } - case TYPE_POINTER: { - pointer_type_t *pointer_type = (pointer_type_t*)type; - expression->expression.datatype = pointer_type->points_to; - break; - } + pointer_type_t *pointer_type = (pointer_type_t*)type; + type_t *result_type = pointer_type->points_to; - default: - parser_print_error_prefix(); - fputs("'Unary *' needs pointer or arrray type, but type ", stderr); - print_type_quoted(orig_type); - fputs(" given.\n", stderr); - return; - } + result_type = automatic_type_conversion(result_type); + expression->expression.datatype = result_type; } static void semantic_take_addr(unary_expression_t *expression) { - type_t *orig_type = expression->value->datatype; + expression_t *value = expression->value; + value->datatype = revert_automatic_type_conversion(value); + + type_t *orig_type = value->datatype; if(orig_type == NULL) return; - expression_t *value = expression->value; if(value->type == EXPR_REFERENCE) { reference_expression_t *reference = (reference_expression_t*) value; declaration_t *declaration = reference->declaration; @@ -3149,7 +3404,7 @@ static void semantic_take_addr(unary_expression_t *expression) } } - expression->expression.datatype = make_pointer_type(orig_type, 0); + expression->expression.datatype = make_pointer_type(orig_type, TYPE_QUALIFIER_NONE); } #define CREATE_UNARY_EXPRESSION_PARSER(token_type, unexpression_type, sfunc) \ @@ -3314,18 +3569,10 @@ static void semantic_add(binary_expression_t *expression) expression->right = create_implicit_cast(right, arithmetic_type); expression->expression.datatype = arithmetic_type; return; - } else if(type_left->type == TYPE_POINTER && is_type_integer(type_right)) { + } else if(is_type_pointer(type_left) && is_type_integer(type_right)) { expression->expression.datatype = type_left; - } else if(type_right->type == TYPE_POINTER && is_type_integer(type_left)) { + } else if(is_type_pointer(type_right) && is_type_integer(type_left)) { expression->expression.datatype = type_right; - } else if (type_left->type == TYPE_ARRAY && is_type_integer(type_right)) { - const array_type_t *const arr_type = (const array_type_t*)type_left; - expression->expression.datatype = - make_pointer_type(arr_type->element_type, TYPE_QUALIFIER_NONE); - } else if (type_right->type == TYPE_ARRAY && is_type_integer(type_left)) { - const array_type_t *const arr_type = (const array_type_t*)type_right; - expression->expression.datatype = - make_pointer_type(arr_type->element_type, TYPE_QUALIFIER_NONE); } else { parser_print_error_prefix(); fprintf(stderr, "invalid operands to binary + ("); @@ -3408,8 +3655,7 @@ static void semantic_comparison(binary_expression_t *expression) expression->left = create_implicit_cast(left, type_right); } else { type_error_incompatible("invalid operands in comparison", - expression->expression.source_position, - type_left, type_right); + token.source_position, type_left, type_right); } expression->expression.datatype = type_int; } @@ -3500,18 +3746,63 @@ static void semantic_logical_op(binary_expression_t *expression) expression->expression.datatype = type_int; } +static bool has_const_fields(type_t *type) +{ + (void) type; + /* TODO */ + return false; +} + static void semantic_binexpr_assign(binary_expression_t *expression) { - expression_t *left = expression->left; - type_t *type_left = left->datatype; + expression_t *left = expression->left; + type_t *orig_type_left = left->datatype; + + if(orig_type_left == NULL) + return; + + type_t *type_left = revert_automatic_type_conversion(left); + type_left = skip_typeref(orig_type_left); + /* must be a modifiable lvalue */ if (type_left->type == TYPE_ARRAY) { - parse_error("Cannot assign to arrays."); - } else if (type_left != NULL) { - semantic_assign(type_left, &expression->right, "assignment"); + parser_print_error_prefix(); + fprintf(stderr, "Cannot assign to arrays ('"); + print_expression(left); + fprintf(stderr, "')\n"); + return; + } + if(type_left->qualifiers & TYPE_QUALIFIER_CONST) { + parser_print_error_prefix(); + fprintf(stderr, "assignment to readonly location '"); + print_expression(left); + fprintf(stderr, "' (type "); + print_type_quoted(orig_type_left); + fprintf(stderr, ")\n"); + return; + } + if(is_type_incomplete(type_left)) { + parser_print_error_prefix(); + fprintf(stderr, "left-hand side of assignment '"); + print_expression(left); + fprintf(stderr, "' has incomplete type "); + print_type_quoted(orig_type_left); + fprintf(stderr, "\n"); + return; + } + if(is_type_compound(type_left) && has_const_fields(type_left)) { + parser_print_error_prefix(); + fprintf(stderr, "can't assign to '"); + print_expression(left); + fprintf(stderr, "' because compound type "); + print_type_quoted(orig_type_left); + fprintf(stderr, " has readonly fields\n"); + return; } - expression->expression.datatype = type_left; + semantic_assign(orig_type_left, &expression->right, "assignment"); + + expression->expression.datatype = orig_type_left; } static void semantic_comma(binary_expression_t *expression) @@ -3558,7 +3849,6 @@ CREATE_BINEXPR_PARSER('|', BINEXPR_BITWISE_OR, semantic_binexpr_arithmetic, CREATE_BINEXPR_PARSER('^', BINEXPR_BITWISE_XOR, semantic_binexpr_arithmetic, 1) CREATE_BINEXPR_PARSER(T_ANDAND, BINEXPR_LOGICAL_AND, semantic_logical_op, 1) CREATE_BINEXPR_PARSER(T_PIPEPIPE, BINEXPR_LOGICAL_OR, semantic_logical_op, 1) -/* TODO shift has a bit special semantic */ CREATE_BINEXPR_PARSER(T_LESSLESS, BINEXPR_SHIFTLEFT, semantic_shift_op, 1) CREATE_BINEXPR_PARSER(T_GREATERGREATER, BINEXPR_SHIFTRIGHT, @@ -3745,7 +4035,7 @@ static statement_t *parse_case_statement(void) label->expression = parse_expression(); expect(':'); - label->statement.next = parse_statement(); + label->label_statement = parse_statement(); return (statement_t*) label; } @@ -3759,7 +4049,7 @@ static statement_t *parse_default_statement(void) label->statement.source_position = token.source_position; expect(':'); - label->statement.next = parse_statement(); + label->label_statement = parse_statement(); return (statement_t*) label; } @@ -4262,16 +4552,17 @@ void init_parser(void) init_expression_parsers(); obstack_init(&temp_obst); - type_int = make_atomic_type(ATOMIC_TYPE_INT, 0); - type_uint = make_atomic_type(ATOMIC_TYPE_UINT, 0); - type_long_double = make_atomic_type(ATOMIC_TYPE_LONG_DOUBLE, 0); - type_double = make_atomic_type(ATOMIC_TYPE_DOUBLE, 0); - type_float = make_atomic_type(ATOMIC_TYPE_FLOAT, 0); - type_size_t = make_atomic_type(ATOMIC_TYPE_ULONG, 0); - type_ptrdiff_t = make_atomic_type(ATOMIC_TYPE_LONG, 0); - type_const_char = make_atomic_type(ATOMIC_TYPE_CHAR, TYPE_QUALIFIER_CONST); - type_void = make_atomic_type(ATOMIC_TYPE_VOID, 0); - type_string = make_pointer_type(type_const_char, 0); + type_int = make_atomic_type(ATOMIC_TYPE_INT, TYPE_QUALIFIER_NONE); + type_uint = make_atomic_type(ATOMIC_TYPE_UINT, TYPE_QUALIFIER_NONE); + type_long_double = make_atomic_type(ATOMIC_TYPE_LONG_DOUBLE, TYPE_QUALIFIER_NONE); + type_double = make_atomic_type(ATOMIC_TYPE_DOUBLE, TYPE_QUALIFIER_NONE); + type_float = make_atomic_type(ATOMIC_TYPE_FLOAT, TYPE_QUALIFIER_NONE); + type_size_t = make_atomic_type(ATOMIC_TYPE_ULONG, TYPE_QUALIFIER_NONE); + type_ptrdiff_t = make_atomic_type(ATOMIC_TYPE_LONG, TYPE_QUALIFIER_NONE); + type_char = make_atomic_type(ATOMIC_TYPE_CHAR, TYPE_QUALIFIER_NONE); + type_void = make_atomic_type(ATOMIC_TYPE_VOID, TYPE_QUALIFIER_NONE); + type_void_ptr = make_pointer_type(type_void, TYPE_QUALIFIER_NONE); + type_string = make_pointer_type(type_char, TYPE_QUALIFIER_NONE); } void exit_parser(void)