2 * This file is part of cparser.
3 * Copyright (C) 2007-2009 Matthias Braun <matze@braunis.de>
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version 2
8 * of the License, or (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
29 #include "lang_features.h"
30 #include "adt/array.h"
31 #include "adt/error.h"
/* Lookup tables indexed by token kind. A slot is filled by
 * intern_register_token() / intern_register_pp_token() only while it is
 * still NULL; init_tokens() zeroes both tables before registration. */
34 static symbol_t *token_symbols[T_LAST_TOKEN];
35 static symbol_t *pp_token_symbols[TP_LAST_TOKEN];
/* Source position labelled "<built-in>".
 * NOTE(review): the meaning of the remaining initialisers (0, 0, true)
 * depends on the field order of source_position_t, declared elsewhere. */
37 const source_position_t builtin_source_position = { "<built-in>", 0, 0, true };
/* Lower bound checked by the assertion in register_token() (id >= last_id).
 * NOTE(review): the statement that updates it is not visible in this
 * excerpt. */
39 static token_kind_t last_id;
/**
 * Passes @p string to symbol_table_insert() and stores the resulting symbol
 * in token_symbols[id] if that slot is still NULL; an already occupied slot
 * is left unchanged.
 *
 * @param id      token kind; asserted to be below T_LAST_TOKEN
 * @param string  spelling handed to symbol_table_insert()
 *
 * NOTE(review): the lines after the assignment are missing from this excerpt.
 * register_token() uses the return value as a symbol_t*, so presumably
 * `symbol` is returned -- confirm against the full file.
 */
41 static symbol_t *intern_register_token(token_kind_t id, const char *string)
/* Guard the index used on token_symbols below. */
43 assert(id < T_LAST_TOKEN);
44 symbol_t *symbol = symbol_table_insert(string);
/* First registration for a kind wins. */
45 if (token_symbols[id] == NULL)
46 token_symbols[id] = symbol;
/**
 * Preprocessor counterpart of intern_register_token(): passes @p string to
 * symbol_table_insert() and stores the resulting symbol in
 * pp_token_symbols[id] if that slot is still NULL.
 *
 * @param id      preprocessor token kind; asserted to be below TP_LAST_TOKEN
 * @param string  spelling handed to symbol_table_insert()
 *
 * NOTE(review): the return statement is not visible in this excerpt;
 * register_pp_token() uses the result as a symbol_t*, so presumably `symbol`
 * is returned -- confirm.
 */
50 static symbol_t *intern_register_pp_token(preprocessor_token_kind_t id, const char *string)
/* Guard the index used on pp_token_symbols below. */
52 assert(id < TP_LAST_TOKEN);
53 symbol_t *symbol = symbol_table_insert(string);
/* First registration for a kind wins. */
54 if (pp_token_symbols[id] == NULL)
55 pp_token_symbols[id] = symbol;
/**
 * Registers token kind @p id with spelling @p string via
 * intern_register_token().
 *
 * NOTE(review): several lines of this function are missing from the excerpt.
 * How @p mode gates the registration, when last_id is updated, and what is
 * done with `symbol` afterwards are not visible here. register_pp_token()
 * tests `c_mode & mode`; presumably this function does something similar --
 * confirm against the full file.
 */
59 static void register_token(unsigned mode, token_kind_t id, const char *string)
/* Ids are expected to arrive in non-decreasing order relative to last_id. */
62 assert(id >= last_id);
66 symbol_t *symbol = intern_register_token(id, string);
/**
 * Registers preprocessor token kind @p id via intern_register_pp_token().
 *
 * NOTE(review): the rest of the parameter list, the statement controlled by
 * the `if`, and the use of `symbol` are missing from this excerpt. The
 * condition is true when @p mode shares no bits with c_mode; presumably the
 * function returns early in that case -- confirm.
 */
71 static void register_pp_token(unsigned mode, preprocessor_token_kind_t id,
/* True when none of the bits in `mode` are set in c_mode. */
74 if (! (c_mode & mode))
77 symbol_t *symbol = intern_register_pp_token(id, string);
/**
 * Clears both symbol lookup tables and then registers tokens through the
 * T()/TS() macros defined below.
 *
 * T(mode, x, str, val) expands to a register_*token() call that forwards
 * `mode`; TS(x, str, val) expands to a direct intern_register_*token() call
 * and takes no mode. `val` is unused by either expansion.
 *
 * NOTE(review): the #include that consumes the first macro pair and the
 * matching #undef lines are not visible in this excerpt; only the
 * "tokens_preprocessor.inc" include for the second pair is shown.
 */
81 void init_tokens(void)
/* Reset every slot to NULL so the "first registration wins" checks work. */
83 memset(token_symbols, 0, T_LAST_TOKEN * sizeof(token_symbols[0]));
84 memset(pp_token_symbols, 0, TP_LAST_TOKEN * sizeof(pp_token_symbols[0]));
/* Macro pair for the regular token table (T_ prefix). */
86 #define T(mode,x,str,val) register_token(mode, T_##x, str);
87 #define TS(x,str,val) intern_register_token(T_##x, str);
/* Macro pair for the preprocessor token table (TP_ prefix). */
92 #define T(mode,x,str,val) register_pp_token(mode, TP_##x, str);
93 #define TS(x,str,val) intern_register_pp_token(TP_##x, str);
94 #include "tokens_preprocessor.inc"
/* Counterpart to init_tokens().
 * NOTE(review): the body is not visible in this excerpt. */
99 void exit_tokens(void)
/**
 * Writes a human-readable name for @p token_kind to @p f.
 *
 * Visible outputs: "end of file" for T_EOF, "invalid token" for kinds outside
 * token_symbols, the registered symbol's string, the kind itself as a single
 * character when it is below 256, and "unknown token".
 *
 * NOTE(review): the lines between these statements (returns, and presumably
 * a NULL check on `symbol` before it is dereferenced) are missing from this
 * excerpt -- confirm the exact branching against the full file.
 */
103 void print_token_kind(FILE *f, token_kind_t token_kind)
105 if(token_kind == T_EOF) {
106 fputs("end of file", f);
/* Bounds check before indexing token_symbols. */
110 if (token_kind >= lengthof(token_symbols)) {
111 fputs("invalid token", f);
115 const symbol_t *symbol = token_symbols[token_kind];
117 fputs(symbol->string, f);
/* Kinds below 256 are written as the character with that value. */
119 if (token_kind < 256) {
120 fputc(token_kind, f);
123 fputs("unknown token", f);
/**
 * Returns the source-level prefix for a string encoding: "" for
 * STRING_ENCODING_CHAR and "L" for STRING_ENCODING_WIDE.
 * Calls panic("invalid string encoding") on the remaining path.
 *
 * NOTE(review): the switch header is missing from this excerpt; presumably
 * it switches on @p enc and the panic is reached for any other value --
 * confirm.
 */
127 char const *get_string_encoding_prefix(string_encoding_t const enc)
130 case STRING_ENCODING_CHAR: return "";
131 case STRING_ENCODING_WIDE: return "L";
133 panic("invalid string encoding");
/**
 * Writes the characters of @p string to @p f one at a time.
 *
 * The loop is bounded by string->size, so exactly that many characters are
 * emitted and no NUL terminator is needed.
 */
136 static void print_stringrep(const string_t *string, FILE *f)
138 for (size_t i = 0; i < string->size; ++i) {
139 fputc(string->begin[i], f);
/**
 * Writes a description of @p token to @p f, choosing the format from
 * token->kind.
 *
 * NOTE(review): several case labels, break statements and closing braces are
 * missing from this excerpt; the comments below describe only the visible
 * statements.
 */
143 void print_token(FILE *f, const token_t *token)
145 switch(token->kind) {
/* Case label not visible; prints the token's symbol string. */
147 fprintf(f, "identifier '%s'", token->base.symbol->string);
/* Numeric tokens: kind name, then the number text and, if non-empty, its
 * suffix (both size-bounded via print_stringrep). */
150 case T_FLOATINGPOINT:
151 print_token_kind(f, (token_kind_t)token->kind);
153 print_stringrep(&token->number.number, f);
154 if (token->number.suffix.size > 0)
155 print_stringrep(&token->number.suffix, f);
/* String literal: kind name, encoding prefix, then the text in double quotes.
 * NOTE(review): "%s" reads string.begin up to a NUL byte rather than
 * honouring string.size as print_stringrep does -- confirm the buffer is
 * always NUL-terminated and contains no embedded NULs. */
159 case T_STRING_LITERAL:
160 print_token_kind(f, (token_kind_t)token->kind);
161 fprintf(f, " %s\"%s\"", get_string_encoding_prefix(token->string.encoding), token->string.string.begin);
/* Character constant: kind name, encoding prefix and opening quote, then the
 * size-bounded text. The closing quote is not visible in this excerpt. */
164 case T_CHARACTER_CONSTANT:
165 print_token_kind(f, (token_kind_t)token->kind);
166 fprintf(f, " %s'", get_string_encoding_prefix(token->string.encoding));
167 print_stringrep(&token->string.string, f);
/* Remaining kinds (label not visible): the quoted symbol string when the
 * token carries a symbol; print_token_kind() is the other visible output. */
172 if (token->base.symbol) {
173 fprintf(f, "'%s'", token->base.symbol->string);
176 print_token_kind(f, (token_kind_t)token->kind);
/**
 * Writes a human-readable name for preprocessor token kind @p token_kind
 * to @p f.
 *
 * Visible outputs: "end of file" for TP_EOF, "invalid token" for kinds that
 * are negative or not below TP_LAST_TOKEN, the registered symbol's string
 * when one exists, the kind as a single character when it is in [0, 256),
 * and "unknown token".
 *
 * NOTE(review): return/else lines between the visible statements are missing
 * from this excerpt -- confirm the exact branching.
 */
183 void print_pp_token_kind(FILE *f, int token_kind)
185 if (token_kind == TP_EOF) {
186 fputs("end of file", f);
/* token_kind is a signed int here, so both bounds are checked. */
190 int token_symbols_len = TP_LAST_TOKEN;
191 if (token_kind < 0 || token_kind >= token_symbols_len) {
192 fputs("invalid token", f);
196 const symbol_t *symbol = pp_token_symbols[token_kind];
197 if (symbol != NULL) {
198 fputs(symbol->string, f);
/* NOTE(review): `token_kind >= 0` looks redundant if the range check above
 * returns for negative kinds -- confirm. */
200 if(token_kind >= 0 && token_kind < 256) {
201 fputc(token_kind, f);
204 fputs("unknown token", f);
/**
 * Writes a description of preprocessor token @p token to @p f, choosing the
 * format from token->kind.
 *
 * NOTE(review): some case labels and break statements are missing from this
 * excerpt. The number and string cases format `.begin` with "%s", which reads
 * up to a NUL byte and ignores the string_t size that print_stringrep()
 * honours -- confirm these buffers are always NUL-terminated.
 */
208 void print_pp_token(FILE *f, const token_t *token)
210 switch((preprocessor_token_kind_t) token->kind) {
/* Case label not visible; prints the token's symbol string. */
212 fprintf(f, "identifier '%s'", token->base.symbol->string);
/* Case label not visible; prints the number text. */
215 fprintf(f, "number '%s'", token->number.number.begin);
217 case TP_STRING_LITERAL:
218 fprintf(f, "string \"%s\"", token->string.string.begin);
/* Label not visible (presumably the default case): print the kind name. */
221 print_pp_token_kind(f, (preprocessor_token_kind_t) token->kind);
/**
 * Reports whether a token of kind @p token1 directly followed by a token of
 * kind @p token2 matches one of the combinations listed below. Most cases
 * decide on `c`, the first character of token2's spelling.
 *
 * NOTE(review): the switch header, two case labels and the end of the
 * function are missing from this excerpt. The case labels are token kinds,
 * so presumably the switch is on @p token1 -- confirm.
 */
226 bool tokens_would_paste(preprocessor_token_kind_t token1,
227 preprocessor_token_kind_t token2)
/* Kinds below 256 are used directly as the character; for other kinds the
 * first character of the registered spelling is used.
 * NOTE(review): pp_token_symbols[token2] is dereferenced without a NULL or
 * range check. Slots stay NULL for kinds that were never registered (e.g.
 * register_pp_token() tests c_mode & mode before registering) -- confirm
 * callers never pass such a kind. */
229 char c = token2 < 256 ? (char) token2 : pp_token_symbols[token2]->string[0];
/* Punctuators: true when `c` is one of the listed follow-up characters. */
232 case '>': return c == '>' || c == '=';
233 case '<': return c == '<' || c == '=' || c == '%' || c == ':';
234 case '+': return c == '+' || c == '=';
235 case '-': return c == '-' || c == '>';
236 case '/': return c == '/' || c == '=' || c == '*';
237 case '%': return c == ':' || c == '=' || c == '>';
238 case '&': return c == '&' || c == '=';
239 case '|': return c == '|' || c == '=';
240 case ':': return c == ':' || c == '>';
241 case '*': return c == '*' || c == '=';
/* '.' is also followed by a check for a number token of any spelling. */
242 case '.': return c == '.' || c == '%' || token2 == TP_NUMBER;
243 case '#': return c == '#' || c == '%';
244 case TP_GREATERGREATER: return c == '=';
245 case TP_LESSLESS: return c == '=';
246 case '^': return c == '=';
247 case '!': return c == '=';
/* Case label not visible in this excerpt: true for a following identifier,
 * number, or (wide) character/string literal. */
249 return token2 == TP_IDENTIFIER || token2 == TP_NUMBER ||
250 token2 == TP_CHARACTER_CONSTANT ||
251 token2 == TP_WIDE_CHARACTER_CONSTANT ||
252 token2 == TP_WIDE_STRING_LITERAL ||
253 token2 == TP_STRING_LITERAL; /* L */
/* Case label not visible in this excerpt: true for a following number,
 * identifier, '.', '+' or '-'. */
255 return token2 == TP_NUMBER || token2 == TP_IDENTIFIER ||
256 token2 == '.' || token2 == '+' || token2 == '-';