eat() the ':' token of a label statement instead of expect()ing it, because the looka...
[cparser] / main.c
1 #include <config.h>
2
3 #define _GNU_SOURCE
4
5 #include <stdio.h>
6 #include <stdlib.h>
7 #include <stdbool.h>
8 #include <errno.h>
9 #include <string.h>
10 #include <assert.h>
11
12 #ifdef _WIN32
13
14 #include <fcntl.h>
15 #include <io.h>
16
17 /* no eXecute on Win32 */
18 #define X_OK 0
19 #define W_OK 2
20 #define R_OK 4
21
22 #define O_RDWR          _O_RDWR
23 #define O_CREAT         _O_CREAT
24 #define O_EXCL          _O_EXCL
25 #define O_BINARY        _O_BINARY
26
27 /* remap some names, we are not in the POSIX world */
28 #define access(fname, mode)      _access(fname, mode)
29 #define mktemp(tmpl)             _mktemp(tmpl)
30 #define open(fname, oflag, mode) _open(fname, oflag, mode)
31 #define fdopen(fd, mode)         _fdopen(fd, mode)
32 #define popen(cmd, mode)         _popen(cmd, mode)
33 #define pclose(file)             _pclose(file)
34
35 #else
36 #include <unistd.h>
37 #define HAVE_MKSTEMP
38 #endif
39
40 #ifndef WITH_LIBCORE
41 #define WITH_LIBCORE
42 #endif
43
44 #include <libfirm/firm.h>
45 #include <libfirm/be.h>
46
47 #include "lexer.h"
48 #include "token_t.h"
49 #include "types.h"
50 #include "type_hash.h"
51 #include "parser.h"
52 #include "ast2firm.h"
53 #include "diagnostic.h"
54 #include "lang_features.h"
55 #include "driver/firm_opt.h"
56 #include "driver/firm_cmdline.h"
57 #include "adt/error.h"
58 #include "write_fluffy.h"
59 #include "revision.h"
60
61 #ifndef PREPROCESSOR
62 #define PREPROCESSOR "cpp -std=c99 -U__WCHAR_TYPE__ -D__WCHAR_TYPE__=int"
63 #endif
64
65 #ifndef LINKER
66 #define LINKER    "gcc -m32"
67 #endif
68
69 #ifndef ASSEMBLER
70 #define ASSEMBLER "as --32"
71 #endif
72
73 /** The current c mode/dialect. */
74 unsigned int c_mode = _C89|_C99|_GNUC;
75
76 /** The 'machine size', 16, 32 or 64 bit, 32bit is the default. */
77 unsigned int machine_size = 32;
78
79 /** true if the char type is signed. */
80 bool char_is_signed = true;
81
82 /** true for strict language checking. */
83 bool strict_mode = false;
84
85 static int            verbose;
86 static struct obstack cppflags_obst;
87
88 #if defined(_DEBUG) || defined(FIRM_DEBUG)
89 /**
90  * Debug printf implementation.
91  *
92  * @param fmt  printf style format parameter
93  */
94 void dbg_printf(const char *fmt, ...)
95 {
96         va_list list;
97
98         if (firm_dump.debug_print) {
99                 va_start(list, fmt);
100                 vprintf(fmt, list);
101                 va_end(list);
102         }  /* if */
103 }
104 #endif /* defined(_DEBUG) || defined(FIRM_DEBUG) */
105
/**
 * Early libFirm setup, run before the command line is parsed: calls
 * firm_early_init() and then passes 1 to dump_consts_local() and
 * dump_keepalive_edges() (presumably switching those dump options on).
 */
static void initialize_firm(void)
{
	firm_early_init();

	dump_consts_local(1);
	dump_keepalive_edges(1);
}
113
/**
 * Derive an output file name from an input file name by replacing its
 * extension.
 *
 * Only a '.' inside the last path component counts as the start of the
 * extension, so dots in directory names ("./foo", "../dir.d/file") are left
 * alone. Without an extension @p newext is simply appended.
 *
 * @param buf        destination buffer for the NUL-terminated result
 * @param buflen     size of @p buf in bytes
 * @param inputname  input file name, or NULL to produce "a" + @p newext
 * @param newext     new extension including its leading dot, e.g. ".s"
 *
 * Calls panic() when the result does not fit into @p buf.
 */
static void get_output_name(char *buf, size_t buflen, const char *inputname,
                            const char *newext)
{
	if (inputname == NULL) {
		snprintf(buf, buflen, "a%s", newext);
		return;
	}

	/* look for the extension only behind the last directory separator */
	const char *last_slash = strrchr(inputname, '/');
	const char *filename   = last_slash != NULL ? last_slash + 1 : inputname;
	const char *last_dot   = strrchr(filename, '.');

	/* number of leading characters of inputname that are kept */
	size_t stem_len = last_dot != NULL ? (size_t)(last_dot - inputname)
	                                   : strlen(inputname);
	/* extension length including the terminating NUL */
	size_t ext_size = strlen(newext) + 1;

	/* written as a subtraction so that the check itself cannot overflow */
	if (stem_len >= buflen || ext_size >= buflen - stem_len) {
		panic("filename too long");
	}

	memcpy(buf, inputname, stem_len);
	memcpy(buf + stem_len, newext, ext_size);
}
142
143 static translation_unit_t *do_parsing(FILE *const in, const char *const input)
144 {
145         lexer_open_stream(in, input);
146         translation_unit_t *unit = parse();
147         return unit;
148 }
149
150 static void lextest(FILE *in, const char *fname)
151 {
152         lexer_open_stream(in, fname);
153
154         do {
155                 lexer_next_preprocessing_token();
156                 print_token(stdout, &lexer_token);
157                 puts("");
158         } while(lexer_token.type != T_EOF);
159 }
160
161 static FILE* preprocess(FILE* in, const char *fname)
162 {
163         char buf[4096];
164         const char *flags = obstack_finish(&cppflags_obst);
165
166         if(in != stdin) {
167                 snprintf(buf, sizeof(buf), PREPROCESSOR " %s %s", flags, fname);
168         } else {
169                 /* read from stdin */
170                 snprintf(buf, sizeof(buf), PREPROCESSOR " %s -", flags);
171         }
172
173         if(verbose) {
174                 puts(buf);
175         }
176         FILE* f = popen(buf, "r");
177         if (f == NULL) {
178                 fprintf(stderr, "invoking preprocessor failed\n");
179                 exit(1);
180         }
181         return f;
182 }
183
184 static void do_link(const char *out, const char *in)
185 {
186         char buf[4096];
187
188         snprintf(buf, sizeof(buf), "%s %s -o %s", LINKER, in, out);
189         if(verbose) {
190                 puts(buf);
191         }
192         int err = system(buf);
193         if(err != 0) {
194                 fprintf(stderr, "linker reported an error\n");
195                 exit(1);
196         }
197 }
198
199 static void assemble(const char *out, const char *in)
200 {
201         char buf[4096];
202
203         snprintf(buf, sizeof(buf), "%s %s -o %s", ASSEMBLER, in, out);
204         if(verbose) {
205                 puts(buf);
206         }
207
208         int err = system(buf);
209         if(err != 0) {
210                 fprintf(stderr, "assembler reported an error\n");
211                 exit(1);
212         }
213 }
214
/**
 * Check whether a directory candidate is usable for temporary files.
 *
 * @param dir  path to probe, may be NULL
 * @return @p dir itself when access() grants read, write and execute
 *         permission on it, NULL otherwise (including for a NULL @p dir)
 */
static const char *try_dir(const char *dir)
{
	if (dir != NULL && access(dir, R_OK | W_OK | X_OK) != 0)
		return NULL;
	return dir;
}
223
/**
 * Find a directory for temporary files.
 *
 * Candidates are probed with try_dir() in this order: the environment
 * variables TMPDIR, TMP and TEMP, then P_tmpdir (when defined), then
 * "/var/tmp", "/usr/tmp" and "/tmp". When none is usable "." is chosen.
 * The result is remembered in a function-local static, so later calls return
 * the first answer.
 *
 * @return the directory name, never NULL
 */
static const char *get_tempdir(void)
{
	static const char *const env_names[] = { "TMPDIR", "TMP", "TEMP" };
	static const char *const fixed_dirs[] = {
#ifdef P_tmpdir
		P_tmpdir,
#endif
		"/var/tmp",
		"/usr/tmp",
		"/tmp"
	};
	static const char *cached = NULL;

	if (cached != NULL)
		return cached;

	for (size_t k = 0; cached == NULL
	     && k < sizeof(env_names) / sizeof(env_names[0]); ++k) {
		cached = try_dir(getenv(env_names[k]));
	}
	for (size_t k = 0; cached == NULL
	     && k < sizeof(fixed_dirs) / sizeof(fixed_dirs[0]); ++k) {
		cached = try_dir(fixed_dirs[k]);
	}

	/* last resort: the current directory */
	if (cached == NULL)
		cached = ".";

	return cached;
}
255
256 #ifndef HAVE_MKSTEMP
257 /* cheap and nasty mkstemp replacement */
258 static int mkstemp(char *templ)
259 {
260         mktemp(templ);
261         return open(templ, O_RDWR|O_CREAT|O_EXCL|O_BINARY, 0600);
262 }
263 #endif
264
/**
 * Create a fresh temporary file inside get_tempdir() and open it for writing.
 *
 * The file name is written to @p buffer. The requested suffix is currently
 * dropped, because mkstemp() does not accept anything after the XXXXXX part
 * of its template.
 *
 * @param buffer  receives the name of the created file
 * @param buflen  size of @p buffer in bytes
 * @param prefix  text placed in front of the generated part of the name
 * @param suffix  ignored, see above
 * @return a stream opened for writing on the new file
 *
 * Prints a message and terminates with exit(1) when the file or its stream
 * cannot be created.
 */
static FILE *make_temp_file(char *buffer, size_t buflen,
                            const char *prefix, const char *suffix)
{
	const char *const dir = get_tempdir();

	/* oh well... mkstemp doesn't accept a suffix after XXXXXX... */
	(void) suffix;
	const char *const used_suffix = "";

	snprintf(buffer, buflen, "%s/%sXXXXXX%s", dir, prefix, used_suffix);

	const int fd = mkstemp(buffer);
	if (fd == -1) {
		fprintf(stderr, "couldn't create temporary file: %s\n",
		        strerror(errno));
		exit(1);
	}

	FILE *const stream = fdopen(fd, "w");
	if (stream == NULL) {
		fprintf(stderr, "couldn't create temporary file FILE*\n");
		exit(1);
	}

	return stream;
}
294
295 /**
296  * Do the necessary lowering for compound parameters.
297  */
298 void lower_compound_params(void)
299 {
300         lower_params_t params;
301
302         params.def_ptr_alignment    = 4;
303         params.flags                = LF_COMPOUND_RETURN | LF_RETURN_HIDDEN;
304         params.hidden_params        = ADD_HIDDEN_ALWAYS_IN_FRONT;
305         params.find_pointer_type    = NULL;
306         params.ret_compound_in_regs = NULL;
307         lower_calls_with_compounds(&params);
308 }
309
/** What the driver does with its input; selected by command line options. */
typedef enum compile_mode_t {
	ParseOnly,            /**< -fsyntax-only */
	Compile,              /**< -S: stop after writing assembler */
	CompileDump,          /**< --dump-function: dump the graph of one function */
	CompileAssemble,      /**< -c: stop after producing an object file */
	CompileAssembleLink,  /**< default: compile, assemble and link */
	LexTest,              /**< --lextest: print the token stream */
	PrintAst,             /**< --print-ast */
	PrintFluffy           /**< --print-fluffy */
} compile_mode_t;
320
/**
 * Print a one-line usage summary to stderr.
 *
 * @param argv0  program name to show in the summary
 */
static void usage(const char *argv0)
{
	fprintf(stderr, "Usage %s input [-o output] [-c]\n", argv0);
}
325
326 int main(int argc, char **argv)
327 {
328         initialize_firm();
329
330         const char     *input        = NULL;
331         const char     *outname      = NULL;
332         const char     *dumpfunction = NULL;
333         compile_mode_t  mode         = CompileAssembleLink;
334
335         obstack_init(&cppflags_obst);
336
337 #define GET_ARG_AFTER(def, args)                                             \
338         def = &arg[sizeof(args)-1];                                              \
339         if(def[0] == '\0') {                                                     \
340                 ++i;                                                                 \
341                 if(i >= argc) {                                                      \
342                         fprintf(stderr, "error: expected argument after '" args "'\n");  \
343                         argument_errors = true;                                          \
344                         break;                                                           \
345                 }                                                                    \
346                 def = argv[i];                                                       \
347                 if(def[0] == '-' && def[1] != '\0') {                                \
348                         fprintf(stderr, "error: expected argument after '" args "'\n");  \
349                         argument_errors = true;                                          \
350                         continue;                                                        \
351                 }                                                                    \
352         }
353
354         bool help_displayed  = false;
355         bool argument_errors = false;
356         for(int i = 1; i < argc; ++i) {
357                 const char *arg = argv[i];
358                 if(strncmp(arg, "-o", 2) == 0) {
359                         GET_ARG_AFTER(outname, "-o");
360                 } else if(strcmp(arg, "-c") == 0) {
361                         mode = CompileAssemble;
362                 } else if(strcmp(arg, "-S") == 0) {
363                         mode = Compile;
364                 } else if(strcmp(arg, "--gcc") == 0) {
365                         c_mode |= _GNUC;
366                 } else if(strcmp(arg, "--no-gcc") == 0) {
367                         c_mode &= ~_GNUC;
368                 } else if(strcmp(arg, "--ms") == 0) {
369                         c_mode |= _MS;
370                 } else if(strcmp(arg, "--signed-chars") == 0) {
371                         char_is_signed = true;
372                 } else if(strcmp(arg, "--unsigned-chars") == 0) {
373                         char_is_signed = false;
374                 } else if(strcmp(arg, "--strict") == 0) {
375                         strict_mode = true;
376                 } else if(strcmp(arg, "--no-ms") == 0) {
377                         c_mode &= ~_MS;
378                 } else if(strcmp(arg, "--lextest") == 0) {
379                         mode = LexTest;
380                 } else if(strcmp(arg, "--print-ast") == 0) {
381                         mode = PrintAst;
382                 } else if(strcmp(arg, "--print-fluffy") == 0) {
383                         mode = PrintFluffy;
384                 } else if(strcmp(arg, "--version") == 0) {
385                         firm_version_t ver;
386                         firm_get_version(&ver);
387                         printf("cparser (%d.%d %s) using libFirm (%u.%u", 0, 1, cparser_REVISION, ver.major, ver.minor);
388                         if(ver.revision[0] != 0) {
389                                 putchar(' ');
390                                 fputs(ver.revision, stdout);
391                         }
392                         if(ver.build[0] != 0) {
393                                 putchar(' ');
394                                 fputs(ver.build, stdout);
395                         }
396                         puts(")\n");
397                         exit(EXIT_SUCCESS);
398                 } else if(strcmp(arg, "-fsyntax-only") == 0) {
399                         mode = ParseOnly;
400                 } else if(strncmp(arg, "-I", 2) == 0) {
401                         const char *opt;
402                         GET_ARG_AFTER(opt, "-I");
403                         obstack_printf(&cppflags_obst, " -I%s", opt);
404                 } else if(strncmp(arg, "-D", 2) == 0) {
405                         const char *opt;
406                         GET_ARG_AFTER(opt, "-D");
407                         obstack_printf(&cppflags_obst, " -D%s", opt);
408                 } else if(strncmp(arg, "-U", 2) == 0) {
409                         const char *opt;
410                         GET_ARG_AFTER(opt, "-U");
411                         obstack_printf(&cppflags_obst, " -U%s", opt);
412                 } else if(strcmp(arg, "--dump-function") == 0) {
413                         ++i;
414                         if(i >= argc) {
415                                 fprintf(stderr, "error: "
416                                         "expected argument after '--dump-function'\n");
417                                 argument_errors = true;
418                                 break;
419                         }
420                         dumpfunction = argv[i];
421                         mode         = CompileDump;
422                 } else if(strcmp(arg, "-v") == 0) {
423                         verbose = 1;
424                 } else if(arg[0] == '-' && arg[1] == 'f') {
425                         const char *opt;
426                         GET_ARG_AFTER(opt, "-f");
427
428                         if(strcmp(opt, "omit-frame-pointer") == 0) {
429                                 firm_be_option("omitfp");
430                         } else if(strcmp(opt, "no-omit-frame-pointer") == 0) {
431                                 firm_be_option("omitfp=no");
432                         } else {
433                                 int res = firm_option(opt);
434                                 if (res == 0) {
435                                         fprintf(stderr, "error: unknown Firm option '-f %s'\n",
436                                                 opt);
437                                         argument_errors = true;
438                                         continue;
439                                 } else if (res == -1) {
440                                         help_displayed = true;
441                                 }
442                         }
443                 } else if(arg[0] == '-' && arg[1] == 'b') {
444                         const char *opt;
445                         GET_ARG_AFTER(opt, "-b");
446                         int res = firm_be_option(opt);
447                         if (res == 0) {
448                                 fprintf(stderr, "error: unknown Firm backend option '-b %s'\n",
449                                         opt);
450                                 argument_errors = true;
451                         } else if (res == -1) {
452                                 help_displayed = true;
453                         }
454                 } else if(arg[0] == '-' && arg[1] == 'm') {
455                         const char *opt;
456                         GET_ARG_AFTER(opt, "-m");
457                         char *endptr;
458                         long int value = strtol(opt, &endptr, 10);
459                         if (*endptr != '\0') {
460                                 fprintf(stderr, "error: wrong option '-m %s'\n",  opt);
461                                 argument_errors = true;
462                         }
463                         if (value != 16 && value != 32 && value != 64) {
464                                 fprintf(stderr, "error: option -m supports only 16, 32 or 64\n");
465                                 argument_errors = true;
466                         } else {
467                                 machine_size = (unsigned int)value;
468                         }
469                 } else if(arg[0] == '-') {
470                         if (arg[1] == '\0') {
471                                 if(input != NULL) {
472                                         fprintf(stderr, "error: multiple input files specified\n");
473                                         argument_errors = true;
474                                 } else {
475                                         input = arg;
476                                 }
477                         } else if(strcmp(arg, "-pedantic") == 0) {
478                                 fprintf(stderr, "warning: ignoring gcc option '%s'\n", arg);
479                         } else if(arg[1] == 'O' ||
480                                         arg[1] == 'W' ||
481                                         arg[1] == 'g' ||
482                                         strncmp(arg + 1, "std=", 4) == 0) {
483                                 fprintf(stderr, "warning: ignoring gcc option '%s'\n", arg);
484                         } else {
485                                 fprintf(stderr, "error: unknown argument '%s'\n", arg);
486                                 argument_errors = true;
487                         }
488                 } else {
489                         if(input != NULL) {
490                                 fprintf(stderr, "error: multiple input files specified\n");
491                                 argument_errors = true;
492                         } else {
493                                 input = arg;
494                         }
495                 }
496         }
497
498         /* we do the lowering in ast2firm */
499         firm_opt.lower_bitfields = FALSE;
500
501         if(help_displayed) {
502                 return !argument_errors;
503         }
504         if(argument_errors) {
505                 usage(argv[0]);
506                 return 1;
507         }
508
509         gen_firm_init();
510         init_symbol_table();
511         init_tokens();
512         init_types();
513         init_typehash();
514         init_basic_types();
515         init_lexer();
516         init_ast();
517         init_parser();
518         init_ast2firm();
519
520         FILE *out = NULL;
521         char  outnamebuf[4096];
522         if(outname == NULL) {
523                 switch(mode) {
524                 case PrintAst:
525                 case PrintFluffy:
526                 case LexTest:
527                         if(outname == NULL)
528                                 outname = "-";
529                         break;
530                 case ParseOnly:
531                         break;
532                 case Compile:
533                         get_output_name(outnamebuf, sizeof(outnamebuf), input, ".s");
534                         outname = outnamebuf;
535                         break;
536                 case CompileAssemble:
537                         get_output_name(outnamebuf, sizeof(outnamebuf), input, ".o");
538                         outname = outnamebuf;
539                         break;
540                 case CompileDump:
541                         get_output_name(outnamebuf, sizeof(outnamebuf), dumpfunction,
542                                         ".vcg");
543                         outname = outnamebuf;
544                         break;
545                 case CompileAssembleLink:
546                         outname = "a.out";
547                         break;
548                 }
549         }
550
551         if(outname != NULL) {
552                 if(strcmp(outname, "-") == 0) {
553                         out = stdout;
554                 } else {
555                         out = fopen(outname, "w");
556                         if(out == NULL) {
557                                 fprintf(stderr, "Couldn't open '%s' for writing: %s\n", outname,
558                                         strerror(errno));
559                                 return 1;
560                         }
561                 }
562         }
563
564         FILE *in;
565         if(input == NULL) {
566                 fprintf(stderr, "%s: no input files\n", argv[0]);
567                 return 1;
568         } else if(strcmp(input, "-") == 0) {
569                 in    = stdin;
570                 input = "<stdin>";
571         } else {
572                 in = fopen(input, "r");
573                 if(in == NULL) {
574                         fprintf(stderr, "Couldn't open '%s': %s\n", input, strerror(errno));
575                         return 1;
576                 }
577         }
578
579         if(mode == LexTest) {
580                 lextest(in, input);
581                 fclose(in);
582                 return 0;
583         }
584
585         FILE *preprocessed_in = preprocess(in, input);
586         translation_unit_t *const unit = do_parsing(preprocessed_in, input);
587         pclose(preprocessed_in);
588         if(unit == NULL) {
589                 /* parsing failed because of errors */
590                 fprintf(stderr, "%u error(s), %u warnings\n", error_count, warning_count);
591                 return EXIT_FAILURE;
592         }
593         if (warning_count > 0) {
594                 fprintf(stderr, "%u warnings\n", warning_count);
595         }
596
597         if(mode == PrintAst) {
598                 type_set_output(out);
599                 ast_set_output(out);
600                 print_ast(unit);
601                 return 0;
602         }
603         if(mode == PrintFluffy) {
604                 type_set_output(out);
605                 ast_set_output(out);
606                 write_fluffy_decls(out, unit);
607         }
608
609         translation_unit_to_firm(unit);
610
611         if(mode == ParseOnly) {
612                 return 0;
613         }
614
615         FILE *asm_out;
616         char  asm_tempfile[1024];
617         if(mode == CompileDump) {
618                 asm_out = NULL;
619                 firm_be_opt.selection = BE_NONE;
620         } else if(mode == Compile) {
621                 asm_out = out;
622         } else {
623                 asm_out
624                         = make_temp_file(asm_tempfile, sizeof(asm_tempfile), "cc", ".s");
625         }
626         gen_firm_finish(asm_out, input, /*c_mode=*/1, /*firm_const_exists=*/0);
627
628         if(mode == CompileDump) {
629                 /* find irg */
630                 ident    *id     = new_id_from_str(dumpfunction);
631                 ir_graph *irg    = NULL;
632                 int       n_irgs = get_irp_n_irgs();
633                 for(int i = 0; i < n_irgs; ++i) {
634                         ir_graph *tirg   = get_irp_irg(i);
635                         ident    *irg_id = get_entity_ident(get_irg_entity(tirg));
636                         if(irg_id == id) {
637                                 irg = tirg;
638                                 break;
639                         }
640                 }
641
642                 if(irg == NULL) {
643                         fprintf(stderr, "No graph for function '%s' found\n", dumpfunction);
644                         return 1;
645                 }
646
647                 dump_ir_block_graph_file(irg, out);
648                 fclose(out);
649                 return 0;
650         }
651
652         fclose(asm_out);
653
654         /* assemble assembler and create object file */
655         char obj_tfile[1024];
656         if(mode == CompileAssemble || mode == CompileAssembleLink) {
657                 const char *obj_outfile;
658                 if(mode == CompileAssemble) {
659                         fclose(out);
660                         obj_outfile = outname;
661                 } else {
662                         FILE *tempf
663                                 = make_temp_file(obj_tfile, sizeof(obj_tfile), "cc", ".o");
664                         fclose(tempf);
665                         obj_outfile = obj_tfile;
666                 }
667
668                 assemble(obj_outfile, asm_tempfile);
669         }
670
671         /* link object file */
672         if(mode == CompileAssembleLink) {
673                 do_link(outname, obj_tfile);
674         }
675
676         obstack_free(&cppflags_obst, NULL);
677
678         exit_ast2firm();
679         exit_parser();
680         exit_ast();
681         exit_lexer();
682         exit_typehash();
683         exit_types();
684         exit_tokens();
685         exit_symbol_table();
686         return 0;
687 }