2 * Copyright (C) 1995-2008 University of Karlsruhe. All rights reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief Main Backend driver.
23 * @author Sebastian Hack
33 #include "lc_opts_enum.h"
43 #include "iredges_t.h"
48 #include "iroptimize.h"
51 #include "irprofile.h"
60 #include "belistsched.h"
63 #include "bechordal_t.h"
65 #include "beifg_impl.h"
66 #include "becopyopt.h"
67 #include "becopystat.h"
68 #include "bessadestr.h"
71 #include "beschedmris.h"
74 #include "be_dbgout.h"
77 #define NEW_ID(s) new_id_from_chars(s, sizeof(s) - 1)
80 #include "beilpsched.h"
/*
 * Default backend options. The entries of be_main_options (further down in
 * this file) take the addresses of the fields of this struct.
 * NOTE(review): the initializer is positional, so the order of the values
 * has to match the field order of be_options_t, which is declared elsewhere.
 */
83 /* options visible for anyone */
84 static be_options_t be_options = {
85 DUMP_NONE, /* dump flags */
86 BE_TIME_OFF, /* no timing */
87 0, /* no opt profile */
88 0, /* try to omit frame pointer */
89 0, /* try to omit leaf frame pointer */
90 0, /* create PIC code */
91 0, /* create gprof compatible profiling code */
92 BE_VRFY_WARN, /* verification level: warn */
93 BE_SCHED_LIST, /* scheduler: list scheduler */
94 "linux", /* target OS name */
/* NOTE(review): a site-specific host name is hard-coded as the default. */
95 "i44pc52.info.uni-karlsruhe.de", /* ilp server */
96 "cplex", /* ilp solver */
97 0, /* enable statistic event dumping */
98 "", /* print stat events */
/* Path of an additional option file; target of the "config" option and
 * opened in be_main() when it is not empty. */
102 static char config_file[256] = { 0 };
104 /* back end instruction set architecture to use */
/* Starts out as NULL; its address is handed to be_add_module_list_opt() in
 * be_opt_register() for the "isa" option. */
105 static const arch_isa_if_t *isa_if = NULL;
107 /* possible dumping options */
/* Maps the names accepted by the "dump" option to DUMP_* flag values. */
108 static const lc_opt_enum_mask_items_t dump_items[] = {
109 { "none", DUMP_NONE },
110 { "initial", DUMP_INITIAL },
112 { "sched", DUMP_SCHED },
113 { "prepared", DUMP_PREPARED },
114 { "regalloc", DUMP_RA },
115 { "final", DUMP_FINAL },
/* NOTE(review): 2 * DUMP_BE - 1 yields DUMP_BE plus every lower bit; this
 * assumes DUMP_BE is the highest single-bit dump flag - TODO confirm. */
117 { "all", 2 * DUMP_BE - 1 },
121 /* verify options. */
/* Maps the names accepted by the "verify" option to BE_VRFY_* values. */
122 static const lc_opt_enum_int_items_t vrfy_items[] = {
123 { "off", BE_VRFY_OFF },
124 { "warn", BE_VRFY_WARN },
125 { "assert", BE_VRFY_ASSERT },
129 /* scheduling options. */
/* Maps the names accepted by the "sched" option to BE_SCHED_* values.
 * NOTE(review): the "ilp" entry is followed by an #endif for WITH_ILP, so it
 * is presumably only compiled in when WITH_ILP is defined. */
130 static const lc_opt_enum_int_items_t sched_items[] = {
131 { "list", BE_SCHED_LIST },
133 { "ilp", BE_SCHED_ILP },
134 #endif /* WITH_ILP */
/* Binds the "dump" item table to be_options.dump_flags. */
138 static lc_opt_enum_mask_var_t dump_var = {
139 &be_options.dump_flags, dump_items
/* Binds the "verify" item table to be_options.vrfy_option. */
142 static lc_opt_enum_int_var_t vrfy_var = {
143 &be_options.vrfy_option, vrfy_items
/* Binds the "sched" item table to be_options.scheduler. */
146 static lc_opt_enum_int_var_t sched_var = {
147 &be_options.scheduler, sched_items
/*
 * Option table of the backend; be_opt_register() adds it to the "be" option
 * group. Each entry names an option, gives its help text and points at the
 * variable that receives the value.
 */
150 static const lc_opt_table_entry_t be_main_options[] = {
151 LC_OPT_ENT_STR ("config", "read another config file containing backend options", config_file, sizeof(config_file)),
152 LC_OPT_ENT_ENUM_MASK("dump", "dump irg on several occasions", &dump_var),
153 LC_OPT_ENT_BOOL ("omitfp", "omit frame pointer", &be_options.omit_fp),
154 LC_OPT_ENT_BOOL ("omitleaffp", "omit frame pointer in leaf routines", &be_options.omit_leaf_fp),
155 LC_OPT_ENT_BOOL ("pic", "create PIC code", &be_options.pic),
156 LC_OPT_ENT_BOOL ("gprof", "create gprof profiling code", &be_options.gprof),
/* NOTE(review): vrfy_var and sched_var are lc_opt_enum_int_var_t but are
 * registered through LC_OPT_ENT_ENUM_PTR - confirm this is the intended
 * macro for int-valued enums. */
157 LC_OPT_ENT_ENUM_PTR ("verify", "verify the backend irg", &vrfy_var),
158 LC_OPT_ENT_BOOL ("time", "get backend timing statistics", &be_options.timing),
159 LC_OPT_ENT_BOOL ("profile", "instrument the code for execution count profiling", &be_options.opt_profile),
160 LC_OPT_ENT_ENUM_PTR ("sched", "select a scheduler", &sched_var),
/* NOTE(review): "os" and "filtev" pass the address of the buffer
 * (&be_options.x) while "config" and the ilp.* entries pass the buffer
 * itself; the pointer types differ - consider making them consistent. */
161 LC_OPT_ENT_STR ("os", "specify target operating system", &be_options.target_os, sizeof(be_options.target_os)),
162 #ifdef FIRM_STATISTICS
163 LC_OPT_ENT_BOOL ("statev", "dump statistic events", &be_options.statev),
/* NOTE(review): the help text below has an unbalanced opening parenthesis. */
164 LC_OPT_ENT_STR ("filtev", "filter for stat events (regex if support is active", &be_options.filtev, sizeof(be_options.filtev)),
168 LC_OPT_ENT_STR ("ilp.server", "the ilp server name", be_options.ilp_server, sizeof(be_options.ilp_server)),
169 LC_OPT_ENT_STR ("ilp.solver", "the ilp solver name", be_options.ilp_solver, sizeof(be_options.ilp_solver)),
170 #endif /* WITH_ILP */
/* List of registered ISA interfaces; be_register_isa_if() adds entries. */
174 static be_module_list_entry_t *isa_ifs = NULL;
/* Flag table with one entry per character code; filled by
 * be_init_default_asm_constraint_flags() and read in
 * be_parse_asm_constraints(). */
177 unsigned short asm_constraint_flags[256];
/*
 * Stores the default flags for the constraint and modifier characters
 * listed below in asm_constraint_flags[]. Only the listed entries are
 * assigned here; every other entry keeps the value it had before the call.
 */
179 void be_init_default_asm_constraint_flags(void)
/* characters flagged as not supported */
181 asm_constraint_flags['?'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
182 asm_constraint_flags['!'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
183 asm_constraint_flags['&'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT
184 | ASM_CONSTRAINT_FLAG_MODIFIER_EARLYCLOBBER;
185 asm_constraint_flags['%'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT
186 | ASM_CONSTRAINT_FLAG_MODIFIER_COMMUTATIVE;
/* NOTE(review): '!' was already assigned the same value above; this line is
 * redundant, or a different character was intended. */
187 asm_constraint_flags['!'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
/* read/write modifiers */
189 asm_constraint_flags['='] = ASM_CONSTRAINT_FLAG_MODIFIER_WRITE
190 | ASM_CONSTRAINT_FLAG_MODIFIER_NO_READ;
191 asm_constraint_flags['+'] = ASM_CONSTRAINT_FLAG_MODIFIER_READ
192 | ASM_CONSTRAINT_FLAG_MODIFIER_WRITE;
/* characters that accept an immediate */
194 asm_constraint_flags['i'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
195 asm_constraint_flags['s'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
196 asm_constraint_flags['E'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
197 asm_constraint_flags['F'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
198 asm_constraint_flags['G'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
199 asm_constraint_flags['H'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
200 asm_constraint_flags['I'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
201 asm_constraint_flags['J'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
202 asm_constraint_flags['K'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
203 asm_constraint_flags['L'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
204 asm_constraint_flags['M'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
205 asm_constraint_flags['N'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
206 asm_constraint_flags['O'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
207 asm_constraint_flags['P'] = ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
/* characters that accept a memory operand */
209 asm_constraint_flags['m'] = ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP;
210 asm_constraint_flags['o'] = ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP;
211 asm_constraint_flags['V'] = ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP;
212 asm_constraint_flags['<'] = ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP;
213 asm_constraint_flags['>'] = ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP;
/* characters that accept a register ('p' and the digits '0'..'9') */
215 asm_constraint_flags['p'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
216 asm_constraint_flags['0'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
217 asm_constraint_flags['1'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
218 asm_constraint_flags['2'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
219 asm_constraint_flags['3'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
220 asm_constraint_flags['4'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
221 asm_constraint_flags['5'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
222 asm_constraint_flags['6'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
223 asm_constraint_flags['7'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
224 asm_constraint_flags['8'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
225 asm_constraint_flags['9'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER;
/* 'X' accepts register, memory operand and immediate alike */
227 asm_constraint_flags['X'] = ASM_CONSTRAINT_FLAG_SUPPORTS_REGISTER
228 | ASM_CONSTRAINT_FLAG_SUPPORTS_MEMOP
229 | ASM_CONSTRAINT_FLAG_SUPPORTS_IMMEDIATE;
231 /* these should have been caught by the parsing code already */
232 asm_constraint_flags['#'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
233 asm_constraint_flags['*'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
234 asm_constraint_flags[' '] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
235 asm_constraint_flags['\t'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
236 asm_constraint_flags['\n'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
237 asm_constraint_flags['\r'] = ASM_CONSTRAINT_FLAG_NO_SUPPORT;
/*
 * Walks the constraint string character by character and accumulates
 * ASM_CONSTRAINT_FLAG_* bits for it. Flags are looked up in
 * asm_constraint_flags[] and also obtained from the
 * isa_if->parse_asm_constraint() callback.
 * NOTE(review): several lines of this function are not visible here; check
 * the conditions that guard the statements below against the full source.
 */
240 asm_constraint_flags_t be_parse_asm_constraints(const char *constraint)
242 asm_constraint_flags_t flags = 0;
244 asm_constraint_flags_t tflags;
246 for (c = constraint; *c != '\0'; ++c) {
249 /* 'comment' stuff */
250 while(*c != 0 && *c != ',')
254 /* 'comment' character */
/* NOTE(review): if plain char is signed and *c is negative, (int) *c is a
 * negative index into the 256-entry table; a cast to unsigned char would
 * keep the index in range. */
263 tflags = asm_constraint_flags[(int) *c];
267 flags |= isa_if->parse_asm_constraint(&c);
/* Contradictory modifiers (WRITE with NO_WRITE, READ with NO_READ) appear
 * to be what marks the result as invalid. */
274 flags & ASM_CONSTRAINT_FLAG_MODIFIER_WRITE &&
275 flags & ASM_CONSTRAINT_FLAG_MODIFIER_NO_WRITE
277 flags & ASM_CONSTRAINT_FLAG_MODIFIER_READ &&
278 flags & ASM_CONSTRAINT_FLAG_MODIFIER_NO_READ
280 flags |= ASM_CONSTRAINT_FLAG_INVALID;
/* With none of the four read/write modifier bits set, READ is the default. */
282 if (!(flags & (ASM_CONSTRAINT_FLAG_MODIFIER_READ |
283 ASM_CONSTRAINT_FLAG_MODIFIER_WRITE |
284 ASM_CONSTRAINT_FLAG_MODIFIER_NO_WRITE |
285 ASM_CONSTRAINT_FLAG_MODIFIER_NO_READ)
287 flags |= ASM_CONSTRAINT_FLAG_MODIFIER_READ;
/*
 * Checks a clobber name. "memory" and "cc" are handled here; any other name
 * is passed to isa_if->is_valid_clobber() and that result is returned.
 * NOTE(review): the statements executed for "memory" and "cc" are not
 * visible here; the comments suggest both are reported as valid.
 */
293 int be_is_valid_clobber(const char *clobber)
295 /* memory is a valid clobber. (the frontend has to detect this case too,
296 * because it has to add memory edges to the asm) */
297 if (strcmp(clobber, "memory") == 0)
299 /* cc (condition code) is always valid */
300 if (strcmp(clobber, "cc") == 0)
303 return isa_if->is_valid_clobber(clobber);
/*
 * Adds the ISA interface 'isa' under the given name to the isa_ifs module
 * list. The const qualifier is cast away because the list stores void*.
 */
306 void be_register_isa_if(const char *name, const arch_isa_if_t *isa)
311 be_add_module_to_list(&isa_ifs, name, (void*) isa);
/*
 * Registers the backend options: adds be_main_options to the "be" option
 * group and adds the "isa" module-list option, which is given the address
 * of isa_if.
 * NOTE(review): run_once is a function-local static, presumably a guard
 * against repeated registration; the check itself is not visible here.
 */
314 void be_opt_register(void)
316 lc_opt_entry_t *be_grp;
317 static int run_once = 0;
323 be_grp = lc_opt_get_grp(firm_opt_get_root(), "be");
324 lc_opt_add_table(be_grp, be_main_options);
326 be_add_module_list_opt(be_grp, "isa", "the instruction set architecture",
327 &isa_ifs, (void**) &isa_if);
332 /* Parse one argument. */
/*
 * The argument "help" or "?" prints the help of the "be" option group to
 * stdout. Any other argument is handed to lc_opt_from_single_arg() and its
 * result is returned.
 * NOTE(review): the value returned after printing help is not visible here.
 */
333 int be_parse_arg(const char *arg) {
334 lc_opt_entry_t *be_grp = lc_opt_get_grp(firm_opt_get_root(), "be");
335 if (strcmp(arg, "help") == 0 || (arg[0] == '?' && arg[1] == '\0')) {
336 lc_opt_print_help_for_entry(be_grp, '-', stdout);
339 return lc_opt_from_single_arg(be_grp, NULL, arg, NULL);
342 /** The be parameters returned by default, all off. */
/* NOTE(review): positional initializer; the value order has to match the
 * field order of backend_params, which is declared elsewhere. */
343 static const backend_params be_params = {
344 0, /* need dword lowering */
345 0, /* don't support inline assembler yet */
346 NULL, /* will be set later */
347 NULL, /* but yet no creator function */
348 NULL, /* context for create_intrinsic_fkt */
349 NULL, /* no if conversion settings */
350 NULL, /* no float arithmetic mode */
351 0, /* no trampoline support: size 0 */
352 0, /* no trampoline support: align 0 */
353 NULL, /* no trampoline support: no trampoline builder */
354 4 /* alignment of stack parameter */
357 /* Perform schedule verification if requested. */
/*
 * BE_VRFY_WARN runs be_verify_schedule() and ignores its result;
 * BE_VRFY_ASSERT asserts that the verification succeeded. No other value of
 * vrfy_opt is handled in the lines visible here.
 * NOTE(review): in the ASSERT case the call sits inside assert(), so it is
 * compiled out entirely when NDEBUG is defined and nothing is verified.
 */
358 static void be_sched_vrfy(be_irg_t *birg, int vrfy_opt) {
359 if (vrfy_opt == BE_VRFY_WARN) {
360 be_verify_schedule(birg);
361 } else if (vrfy_opt == BE_VRFY_ASSERT) {
362 assert(be_verify_schedule(birg) && "Schedule verification failed.");
366 /* Initialize the Firm backend. Must be run first in init_firm()! */
367 void firm_be_init(void)
373 /* Finalize the Firm backend. */
374 void firm_be_finish(void)
379 /* Returns the backend parameter */
/*
 * If the selected ISA provides a get_params callback, its result is
 * returned. The fallback path is not visible here (presumably the default
 * be_params - TODO confirm).
 * NOTE(review): isa_if is dereferenced without a NULL check although it is
 * initialised to NULL; callers must have selected an ISA first.
 */
380 const backend_params *be_get_backend_param(void)
382 if (isa_if->get_params)
383 return isa_if->get_params();
/*
 * Zeroes *env, points it at be_options, creates the trampoline and PIC
 * symbol maps with their helper types, clears asm_constraint_flags[] and
 * finally creates the architecture environment via arch_env_init().
 */
388 * Initializes the main environment for the backend.
390 * @param env an empty environment
391 * @param file_handle the file handle where the output will be written to
393 static be_main_env_t *be_init_env(be_main_env_t *env, FILE *file_handle)
395 memset(env, 0, sizeof(*env));
396 env->options = &be_options;
397 env->ent_trampoline_map = pmap_create();
398 env->pic_trampolines_type = new_type_class(NEW_ID("$PIC_TRAMPOLINE_TYPE"));
399 env->ent_pic_symbol_map = pmap_create();
400 env->pic_symbols_type = new_type_struct(NEW_ID("$PIC_SYMBOLS_TYPE"));
/* NOTE(review): presumably takes the two helper types out of the program's
 * type list again so that only env refers to them - confirm. */
402 remove_irp_type(env->pic_trampolines_type);
403 remove_irp_type(env->pic_symbols_type);
404 set_class_final(env->pic_trampolines_type, 1);
/* The flag table is cleared before the ISA is initialised. */
406 memset(asm_constraint_flags, 0, sizeof(asm_constraint_flags));
407 env->arch_env = arch_env_init(isa_if, file_handle, env);
/*
 * Releases what be_init_env() set up: the architecture environment, the two
 * pmaps and the two helper types.
 */
414 * Called when the be_main_env_t can be destroyed.
416 static void be_done_env(be_main_env_t *env)
418 arch_env_done(env->arch_env);
421 pmap_destroy(env->ent_trampoline_map);
422 pmap_destroy(env->ent_pic_symbol_map);
423 free_type(env->pic_trampolines_type);
424 free_type(env->pic_symbols_type);
/*
 * Calls be_dump(irg, suffix, dumper) only when at least one bit of 'mask'
 * is set in be_options.dump_flags; otherwise does nothing.
 */
428 * A wrapper around a firm dumper. Dumps only, if
431 * @param mask a bitmask containing the reason what will be dumped
432 * @param irg the IR graph to dump
433 * @param suffix the suffix for the dumper
434 * @param dumper the dumper to be called
436 static void dump(int mask, ir_graph *irg, const char *suffix,
437 void (*dumper)(ir_graph *, const char *))
439 if(be_options.dump_flags & mask)
440 be_dump(irg, suffix, dumper);
/*
 * Zeroes *birg, links it to the main environment, initialises its obstack
 * and then normalises the graph for the backend: Proj normalisation, return
 * normalisation and removal of critical control flow edges. Afterwards the
 * graph is put into phase_backend and the backend info is initialised.
 * Dumps are written before ("-begin") and after ("-prepared") when
 * DUMP_INITIAL is enabled.
 */
444 * Prepare a backend graph for code generation and initialize its birg
446 static void initialize_birg(be_irg_t *birg, ir_graph *irg, be_main_env_t *env)
448 memset(birg, 0, sizeof(*birg));
450 birg->main_env = env;
451 obstack_init(&birg->obst);
/* NOTE(review): deactivate followed by activate presumably forces the
 * dependency edges to be rebuilt from scratch - confirm. */
453 edges_deactivate_kind(irg, EDGE_KIND_DEP);
454 edges_activate_kind(irg, EDGE_KIND_DEP);
456 dump(DUMP_INITIAL, irg, "-begin", dump_ir_block_graph);
458 /* set the current graph (this is important for several firm functions) */
459 current_ir_graph = irg;
461 /* Normalize proj nodes. */
462 normalize_proj_nodes(irg);
464 /* we do this before critical edge split. As this produces less returns,
465 because sometimes (= 164.gzip) multiple returns are slower */
466 normalize_n_returns(irg);
468 /* Remove critical edges */
469 remove_critical_cf_edges_ex(irg, /*ignore_exception_edges=*/0);
471 /* Ensure, that the ir_edges are computed. */
474 set_irg_phase_state(irg, phase_backend);
475 be_info_init_irg(irg);
477 dump(DUMP_INITIAL, irg, "-prepared", dump_ir_block_graph);
/* Executes 'code' only when the be_timing flag is set. */
480 #define BE_TIMER_ONLY(code) do { if (be_timing) { code; } } while(0)
/* Timers for the individual backend phases; they are registered at the
 * start of be_main_loop(). */
484 ir_timer_t *t_codegen;
485 ir_timer_t *t_ra_preparation;
487 ir_timer_t *t_constr;
488 ir_timer_t *t_finish;
491 ir_timer_t *t_verify;
492 ir_timer_t *t_heights;
494 ir_timer_t *t_execfreq;
495 ir_timer_t *t_ssa_constr;
496 ir_timer_t *t_ra_constr;
497 ir_timer_t *t_ra_prolog;
498 ir_timer_t *t_ra_epilog;
499 ir_timer_t *t_ra_spill;
500 ir_timer_t *t_ra_spill_apply;
501 ir_timer_t *t_ra_color;
502 ir_timer_t *t_ra_ifg;
503 ir_timer_t *t_ra_copymin;
504 ir_timer_t *t_ra_ssa;
505 ir_timer_t *t_ra_other;
508 * The Firm backend main loop.
509 * Do architecture specific lowering for all graphs
510 * and call the architecture specific code generator.
512 * @param file_handle the file handle the output will be written to
513 * @param cup_name name of the compilation unit
/*
 * Outline of the visible steps: register the phase timers, set up the main
 * environment, initialise one be_irg_t per graph, set up profiling
 * (instrument or read "<cup_name>.prof"), then for every graph run
 * verification, ABI introduction, code selection, execution frequency
 * computation, scheduling, constraint handling, register allocation, stack
 * fixing, final verification and emission, and finally report the timers.
 * NOTE(review): many lines of this function are not visible here, including
 * the closing lines of two block comments, so read it next to the full
 * source before changing it.
 */
515 static void be_main_loop(FILE *file_handle, const char *cup_name)
517 static const char suffix[] = ".prof";
519 int i, num_birgs, stat_active = 0;
521 char prof_filename[256];
523 ir_graph **irg_list, **backend_irg_list;
524 arch_env_t *arch_env;
526 be_timing = (be_options.timing == BE_TIME_ON);
529 t_abi = ir_timer_register("bemain_time_beabi", "be abi introduction");
530 t_codegen = ir_timer_register("bemain_time_codegen", "codegeneration");
531 t_ra_preparation = ir_timer_register("bemain_time_ra_preparation", "ra preparation");
532 t_sched = ir_timer_register("bemain_time_sched", "scheduling");
533 t_constr = ir_timer_register("bemain_time_constr", "assure constraints");
534 t_finish = ir_timer_register("bemain_time_finish", "graph finish");
535 t_emit = ir_timer_register("bemain_time_emiter", "code emiter");
536 t_verify = ir_timer_register("bemain_time_verify", "graph verification");
537 t_other = ir_timer_register("bemain_time_other", "other");
538 t_heights = ir_timer_register("bemain_time_heights", "heights");
539 t_live = ir_timer_register("bemain_time_liveness", "be liveness");
540 t_execfreq = ir_timer_register("bemain_time_execfreq", "execfreq");
541 t_ssa_constr = ir_timer_register("bemain_time_ssa_constr", "ssa reconstruction");
542 t_ra_prolog = ir_timer_register("bemain_time_ra_prolog", "regalloc prolog");
543 t_ra_epilog = ir_timer_register("bemain_time_ra_epilog", "regalloc epilog");
544 t_ra_constr = ir_timer_register("bemain_time_ra_constr", "regalloc constraints");
545 t_ra_spill = ir_timer_register("bemain_time_ra_spill", "spiller");
547 = ir_timer_register("bemain_time_ra_spill_apply", "apply spills");
548 t_ra_color = ir_timer_register("bemain_time_ra_color", "graph coloring");
549 t_ra_ifg = ir_timer_register("bemain_time_ra_ifg", "interference graph");
550 t_ra_copymin = ir_timer_register("bemain_time_ra_copymin", "copy minimization");
551 t_ra_ssa = ir_timer_register("bemain_time_ra_ssadestr", "ssa destruction");
552 t_ra_other = ir_timer_register("bemain_time_ra_other", "regalloc other");
555 be_init_env(&env, file_handle);
556 env.cup_name = cup_name;
561 arch_env = env.arch_env;
563 /* backend may provide an ordered list of irgs where code should be
565 irg_list = NEW_ARR_F(ir_graph *, 0);
566 backend_irg_list = arch_env_get_backend_irg_list(arch_env, &irg_list);
568 /* we might need 1 birg more for instrumentation constructor */
569 num_birgs = backend_irg_list ? ARR_LEN(backend_irg_list) : get_irp_n_irgs();
570 birgs = ALLOCAN(be_irg_t, num_birgs + 1);
574 /* First: initialize all birgs */
575 for(i = 0; i < num_birgs; ++i) {
576 ir_graph *irg = backend_irg_list ? backend_irg_list[i] : get_irp_irg(i);
577 irg->be_data = &birgs[i];
578 initialize_birg(&birgs[i], irg, &env);
580 arch_env_handle_intrinsics(arch_env);
584 Get the filename for the profiling data.
585 Beware: '\0' is already included in sizeof(suffix)
/* The buffer is zeroed first and strncpy() copies at most
 * sizeof(prof_filename) - sizeof(suffix) bytes, so the name stays
 * NUL-terminated and the strcat() of the suffix always fits. A longer
 * cup_name is cut off without any message. */
587 memset(prof_filename, 0, sizeof(prof_filename));
588 strncpy(prof_filename, cup_name, sizeof(prof_filename) - sizeof(suffix));
589 strcat(prof_filename, suffix);
592 Next: Either instruments all irgs with profiling code
593 or try to read in profile data for current translation unit.
595 if (be_options.opt_profile) {
/* The graph returned by the instrumentation gets the spare birg slot at
 * index num_birgs (the array was allocated with num_birgs + 1 entries). */
596 ir_graph *prof_init_irg = ir_profile_instrument(prof_filename, profile_default);
597 initialize_birg(&birgs[num_birgs], prof_init_irg, &env);
600 ir_profile_read(prof_filename);
603 #ifdef FIRM_STATISTICS
604 stat_active = stat_is_active();
605 #endif /* FIRM_STATISTICS */
608 for (i = 0; i < num_birgs; ++i) {
609 be_irg_t *birg = &birgs[i];
610 ir_graph *irg = birg->irg;
611 optimization_state_t state;
612 const arch_code_generator_if_t *cg_if;
614 /* set the current graph (this is important for several firm functions) */
615 current_ir_graph = irg;
618 stat_ev_ctx_push_fobj("bemain_irg", irg);
619 be_stat_ev("bemain_insns_start", be_count_insns(irg));
620 be_stat_ev("bemain_blocks_start", be_count_blocks(irg));
623 /* stop and reset timers */
624 BE_TIMER_PUSH(t_other); /* t_other */
626 /* Verify the initial graph */
627 BE_TIMER_PUSH(t_verify);
/* NOTE(review): in BE_VRFY_ASSERT mode here and further down the verifier
 * calls sit inside assert(); with NDEBUG defined they are compiled out and
 * no verification happens at all. */
628 if (be_options.vrfy_option == BE_VRFY_WARN) {
629 irg_verify(irg, VRFY_ENFORCE_SSA);
630 be_check_dominance(irg);
631 } else if (be_options.vrfy_option == BE_VRFY_ASSERT) {
632 assert(irg_verify(irg, VRFY_ENFORCE_SSA) && "irg verification failed");
633 assert(be_check_dominance(irg) && "Dominance verification failed");
635 BE_TIMER_POP(t_verify);
637 /* Get the code generator interface. */
638 cg_if = arch_env_get_code_generator_if(arch_env);
640 /* get a code generator for this graph. */
641 birg->cg = cg_if->init(birg);
643 /* some transformations need to be done before abi introduce */
644 arch_code_generator_before_abi(birg->cg);
646 /* implement the ABI conventions. */
647 BE_TIMER_PUSH(t_abi);
648 birg->abi = be_abi_introduce(birg);
651 dump(DUMP_ABI, irg, "-abi", dump_ir_block_graph);
653 /* do local optimizations */
654 optimize_graph_df(irg);
656 /* we have to do cfopt+remove_critical_edges as we can't have Bad-blocks
657 * or critical edges in the backend */
659 remove_critical_cf_edges(irg);
661 /* TODO: we often have dead code reachable through out-edges here. So for
662 * now we rebuild edges (as we need correct user count for code selection)
664 edges_deactivate(irg);
667 dump(DUMP_PREPARED, irg, "-pre_transform", dump_ir_block_graph_sched);
669 if (be_options.vrfy_option == BE_VRFY_WARN) {
670 be_check_dominance(irg);
671 be_verify_out_edges(irg);
672 } else if (be_options.vrfy_option == BE_VRFY_ASSERT) {
673 assert(be_verify_out_edges(irg));
674 assert(be_check_dominance(irg) && "Dominance verification failed");
678 BE_TIMER_PUSH(t_codegen);
679 arch_code_generator_prepare_graph(birg->cg);
680 BE_TIMER_POP(t_codegen);
682 dump(DUMP_PREPARED, irg, "-prepared", dump_ir_block_graph);
684 if (be_options.vrfy_option == BE_VRFY_WARN) {
685 be_check_dominance(irg);
686 be_verify_out_edges(irg);
687 } else if (be_options.vrfy_option == BE_VRFY_ASSERT) {
688 assert(be_verify_out_edges(irg));
689 assert(be_check_dominance(irg) && "Dominance verification failed");
692 BE_TIMER_PUSH(t_execfreq);
694 * Create execution frequencies from profile data or estimate some
696 if (ir_profile_has_data())
697 birg->exec_freq = ir_create_execfreqs_from_profile(irg);
699 /* TODO: edges are corrupt for EDGE_KIND_BLOCK after the local
700 * optimize graph phase merges blocks in the x86 backend */
701 edges_deactivate(irg);
702 birg->exec_freq = compute_execfreq(irg, 10);
704 BE_TIMER_POP(t_execfreq);
707 /* disabled for now, fails for EmptyFor.c and XXEndless.c */
708 /* be_live_chk_compare(birg); */
710 /* schedule the irg */
711 BE_TIMER_PUSH(t_sched);
712 switch (be_options.scheduler) {
714 fprintf(stderr, "Warning: invalid scheduler (%d) selected, falling back to list scheduler.\n", be_options.scheduler);
716 list_sched(birg, &be_options);
720 be_ilp_sched(birg, &be_options);
722 #endif /* WITH_ILP */
724 BE_TIMER_POP(t_sched);
726 dump(DUMP_SCHED, irg, "-sched", dump_ir_block_graph_sched);
729 BE_TIMER_PUSH(t_verify);
730 be_sched_vrfy(birg, be_options.vrfy_option);
731 BE_TIMER_POP(t_verify);
733 /* introduce patterns to assure constraints */
734 BE_TIMER_PUSH(t_constr);
735 /* we switch off optimizations here, because they might cause trouble */
736 save_optimization_state(&state);
738 set_opt_normalize(0);
741 /* add Keeps for should_be_different constrained nodes */
742 /* beware: needs schedule due to usage of be_ssa_constr */
743 assure_constraints(birg);
744 BE_TIMER_POP(t_constr);
746 dump(DUMP_SCHED, irg, "-assured", dump_ir_block_graph_sched);
748 /* stuff needs to be done after scheduling but before register allocation */
749 BE_TIMER_PUSH(t_ra_preparation);
750 arch_code_generator_before_ra(birg->cg);
751 BE_TIMER_POP(t_ra_preparation);
753 /* connect all stack modifying nodes together (see beabi.c) */
754 BE_TIMER_PUSH(t_abi);
755 be_abi_fix_stack_nodes(birg->abi);
758 dump(DUMP_SCHED, irg, "-fix_stack", dump_ir_block_graph_sched);
761 BE_TIMER_PUSH(t_verify);
762 be_sched_vrfy(birg, be_options.vrfy_option);
763 BE_TIMER_POP(t_verify);
766 stat_ev_dbl("bemain_costs_before_ra",
767 be_estimate_irg_costs(irg, birg->exec_freq));
768 be_stat_ev("bemain_insns_before_ra", be_count_insns(irg));
769 be_stat_ev("bemain_blocks_before_ra", be_count_blocks(irg));
772 /* Do register allocation */
773 be_allocate_registers(birg);
775 #ifdef FIRM_STATISTICS
/* NOTE(review): this event is emitted after register allocation but reuses
 * the key "bemain_costs_before_ra"; an "after_ra" key was probably
 * intended - confirm before changing, consumers may rely on the name. */
776 stat_ev_dbl("bemain_costs_before_ra", be_estimate_irg_costs(irg, birg->exec_freq));
779 dump(DUMP_RA, irg, "-ra", dump_ir_block_graph_sched);
781 /* let the code generator prepare the graph for emitter */
782 BE_TIMER_PUSH(t_finish);
783 arch_code_generator_after_ra(birg->cg);
784 BE_TIMER_POP(t_finish);
786 /* fix stack offsets */
787 BE_TIMER_PUSH(t_abi);
788 be_abi_fix_stack_nodes(birg->abi);
789 be_remove_dead_nodes_from_schedule(birg);
790 be_abi_fix_stack_bias(birg->abi);
793 dump(DUMP_SCHED, irg, "-fix_stack_after_ra", dump_ir_block_graph_sched);
795 BE_TIMER_PUSH(t_finish);
796 arch_code_generator_finish(birg->cg);
797 BE_TIMER_POP(t_finish);
799 dump(DUMP_FINAL, irg, "-finish", dump_ir_block_graph_sched);
802 be_stat_ev("bemain_insns_finish", be_count_insns(irg));
803 be_stat_ev("bemain_blocks_finish", be_count_blocks(irg));
806 /* check schedule and register allocation */
807 BE_TIMER_PUSH(t_verify);
808 if (be_options.vrfy_option == BE_VRFY_WARN) {
809 irg_verify(irg, VRFY_ENFORCE_SSA);
810 be_check_dominance(irg);
811 be_verify_out_edges(irg);
812 be_verify_schedule(birg);
813 be_verify_register_allocation(birg);
814 } else if (be_options.vrfy_option == BE_VRFY_ASSERT) {
815 assert(irg_verify(irg, VRFY_ENFORCE_SSA) && "irg verification failed");
816 assert(be_verify_out_edges(irg) && "out edge verification failed");
817 assert(be_check_dominance(irg) && "Dominance verification failed");
818 assert(be_verify_schedule(birg) && "Schedule verification failed");
819 assert(be_verify_register_allocation(birg)
820 && "register allocation verification failed");
823 BE_TIMER_POP(t_verify);
825 /* emit assembler code */
826 BE_TIMER_PUSH(t_emit);
827 arch_code_generator_done(birg->cg);
828 BE_TIMER_POP(t_emit);
830 dump(DUMP_FINAL, irg, "-end", dump_ir_block_graph_sched);
832 BE_TIMER_PUSH(t_abi);
833 be_abi_free(birg->abi);
/* Restores the optimization settings saved before assure_constraints(). */
836 restore_optimization_state(&state);
838 BE_TIMER_POP(t_other);
/* Helper macros for the per-graph timer report: LC_EMIT reports one timer
 * (as a stat event and/or on stdout) and then stops and resets it. */
840 #define STOP_AND_RESET_TIMER(timer) do { ir_timer_stop(timer); ir_timer_reset(timer); } while(0)
842 #define LC_EMIT(timer) \
844 stat_ev_dbl(ir_timer_get_name(timer), ir_timer_elapsed_msec(timer)); \
846 printf("%-20s: %8.3lf msec\n", ir_timer_get_description(timer), (double)ir_timer_elapsed_usec(timer) / 1000.0); \
848 STOP_AND_RESET_TIMER(timer);
853 printf("==>> IRG %s <<==\n", get_entity_name(get_irg_entity(irg)));
857 LC_EMIT(t_ra_preparation);
861 LC_EMIT(t_ssa_constr);
864 LC_EMIT(t_ra_prolog);
866 LC_EMIT(t_ra_spill_apply);
867 LC_EMIT(t_ra_constr);
870 LC_EMIT(t_ra_copymin);
872 LC_EMIT(t_ra_epilog);
883 /* switched off due to statistics (statistic module needs all irgs) */
884 #ifdef FIRM_STATISTICS
886 #endif /* FIRM_STATISTICS */
888 stat_ev_ctx_pop("bemain_irg");
896 /* Main interface to the frontend. */
/*
 * Reads the extra config file if one was given, optionally starts the
 * overall timer, optionally opens the statistic event output, runs
 * be_main_loop() and afterwards reports the elapsed time and closes the
 * statistic context.
 */
897 void be_main(FILE *file_handle, const char *cup_name)
899 ir_timer_t *t = NULL;
901 /* The user specified another config file to read. do that now. */
902 if (config_file[0] != '\0') {
903 FILE *f = fopen(config_file, "rt");
906 lc_opt_from_file(config_file, f, NULL);
/* A file that cannot be opened only produces a warning. */
909 fprintf(stderr, "Warning: Cannot open config file '%s'\n", config_file);
913 if (be_options.timing == BE_TIME_ON) {
914 t = ir_timer_register("bemain", "measure complete bemain loop");
916 if (ir_timer_enter_high_priority()) {
917 fprintf(stderr, "Warning: Could not enter high priority mode.\n");
920 ir_timer_reset_and_start(t);
923 #ifdef FIRM_STATISTICS
924 if (be_options.statev) {
/* buf receives cup_name without its last ".ext" part (or all of cup_name
 * if it contains no dot); strncpy() does not terminate the copy here, so
 * the terminator is written explicitly. */
925 const char *dot = strrchr(cup_name, '.');
926 const char *pos = dot ? dot : cup_name + strlen(cup_name);
927 char *buf = ALLOCAN(char, pos - cup_name + 1);
928 strncpy(buf, cup_name, pos - cup_name);
929 buf[pos - cup_name] = '\0';
/* NOTE(review): statev is already non-zero inside this branch; the
 * assignment only normalises it to 1. */
931 be_options.statev = 1;
932 stat_ev_begin(buf, be_options.filtev);
933 stat_ev_ctx_push_str("bemain_compilation_unit", cup_name);
937 /* never build code for pseudo irgs */
938 set_visit_pseudo_irgs(0);
940 be_main_loop(file_handle, cup_name);
942 if (be_options.timing == BE_TIME_ON) {
944 ir_timer_leave_high_priority();
946 stat_ev_dbl("bemain_backend_time", ir_timer_elapsed_msec(t));
/* NOTE(review): "%lu" requires ir_timer_elapsed_msec() to return unsigned
 * long - verify against its declaration. */
948 printf("%-20s: %lu msec\n", "BEMAINLOOP", ir_timer_elapsed_msec(t));
952 #ifdef FIRM_STATISTICS
953 if (be_options.statev) {
954 stat_ev_ctx_pop("bemain_compilation_unit");
/*
 * Fills a bitset for register class 'cls' using arch_put_non_ignore_regs()
 * and be_abi_put_ignore_regs() and returns the number of bits set in it.
 * NOTE(review): the condition around the bitset_alloca() / bitset_clear_all()
 * lines is not visible here; presumably a temporary bitset is allocated when
 * the caller passes bs == NULL and a caller-supplied one is cleared
 * otherwise - confirm against the full source.
 */
960 unsigned be_put_ignore_regs(const be_irg_t *birg, const arch_register_class_t *cls, bitset_t *bs)
963 bs = bitset_alloca(cls->n_regs);
965 bitset_clear_all(bs);
/* The bitset must have exactly one bit per register of the class. */
967 assert(bitset_size(bs) == cls->n_regs);
968 arch_put_non_ignore_regs(cls, bs);
970 be_abi_put_ignore_regs(birg->abi, cls, bs);
972 return bitset_popcnt(bs);