2 * Author: Daniel Grund, Sebastian Hack
4 * Copyright: (c) Universitaet Karlsruhe
5 * Licence: This file is protected by GPL - GNU GENERAL PUBLIC LICENSE.
16 #include "iredges_t.h"
26 #include "besched_t.h"
29 #include "bechordal_t.h"
32 /* This enables re-computation of values. Current state: Unfinished and buggy. */
/* Forward typedefs: a node of the reloader list (see be_add_reload()) and the per-node spill record. */
35 typedef struct _reloader_t reloader_t;
36 typedef struct _spill_info_t spill_info_t;
/* Spill record of one node. Records are kept in the spills set and compared by spilled_node only (see cmp_spillinfo()). */
43 struct _spill_info_t {
/* the node that has to be spilled */
44 ir_node *spilled_node;
/* head of the singly linked list of reload points; be_add_reload() prepends new entries */
45 reloader_t *reloaders;
/*
 * A spill context. cmp_spillctx() identifies a context by its (spilled, user) pair;
 * the spill member holds the spill node created for that pair (set in be_spill_irn()
 * and be_spill_phi()).
 */
48 typedef struct _spill_ctx_t {
49 ir_node *spilled; /**< The spilled node. */
50 ir_node *user; /**< The node this spill is for. */
51 ir_node *spill; /**< The spill itself. */
/* Members of the spill environment; be_new_spill_env() initialises them. */
/* register class, copied from chordal_env->cls */
55 const arch_register_class_t *cls;
/* the chordal environment this spill environment was created for */
56 const be_chordal_env_t *chordal_env;
59 set *spills; /**< all spill_info_t's, which must be placed */
60 pset *mem_phis; /**< set of all special spilled phis. allocated and freed separately */
61 decide_irn_t is_mem_phi; /**< callback func to decide if a phi needs special spilling */
62 void *data; /**< data passed to all callbacks */
/* debug module used by the DBG() statements */
63 DEBUG_ONLY(firm_dbg_module_t *dbg;)
66 /* associated Phi -> Spill*/
/* Entries of this type live in the already_visited_phis set of be_spill_phi(); the code uses the members phi and spill. */
67 typedef struct _phi_spill_assoc_t {
73 * Compare two Phi->Spill associations.
75 static int cmp_phi_spill_assoc(const void *a, const void *b) {
76 const phi_spill_assoc_t *p1 = a;
77 const phi_spill_assoc_t *p2 = b;
78 return p1->phi != p2->phi;
82 * compare two spill contexts.
84 static int cmp_spillctx(const void *a, const void *b, size_t n) {
85 const spill_ctx_t *p = a;
86 const spill_ctx_t *q = b;
87 return p->user != q->user || p->spilled != q->spilled;
91 * Compare two spill infos.
93 static int cmp_spillinfo(const void *x, const void *y, size_t size) {
94 const spill_info_t *xx = x;
95 const spill_info_t *yy = y;
96 return xx->spilled_node != yy->spilled_node;
100 /* Sets the debug module of a spill environment. */
/*
 * env: the spill environment whose debug module is set
 * dbg: the debug module; the DBG() statements in this file print through the environment's dbg member
 */
101 void be_set_spill_env_dbg_module(spill_env_t *env, firm_dbg_module_t *dbg) {
106 /* Creates a new spill environment. */
/*
 * chordal_env: chordal environment; stored in the new environment, its register class is copied too
 * is_mem_phi:  callback stored in the environment
 * data:        NOTE(review): presumably kept as the callback data (env->data) - confirm
 *
 * The environment is allocated with xmalloc(); be_delete_spill_env() releases its sets and obstack.
 */
107 spill_env_t *be_new_spill_env(const be_chordal_env_t *chordal_env, decide_irn_t is_mem_phi, void *data) {
108 spill_env_t *env = xmalloc(sizeof(env[0]));
/* one set for the spill contexts and one for the spill infos, each with its own compare callback */
109 env->spill_ctxs = new_set(cmp_spillctx, 1024);
110 env->spills = new_set(cmp_spillinfo, 1024);
/* keep the register class of the chordal environment at hand */
111 env->cls = chordal_env->cls;
112 env->is_mem_phi = is_mem_phi;
114 env->chordal_env = chordal_env;
/* obstack from which be_add_reload() allocates the reloader list nodes */
115 obstack_init(&env->obst);
119 /* Deletes a spill environment. */
/*
 * Releases the two sets and everything that was allocated on the environment's obstack.
 * mem_phis is not handled here: it is created and deleted inside be_insert_spills_reloads().
 */
120 void be_delete_spill_env(spill_env_t *senv) {
121 del_set(senv->spill_ctxs);
122 del_set(senv->spills);
/* a NULL object frees all objects of the obstack */
123 obstack_free(&senv->obst, NULL);
128 * Returns a spill context. If the context does not exist, create one.
130 * @param sc the set containing all spill contexts
131 * @param to_spill the node that should be spilled
132 * @param ctx_irn an user of the spilled node
134 * @return a spill context.
/*
 * Fills a template with (to_spill, ctx_irn) and passes it to set_insert(), hashed over both
 * node pointers. cmp_spillctx() compares the spilled and user members only, so the entry
 * returned is the one that belongs to this pair.
 */
136 static spill_ctx_t *be_get_spill_ctx(set *sc, ir_node *to_spill, ir_node *ctx_irn) {
/* the template carries the lookup key */
139 templ.spilled = to_spill;
140 templ.user = ctx_irn;
/* hand back the entry of the set for this key */
143 return set_insert(sc, &templ, sizeof(templ), HASH_COMBINE(HASH_PTR(to_spill), HASH_PTR(ctx_irn)));
149 * @param senv the spill environment
150 * @param irn the node that should be spilled
151 * @param ctx_irn an user of the spilled node
153 * @return a be_Spill node
/*
 * Spills irn for the context node ctx_irn. The spill node is stored in the spill
 * context of the (irn, ctx_irn) pair.
 */
155 static ir_node *be_spill_irn(spill_env_t *senv, ir_node *irn, ir_node *ctx_irn) {
157 DBG((senv->dbg, LEVEL_1, "%+F in ctx %+F\n", irn, ctx_irn));
/* fetch the spill context of this pair */
159 ctx = be_get_spill_ctx(senv->spill_ctxs, irn, ctx_irn);
/* create the spill through be_spill() with the backend's arch environment and remember it in the context */
161 const be_main_env_t *env = senv->chordal_env->birg->main_env;
162 ctx->spill = be_spill(env->arch_env, irn, ctx_irn);
169 * If the first usage of a Phi result would be out of memory
170 * there is no sense in allocating a register for it.
171 * Thus we spill it and all its operands to the same spill slot.
172 * Therefore the phi/dataB becomes a phi/Memory
174 * @param senv the spill environment
175 * @param phi the Phi node that should be spilled
176 * @param ctx_irn an user of the spilled node
178 * @return a be_Spill node
/*
 * Spills a Phi as a memory Phi: a Phi of mode_M with the same arity is created in the
 * block of phi, and each of its operands is set to the spill of the matching operand
 * of phi. Operands that are Phis contained in senv->mem_phis are spilled by recursion.
 *
 * senv:                 the spill environment
 * phi:                  the Phi to spill
 * ctx_irn:              context node handed to the spill contexts
 * visited_nr:           visited value that marks the Phis already handled
 * already_visited_phis: set of phi_spill_assoc_t entries (handled Phi -> its spill)
 */
180 static ir_node *be_spill_phi(spill_env_t *senv, ir_node *phi, ir_node *ctx_irn, unsigned visited_nr, pset *already_visited_phis) {
181 int i, n = get_irn_arity(phi);
182 ir_graph *irg = senv->chordal_env->irg;
183 ir_mode *phi_mode = get_irn_mode(phi);
184 ir_node *bl = get_nodes_block(phi);
185 ir_node **ins, *phi_spill;
186 phi_spill_assoc_t key;
190 DBG((senv->dbg, LEVEL_1, "%+F in ctx %+F\n", phi, ctx_irn));
/* NOTE(review): the hard-coded node numbers look like a debugging leftover - confirm and remove */
192 if (get_irn_node_nr(phi) == 2219 || get_irn_node_nr(phi) == 2214)
195 /* build a new PhiM */
/* the operands start out as Unknown placeholders; the loop further down replaces each of them via set_irn_n() */
196 NEW_ARR_A(ir_node *, ins, n);
197 for (i = 0; i < n; ++i) {
198 ins[i] = new_rd_Unknown(irg, phi_mode);
200 phi_spill = new_r_Phi(senv->chordal_env->irg, bl, n, ins, mode_M);
/* register the new PhiM under the hash of phi so that recursive calls can find it */
/* NOTE(review): &key is the address of a local; if pset_insert() stores the pointer instead of
   copying the entry, later writes to key change the stored entry - confirm */
202 key.spill = phi_spill;
203 pset_insert(already_visited_phis, &key, HASH_PTR(phi));
205 /* search an existing spill for this context */
206 ctx = be_get_spill_ctx(senv->spill_ctxs, phi, ctx_irn);
208 /* if not found spill the phi */
/* mark phi as handled for this visited_nr */
210 set_irn_visited(phi, visited_nr);
212 /* collect all arguments of the phi */
213 for (i = 0; i < n; ++i) {
214 ir_node *arg = get_irn_n(phi, i);
216 phi_spill_assoc_t *entry;
/* operand is a memory Phi itself */
218 if(is_Phi(arg) && pset_find_ptr(senv->mem_phis, arg)) {
/* not handled yet for this visited_nr: recurse */
219 if (get_irn_visited(arg) < visited_nr)
220 sub_res = be_spill_phi(senv, arg, ctx_irn, visited_nr, already_visited_phis);
222 /* we already visited the argument phi: get its spill */
225 entry = pset_find(already_visited_phis, &key, HASH_PTR(arg));
226 assert(entry && "argument phi already visited, but no spill found?!?");
227 sub_res = entry->spill;
/* every other operand gets an ordinary spill */
231 sub_res = be_spill_irn(senv, arg, ctx_irn);
/* replace the placeholder operand of the PhiM */
233 set_irn_n(phi_spill, i, sub_res);
/* remember the PhiM as the spill of this context */
236 ctx->spill = phi_spill;
244 * @param senv the spill environment
245 * @param irn the node that should be spilled
246 * @param ctx_irn an user of the spilled node
248 * @return a be_Spill node
/*
 * Entry point for spilling one node; to_spill acts as its own context node.
 * Nodes contained in senv->mem_phis are spilled with be_spill_phi(), all others with
 * be_spill_irn(). The parameters of this function are senv, to_spill and visited_nr
 * (visited_nr is handed on to be_spill_phi()).
 */
250 static ir_node *be_spill_node(spill_env_t *senv, ir_node *to_spill, unsigned visited_nr) {
251 ir_graph *irg = get_irn_irg(to_spill);
/* remember the current optimization settings; they are restored at the end */
252 int save_optimize = get_optimize();
253 int save_normalize = get_opt_normalize();
/* temporary Phi -> Spill map used by be_spill_phi(); deleted again below */
254 pset *already_visited_phis = new_pset(cmp_phi_spill_assoc, 10);
258 * Disable optimization so that the phi functions do not
262 set_opt_normalize(0);
264 if (pset_find_ptr(senv->mem_phis, to_spill))
265 res = be_spill_phi(senv, to_spill, to_spill, visited_nr, already_visited_phis);
267 res = be_spill_irn(senv, to_spill, to_spill);
269 del_pset(already_visited_phis);
271 /* reset the optimizations */
272 set_optimize(save_optimize);
273 set_opt_normalize(save_normalize);
283 * Check if a spilled node could be rematerialized.
285 * @param senv the spill environment
286 * @param spill the Spill node
287 * @param spilled the node that was spilled
288 * @param reloader a irn that requires a reload
/*
 * Rematerialization check that also looks at the operands of the spilled node.
 * This is the BUGGY_REMAT variant; the simple variant sits in the preprocessor
 * else-branch that follows. Two cases are distinguished: reloader is a Block
 * (liveness of the operands at the block end is tested) or reloader is an
 * instruction (interference with and use by the reloader are tested).
 */
290 static int check_remat_conditions(spill_env_t *senv, ir_node *spill, ir_node *spilled, ir_node *reloader) {
293 /* check for 'normal' spill and general remat condition */
294 if (!be_is_Spill(spill) || !arch_irn_is(senv->chordal_env->birg->main_env->arch_env, spilled, rematerializable))
297 /* check availability of original arguments */
298 if (is_Block(reloader)) {
300 /* we want to remat at the end of a block.
301 * thus all arguments must be alive at the end of the block
303 for (pos=0, max=get_irn_arity(spilled); pos<max; ++pos) {
304 ir_node *arg = get_irn_n(spilled, pos);
305 if (!is_live_end(reloader, arg))
311 /* we want to remat before the insn reloader
312 * thus an arguments is alive if
313 * - it interferes with the reloaders result
315 * - or it is (last-) used by reloader itself
317 for (pos=0, max=get_irn_arity(spilled); pos<max; ++pos) {
318 ir_node *arg = get_irn_n(spilled, pos);
321 if (values_interfere(reloader, arg))
324 for (i=0, m=get_irn_arity(reloader); i<m; ++i) {
325 ir_node *rel_arg = get_irn_n(reloader, i);
330 /* arg is not alive before reloader */
342 #else /* BUGGY_REMAT */
345 * A very simple rematerialization checker.
347 * @param senv the spill environment
348 * @param spill the Spill node
349 * @param spilled the node that was spilled
350 * @param reloader a irn that requires a reload
352 static int check_remat_conditions(spill_env_t *senv, ir_node *spill, ir_node *spilled, ir_node *reloader) {
353 const arch_env_t *aenv = senv->chordal_env->birg->main_env->arch_env;
355 return get_irn_arity(spilled) == 0 &&
356 be_is_Spill(spill) &&
357 arch_irn_is(aenv, spilled, rematerializable);
360 #endif /* BUGGY_REMAT */
365 * Re-materialize a node.
367 * @param senv the spill environment
368 * @param spilled the node that was spilled
369 * @param reloader a irn that requires a reload
/*
 * Creates a copy of spilled and puts it into the schedule at the reload point, either
 * at a block reloader or directly before an instruction reloader.
 */
371 static ir_node *do_remat(spill_env_t *senv, ir_node *spilled, ir_node *reloader) {
/* the copy lives in the reloader itself if that is a block, otherwise in the block of the reloader */
373 ir_node *bl = (is_Block(reloader)) ? reloader : get_nodes_block(reloader);
375 /* recompute the value */
/* the copy takes debug info, mode, arity and operands from spilled.
   NOTE(review): "+ 1" skips the first entry of the in-array - presumably the block entry - confirm */
376 res = new_ir_node(get_irn_dbg_info(spilled), senv->chordal_env->irg, bl,
378 get_irn_mode(spilled),
379 get_irn_arity(spilled),
380 get_irn_in(spilled) + 1);
/* the node attributes are taken over as well */
381 copy_node_attr(spilled, res);
383 DBG((senv->dbg, LEVEL_1, "Insert remat %+F before reloader %+F\n", res, reloader));
385 /* insert in schedule */
386 if (is_Block(reloader)) {
/* block reloader: the copy goes after the node that sched_skip() returns for the control-flow predicate */
387 ir_node *insert = sched_skip(reloader, 0, sched_skip_cf_predicator, (void *) senv->chordal_env->birg->main_env->arch_env);
388 sched_add_after(insert, res);
/* instruction reloader: the copy goes directly before it */
390 sched_add_before(reloader, res);
397 * Walker: fills the mem_phis set by evaluating Phi nodes
398 * using the is_mem_phi() callback.
/* Graph walker callback; be_insert_spills_reloads() passes the spill environment as env. */
400 static void phi_walker(ir_node *irn, void *env) {
401 spill_env_t *senv = env;
404 const arch_env_t *arch = senv->chordal_env->birg->main_env->arch_env;
/* a node is recorded when the register class test (position argument 0, class senv->cls)
   succeeds and the is_mem_phi() callback accepts it */
405 if (arch_irn_has_reg_class(arch, irn, 0, senv->cls) &&
406 senv->is_mem_phi(irn, senv->data)) {
407 DBG((senv->dbg, LEVEL_1, " %+F\n", irn));
408 pset_insert_ptr(senv->mem_phis, irn);
/*
 * Places the spills and reloads that were registered in the spill environment.
 *
 * Steps:
 *  1. collect the memory Phis with phi_walker()
 *  2. register reloads for Phi users of memory Phis that are not memory Phis themselves
 *  3. for every spill info: create the spill and, per reloader, a reload or a
 *     rematerialized copy; then run the SSA construction over the new values
 *  4. replace the operands of all memory Phis by Bad
 *  5. work through the list of nodes that may have become dead
 *
 * senv:       the spill environment
 * reload_set: set that receives the values created for the reloaders
 */
413 void be_insert_spills_reloads(spill_env_t *senv, pset *reload_set) {
414 const arch_env_t *aenv = senv->chordal_env->birg->main_env->arch_env;
415 ir_graph *irg = senv->chordal_env->irg;
421 /* get all special spilled phis */
422 DBG((senv->dbg, LEVEL_1, "Mem-phis:\n"));
/* mem_phis only lives for the duration of this function; it is deleted at the end */
423 senv->mem_phis = pset_new_ptr_default();
424 irg_walk_graph(senv->chordal_env->irg, phi_walker, NULL, senv);
426 /* Add reloads for mem_phis */
427 /* BETTER: These reloads (1) should only be inserted, if they are really needed */
428 DBG((senv->dbg, LEVEL_1, "Reloads for mem-phis:\n"));
429 for(irn = pset_first(senv->mem_phis); irn; irn = pset_next(senv->mem_phis)) {
431 DBG((senv->dbg, LEVEL_1, " Mem-phi %+F\n", irn));
432 foreach_out_edge(irn, e) {
433 ir_node *user = e->src;
/* only Phi users that are not memory Phis need the value in a register again */
434 if (is_Phi(user) && !pset_find_ptr(senv->mem_phis, user)) {
435 ir_node *use_bl = get_nodes_block(user);
436 DBG((senv->dbg, LEVEL_1, " non-mem-phi user %+F\n", user));
437 be_add_reload_on_edge(senv, irn, use_bl, e->pos); /* (1) */
/* take a fresh visited value; be_spill_phi() uses it to mark the Phis it has handled */
442 visited_nr = get_irg_visited(irg) + 1;
443 set_irg_visited(irg, visited_nr);
445 /* process each spilled node */
446 DBG((senv->dbg, LEVEL_1, "Insert spills and reloads:\n"));
/* queue of nodes that may have lost their users */
447 possibly_dead = new_pdeq();
448 for(si = set_first(senv->spills); si; si = set_next(senv->spills)) {
450 ir_mode *mode = get_irn_mode(si->spilled_node);
/* collects the values created for this spilled node */
451 pset *values = pset_new_ptr(16);
453 /* go through all reloads for this spill */
454 for(rld = si->reloaders; rld; rld = rld->next) {
457 /* the spill for this reloader */
458 ir_node *spill = be_spill_node(senv, si->spilled_node, visited_nr);
/* rematerialize where the check allows it; the spill is queued as possibly dead in that case */
461 if (check_remat_conditions(senv, spill, si->spilled_node, rld->reloader)) {
462 new_val = do_remat(senv, si->spilled_node, rld->reloader);
463 pdeq_putl(possibly_dead, spill);
/* otherwise reload from the spill */
468 new_val = be_reload(aenv, senv->cls, rld->reloader, mode, spill);
470 DBG((senv->dbg, LEVEL_1, " %+F of %+F before %+F\n", new_val, si->spilled_node, rld->reloader));
471 pset_insert_ptr(values, new_val);
473 pset_insert_ptr(reload_set, new_val);
476 /* introduce copies, rewire the uses */
477 assert(pset_count(values) > 0 && "???");
/* the original value takes part in the SSA construction too; mem_phis is passed as the ignore set */
478 pset_insert_ptr(values, si->spilled_node);
479 be_ssa_constr_set_ignore(senv->chordal_env->dom_front, values, senv->mem_phis);
/* detach the memory Phis from their operands: every operand is queued and replaced by Bad */
484 foreach_pset(senv->mem_phis, irn) {
486 for (i = 0, n = get_irn_arity(irn); i < n; ++i) {
487 pdeq_putl(possibly_dead, get_irn_n(irn, i));
488 set_irn_n(irn, i, new_r_Bad(senv->chordal_env->irg));
493 /* check if possibly dead nodes are really dead yet */
494 while (! pdeq_empty(possibly_dead)) {
495 ir_node *irn = pdeq_getr(possibly_dead);
496 const ir_edge_t *edge = get_irn_out_edge_first(irn);
/* the operands of the node are queued in turn and replaced by Bad */
500 for (i = get_irn_arity(irn) - 1; i >= 0; --i) {
501 pdeq_putl(possibly_dead, get_irn_n(irn, i));
502 set_irn_n(irn, i, new_r_Bad(senv->chordal_env->irg));
/* release the helper containers of this run */
507 del_pdeq(possibly_dead);
508 del_pset(senv->mem_phis);
/*
 * Registers that to_spill has to be reloaded at the reload point before.
 *
 * senv:     the spill environment
 * to_spill: the node to spill
 * before:   the reload point; be_add_reload_on_edge() may pass a Block here
 */
511 void be_add_reload(spill_env_t *senv, ir_node *to_spill, ir_node *before) {
512 spill_info_t templ, *res;
/* look up the spill info of to_spill; the template starts with an empty reloader list */
515 templ.spilled_node = to_spill;
516 templ.reloaders = NULL;
517 res = set_insert(senv->spills, &templ, sizeof(templ), HASH_PTR(to_spill));
/* the list node lives on the obstack of the environment and is prepended to the list */
519 rel = obstack_alloc(&senv->obst, sizeof(rel[0]));
520 rel->reloader = before;
521 rel->next = res->reloaders;
522 res->reloaders = rel;
525 void be_add_reload_on_edge(spill_env_t *senv, ir_node *to_spill, ir_node *bl, int pos) {
526 ir_node *insert_bl = get_irn_arity(bl) == 1 ? sched_first(bl) : get_Block_cfgpred_block(bl, pos);
527 be_add_reload(senv, to_spill, insert_bl);
532 /****************************************
534 SPILL SLOT MANAGEMENT AND OPTS
536 ****************************************/
/* One spill slot. Besides largest_mode the code in this file uses its members, size and align fields. */
538 typedef struct _spill_slot_t {
542 ir_mode *largest_mode; /* the mode of all members with largest size */
/* Environment of the spill slot computation; set up and torn down in be_compute_spill_offsets(). */
545 typedef struct _ss_env_t {
/* chordal environment; provides the graph and the arch environment */
547 be_chordal_env_t *cenv;
548 pmap *slots; /* maps spill_contexts to spill_slots */
549 pmap *types; /* maps modes to types */
/* debug module used by the DBG() statements in optimize_slots() */
550 DEBUG_ONLY(firm_dbg_module_t *dbg;)
555 * Walker: compute the spill slots
/*
 * Graph walker callback; env is the ss_env_t of be_compute_spill_offsets().
 * Sorts every be_Spill node into the spill slot of its spill context and creates
 * the slot when the context is seen for the first time.
 */
557 static void compute_spill_slots_walker(ir_node *spill, void *env) {
558 ss_env_t *ssenv = env;
/* only be_Spill nodes are of interest */
563 if (!be_is_Spill(spill))
566 /* check, if this spill is for a context already known */
567 ctx = be_get_Spill_context(spill);
568 entry = pmap_find(ssenv->slots, ctx);
/* mode of the register class of the spilled value */
571 struct _arch_env_t *arch_env = ssenv->cenv->birg->main_env->arch_env;
572 const arch_register_class_t *cls = arch_get_irn_reg_class(arch_env, spill, be_pos_Spill_val);
573 ir_mode *largest_mode = arch_register_class_mode(cls);
575 /* this is a new spill context */
/* the slot lives on the obstack of the environment; size and alignment come from the register class */
576 ss = obstack_alloc(&ssenv->ob, sizeof(*ss));
577 ss->members = pset_new_ptr(8);
578 ss->largest_mode = largest_mode;
579 ss->size = get_mode_size_bytes(ss->largest_mode);
580 ss->align = arch_isa_get_reg_class_alignment(arch_env->isa, cls);
581 pmap_insert(ssenv->slots, ctx, ss);
583 /* values with the same spill_ctx must go into the same spill slot */
587 /* ugly mega assert :-) */
/* sanity checks: the size must match the slot and no member may interfere with the new spill */
590 struct _arch_env_t *arch_env = ssenv->cenv->birg->main_env->arch_env;
591 const arch_register_class_t *cls = arch_get_irn_reg_class(arch_env, spill, be_pos_Spill_val);
592 int size = get_mode_size_bytes(arch_register_class_mode(cls));
593 assert(ss->size == size && "Different sizes for the same spill slot are not allowed.");
594 for (irn = pset_first(ss->members); irn; irn = pset_next(ss->members)) {
595 /* use values_interfere here, because it uses the dominance check,
596 which does work for values in memory */
597 assert(!values_interfere(spill, irn) && "Spills for the same spill slot must not interfere!");
/* the spill becomes a member of the slot */
603 pset_insert_ptr(ss->members, spill);
607 * qsort compare function, sort spill slots by size.
609 static int ss_sorter(const void *v1, const void *v2) {
610 const spill_slot_t **ss1 = v1;
611 const spill_slot_t **ss2 = v2;
612 return ((int) (*ss2)->size) - ((int) (*ss1)->size);
617 * This function should optimize the spill slots.
618 * - Coalescing of multiple slots
619 * - Ordering the slots
621 * Input slots are in @p ssenv->slots
622 * @p size The count of initial spill slots in @p ssenv->slots
623 * This also is the size of the preallocated array @p ass
625 * @return An array of spill slots @p ass in specific order
/*
 * Fills ass with the slots of ssenv->slots, sorts them with ss_sorter() and then tries
 * to merge every slot into one of the slots already placed at the front of the array
 * (indices below used_slots): two slots can share when no member of one interferes
 * with a member of the other.
 */
627 static void optimize_slots(ss_env_t *ssenv, int size, spill_slot_t *ass[]) {
628 int i, o, used_slots;
/* copy the slot pointers out of the map into the array */
632 pmap_foreach(ssenv->slots, entr)
633 ass[i++] = entr->value;
635 /* Sort the array to minimize fragmentation and cache footprint.
636 Large slots come first */
637 qsort(ass, size, sizeof(ass[0]), ss_sorter);
639 /* For each spill slot:
640 - assign a new offset to this slot
641 - xor find another slot to coalesce with */
643 for (i=0; i<size; ++i) { /* for each spill slot */
647 DBG((ssenv->dbg, LEVEL_1, "Spill slot %d members:\n", i));
648 for(n1 = pset_first(ass[i]->members); n1; n1 = pset_next(ass[i]->members))
649 DBG((ssenv->dbg, LEVEL_1, " %+F\n", n1));
/* the search stops as soon as a target slot has been found */
652 for (o=0; o < used_slots && tgt_slot == -1; ++o) { /* for each offset-assigned spill slot */
653 /* check inter-slot-pairs for interference */
655 for(n1 = pset_first(ass[i]->members); n1; n1 = pset_next(ass[i]->members))
656 for(n2 = pset_first(ass[o]->members); n2; n2 = pset_next(ass[o]->members))
657 if(values_interfere(n1, n2)) {
/* both set iterations are left early, hence the pset_break() calls before the jump */
658 pset_break(ass[i]->members);
659 pset_break(ass[o]->members);
660 DBG((ssenv->dbg, LEVEL_1, " Interf %+F -- %+F\n", n1, n2));
661 goto interf_detected;
664 /* if we are here, there is no interference between ass[i] and ass[o] */
667 interf_detected: /*nothing*/ ;
670 /* now the members of ass[i] join the members of ass[tgt_slot] */
672 /* do we need a new slot? */
673 if (tgt_slot == -1) {
/* no partner found: the next free position at the front of the array becomes the target */
674 tgt_slot = used_slots;
/* the target takes the size of slot i and starts with a fresh, empty member set */
679 ass[tgt_slot]->size = ass[i]->size;
680 del_pset(ass[tgt_slot]->members);
681 ass[tgt_slot]->members = pset_new_ptr(8);
685 /* copy the members to the target pset */
686 /* NOTE: If src and tgt pset are the same, inserting while iterating is not allowed */
688 for(n1 = pset_first(ass[i]->members); n1; n1 = pset_next(ass[i]->members))
689 pset_insert_ptr(ass[tgt_slot]->members, n1);
/* The spill area starts at an offset of the frame type that is rounded up to this value (see assign_entities()). */
#define ALIGN_SPILL_AREA 16

/*
 * Iterates over all elements of a pset: elm is assigned each element in turn, the
 * loop ends when the iteration functions deliver NULL. Both macro parameters are
 * parenthesized so that arbitrary expressions can be passed safely.
 */
#define pset_foreach(pset, elm) for ((elm) = pset_first((pset)); (elm); (elm) = pset_next((pset)))
697 * Returns a spill type for a mode. Keep them in a map to reduce
698 * the number of types.
700 * @param types a map containing all created types
701 * @param ss the spill slot
703 * Note that the types should be identical for every mode.
704 * This rule might break if two different register classes return the same
705 * mode but different alignments.
/*
 * Looks up the type for the largest mode of the slot in the types map. If none is
 * found, a primitive type named after the mode is created, gets the alignment of
 * the slot and is entered into the map.
 */
707 static ir_type *get_spill_type(pmap *types, spill_slot_t *ss) {
/* the map is keyed by mode */
708 pmap_entry *e = pmap_find(types, ss->largest_mode);
/* build the type name from the mode name */
713 snprintf(buf, sizeof(buf), "spill_slot_type_%s", get_mode_name(ss->largest_mode));
714 res = new_type_primitive(new_id_from_str(buf), ss->largest_mode);
715 set_type_alignment_bytes(res, ss->align);
716 pmap_insert(types, ss->largest_mode, res);
/* a type shared through the map must have the alignment this slot asks for */
720 assert(get_type_alignment_bytes(res) == (int)ss->align);
726 * Create spill slot entities on the frame type.
728 * @param ssenv the spill environment
729 * @param n number of spill slots
730 * @param ss array of spill slots
/*
 * Creates one entity per spill slot on the frame type of the graph, assigns it an
 * offset behind the current frame contents and attaches the entity to every member
 * of the slot. The frame size is set to its final value at the end.
 */
732 static void assign_entities(ss_env_t *ssenv, int n_slots, spill_slot_t *ss[]) {
733 int i, offset, frame_align;
734 ir_type *frame = get_irg_frame_type(ssenv->cenv->irg);
736 /* aligning by increasing frame size */
/* start behind the current frame contents, rounded up to ALIGN_SPILL_AREA */
737 offset = get_type_size_bits(frame) / 8;
738 offset = round_up2(offset, ALIGN_SPILL_AREA);
/* the frame size is set to -1 here; the final size is written after the loop */
739 set_type_size_bytes(frame, -1);
741 /* create entities and assign offsets according to size and alignment*/
742 for (i = 0; i < n_slots; ++i) {
/* entity name: spill_slot_<index> */
749 snprintf(buf, sizeof(buf), "spill_slot_%d", i);
750 name = new_id_from_str(buf);
752 spill_ent = new_entity(frame, name, get_spill_type(ssenv->types, ss[i]));
/* respect the alignment of this slot */
755 offset = round_up2(offset, ss[i]->align);
757 set_entity_offset_bytes(spill_ent, offset);
758 /* next possible offset */
759 offset += round_up2(ss[i]->size, ss[i]->align);
/* every member of the slot gets the entity */
761 pset_foreach(ss[i]->members, irn)
762 be_set_Spill_entity(irn, spill_ent);
765 /* set final size of stack frame */
766 frame_align = get_type_alignment_bytes(frame);
767 set_type_size_bytes(frame, round_up2(offset, frame_align));
/*
 * Computes the spill slots of the graph of cenv and places them on the stack frame:
 * collect the initial slots with compute_spill_slots_walker(), merge and order them
 * with optimize_slots(), create the frame entities with assign_entities(), release
 * the temporary data and finally call be_copy_entities_to_reloads().
 */
770 void be_compute_spill_offsets(be_chordal_env_t *cenv) {
/* the obstack holds the spill slots and the slot array */
776 obstack_init(&ssenv.ob);
778 ssenv.slots = pmap_create();
779 ssenv.types = pmap_create();
780 FIRM_DBG_REGISTER(ssenv.dbg, "ir.be.spillslots");
782 /* Get initial spill slots */
783 irg_walk_graph(cenv->irg, NULL, compute_spill_slots_walker, &ssenv);
785 /* Build an empty array for optimized spill slots */
/* one array entry per initial slot */
786 ss_size = pmap_count(ssenv.slots);
787 ss = obstack_alloc(&ssenv.ob, ss_size * sizeof(*ss));
788 optimize_slots(&ssenv, ss_size, ss);
790 /* Integrate slots into the stack frame entity */
791 assign_entities(&ssenv, ss_size, ss);
/* clean up: the member sets of all slots, both maps and the obstack */
794 pmap_foreach(ssenv.slots, pme)
795 del_pset(((spill_slot_t *)pme->value)->members);
796 pmap_destroy(ssenv.slots);
797 pmap_destroy(ssenv.types);
798 obstack_free(&ssenv.ob, NULL);
800 be_copy_entities_to_reloads(cenv->irg);