2 * Author: Matthias Braun
4 * Copyright: (c) Universitaet Karlsruhe
5 * License: This file protected by GPL - GNU GENERAL PUBLIC LICENSE.
12 #include "bespillmorgan.h"
14 #include "bechordal.h"
15 #include "bechordal_t.h"
24 #include "interval_analysis.h"
28 #include "irgraph_t.h"
30 #include "irphase_t.h"
33 #include "bespillbelady.h"
// Second argument given to DBG() for the register-pressure messages in this file.
37 #define DBG_PRESSURE 2
// Debug module handle; be_spill_morgan() registers it as "ir.be.spillmorgan".
// Wrapped in DEBUG_ONLY, so presumably it only exists in debug builds - confirm.
38 DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)
// Working state of the Morgan spiller; it is filled in by be_spill_morgan().
// Only part of the field list is visible in this excerpt.
40 typedef struct _morgan_env_t {
// architecture environment, taken from chordal_env->birg->main_env->arch_env
41 const arch_env_t *arch;
// register class that is being processed (chordal_env->cls)
42 const arch_register_class_t *cls;
45 // maximum safe register pressure
// initialised with arch_count_non_ignore_regs(arch, cls)
46 int registers_available;
// environment handed to be_scan_insn() when scanning scheduled instructions
48 be_insn_env_t insn_env;
// One control-flow edge on which reloads are placed; the code in this file
// reads its `block` and `pos` members (the member list is not visible here).
56 typedef struct _loop_out_edge_t {
// Per-loop bookkeeping, stored in env->loop_attr_set and compared by its `loop` pointer.
61 typedef struct _loop_attr_t {
64 /// The set of all values that live through the loop and are not used
// bit positions are node indices (set via get_irn_idx(), read back via get_idx_irn())
65 bitset_t *livethrough_unused;
// Per-block bookkeeping, stored in env->block_attr_set and compared by its `block` pointer.
68 typedef struct _block_attr_t {
// values recorded as living through the block without being used in it;
// bit positions are node indices
70 bitset_t *livethrough_unused;
73 //---------------------------------------------------------------------------
75 int loop_out_edge_cmp(const void* p1, const void* p2, size_t s) {
76 loop_out_edge_t *e1 = (loop_out_edge_t*) p1;
77 loop_out_edge_t *e2 = (loop_out_edge_t*) p2;
79 return e1->block != e2->block || e1->pos != e2->pos;
82 int loop_attr_cmp(const void *e1, const void *e2, size_t s) {
83 loop_attr_t *la1 = (loop_attr_t*) e1;
84 loop_attr_t *la2 = (loop_attr_t*) e2;
86 return la1->loop != la2->loop;
89 int block_attr_cmp(const void *e1, const void *e2, size_t s) {
90 block_attr_t *b1 = (block_attr_t*) e1;
91 block_attr_t *b2 = (block_attr_t*) e2;
93 return b1->block != b2->block;
96 static INLINE int loop_attr_hash(const loop_attr_t *a) {
97 return HASH_PTR(a->loop);
100 static INLINE int block_attr_hash(const block_attr_t *b) {
101 return HASH_PTR(b->block);
104 static INLINE int loop_out_edge_hash(const loop_out_edge_t *e) {
105 return HASH_PTR(e->block) ^ (e->pos * 31);
// Look up the loop_attr_t belonging to `loop` in env->loop_attr_set.
// A temporary key is hashed with loop_attr_hash() and searched with set_find();
// a new entry gets its own out-edge set and a bitset sized by
// get_irg_last_idx(env->irg) that is allocated on the phase obstack.
// NOTE(review): the key initialisation, the "not found" guard around the creation
// code and the return statement are outside this excerpt - confirm in the full file.
108 static INLINE loop_attr_t *get_loop_attr(morgan_env_t *env, ir_loop *loop) {
109 loop_attr_t l_attr, *res;
113 hash = loop_attr_hash(&l_attr);
114 res = set_find(env->loop_attr_set, &l_attr, sizeof(l_attr), hash);
116 // create new loop_attr if none exists yet
// the out_edges set created here is released in free_loop_out_edges()
118 l_attr.out_edges = new_set(loop_out_edge_cmp, 1);
119 l_attr.livethrough_unused = bitset_obstack_alloc(&env->phase.obst, get_irg_last_idx(env->irg));
// set_insert() is given sizeof(l_attr); the returned pointer is used from here on
120 res = set_insert(env->loop_attr_set, &l_attr, sizeof(l_attr), hash);
// Look up the block_attr_t belonging to `block` in env->block_attr_set.
// A temporary key holding the block pointer is hashed with block_attr_hash() and
// searched with set_find(); a new entry gets a bitset sized by
// get_irg_last_idx(env->irg) that is allocated on the phase obstack.
// NOTE(review): the "not found" guard around the creation code and the return
// statement are outside this excerpt - confirm in the full file.
126 static INLINE block_attr_t *get_block_attr(morgan_env_t *env, ir_node *block) {
127 block_attr_t b_attr, *res;
// only the block pointer takes part in hashing and comparison
129 b_attr.block = block;
131 hash = block_attr_hash(&b_attr);
132 res = set_find(env->block_attr_set, &b_attr, sizeof(b_attr), hash);
135 b_attr.livethrough_unused = bitset_obstack_alloc(&env->phase.obst, get_irg_last_idx(env->irg));
136 res = set_insert(env->block_attr_set, &b_attr, sizeof(b_attr), hash);
// Callback handed to be_new_spill_env() in be_spill_morgan(), with NULL as its data argument.
// The body is not part of this excerpt.
142 static int is_mem_phi(const ir_node *node, void *data) {
143 // TODO what is this for?
148 //---------------------------------------------------------------------------
151 * Determine edges going out of a loop (= edges that go to a block that is not inside
152 * the loop or one of its subloops)
// Block walker callback (passed to irg_block_walk_graph()); `e` is the morgan_env_t.
// For every control-flow predecessor of `block` the loop of the predecessor's block
// is compared with the loop of `block`, and a matching edge is inserted into the
// out-edge set of the predecessor's loop.
154 static INLINE void construct_loop_out_edges(ir_node* block, void* e) {
155 morgan_env_t *env = (morgan_env_t*) e;
156 int n_cfgpreds = get_Block_n_cfgpreds(block);
158 ir_loop* loop = get_irn_loop(block);
160 for(i = 0; i < n_cfgpreds; ++i) {
161 ir_node* cfgpred = get_Block_cfgpred(block, i);
162 ir_node* cfgpred_block = get_nodes_block(cfgpred);
163 ir_loop* cfgpred_loop = get_irn_loop(cfgpred_block);
// NOTE(review): this lookup runs before the test below, so an attribute entry is
// requested for every predecessor loop, not only for loops that are actually left.
164 loop_attr_t *outedges = get_loop_attr(env, cfgpred_loop);
// the edge counts as leaving cfgpred_loop when the loops differ and the
// predecessor's loop is nested at least as deep as the loop of `block`
166 if(cfgpred_loop != loop && get_loop_depth(cfgpred_loop) >= get_loop_depth(loop)) {
167 loop_out_edge_t edge;
// NOTE(review): the initialisation of `edge` is not visible in this excerpt
170 set_insert(outedges->out_edges, &edge, sizeof(edge), loop_out_edge_hash(&edge));
175 static void free_loop_out_edges(morgan_env_t *env) {
178 for(l_attr = set_first(env->loop_attr_set); l_attr != NULL; l_attr = set_next(env->loop_attr_set)) {
179 del_set(l_attr->out_edges);
184 * Construct the livethrough unused information for a block
// Fill the livethrough_unused bitset of one block and return it.
// Candidates are taken from the block's liveness information; afterwards every value
// that appears as a use operand of a scheduled instruction in the block is removed.
// The bitset lives in the block's block_attr_t; bit positions are node indices.
// NOTE(review): the statements guarded by the two filter tests in the first loop are
// not visible in this excerpt; presumably they skip the value - confirm.
186 static bitset_t *construct_block_livethrough_unused(morgan_env_t* env, ir_node* block) {
190 block_attr_t *block_attr = get_block_attr(env, block);
193 * This is the first block in a sequence, all variables that are livethrough this block are potential
194 * candidates for livethrough_unused
198 // copy all live-outs into the livethrough_unused set
199 live_foreach(block, li) {
// filter: the value has to be live-in as well as live-out
200 if(!live_is_in(li) || !live_is_out(li))
// filter: the value has to be relevant for the register class being processed
202 if(!arch_irn_consider_in_reg_alloc(env->arch, env->cls, li->irn))
205 node_idx = get_irn_idx(li->irn);
206 bitset_set(block_attr->livethrough_unused, node_idx);
210 * All values that are used within the block are not unused (and therefore not
211 * livethrough_unused)
213 sched_foreach(block, irn) {
214 be_insn_t *insn = be_scan_insn(&env->insn_env, irn);
// operands from use_start up to n_ops are cleared from the candidate set
216 for(i = insn->use_start; i < insn->n_ops; ++i) {
217 const be_operand_t *op = &insn->ops[i];
218 int idx = get_irn_idx(op->irn);
219 bitset_clear(block_attr->livethrough_unused, idx);
223 return block_attr->livethrough_unused;
227 * Debugging help, shows all nodes in a (node-)bitset
// Print every node whose index is set in `bitset`, one per line, through DBG()
// with DBG_LIVE as the second argument.
229 static void show_nodebitset(ir_graph* irg, bitset_t* bitset) {
232 bitset_foreach(bitset, i) {
// bit positions are node indices of `irg`
233 ir_node* node = get_idx_irn(irg, i);
234 DBG((dbg, DBG_LIVE, "\t%+F\n", node));
// Recursively compute the livethrough_unused set of a loop from the sets of its
// elements (blocks and sub-loops), combining them with bitset_copy()/bitset_and().
// Afterwards every value kept for this loop is removed from the sets of its direct
// children, so those values stay recorded in this loop's set only.
// Returns the loop's bitset, which is owned by its loop_attr_t.
// NOTE(review): the case labels and the conditions that choose between the copy and
// the and operation are not visible in this excerpt.
238 static bitset_t *construct_loop_livethrough_unused(morgan_env_t *env, ir_loop *loop) {
240 loop_attr_t* loop_attr = get_loop_attr(env, loop);
242 DBG((dbg, DBG_LIVE, "Processing Loop %d\n", loop->loop_nr));
// a loop without elements is treated as a programming error
243 assert(get_loop_n_elements(loop) > 0);
244 for(i = 0; i < get_loop_n_elements(loop); ++i) {
245 loop_element elem = get_loop_element(loop, i);
246 switch (*elem.kind) {
// element is a block: use the block's own livethrough_unused set
248 bitset_t *livethrough_block_unused;
249 assert(is_Block(elem.node));
250 livethrough_block_unused = construct_block_livethrough_unused(env, elem.node);
252 bitset_copy(loop_attr->livethrough_unused, livethrough_block_unused);
254 bitset_and(loop_attr->livethrough_unused, livethrough_block_unused);
// element is a sub-loop: recurse and use the set computed for it
259 bitset_t *livethrough_son_unused;
261 livethrough_son_unused = construct_loop_livethrough_unused(env, elem.son);
263 bitset_copy(loop_attr->livethrough_unused, livethrough_son_unused);
265 bitset_and(loop_attr->livethrough_unused, livethrough_son_unused);
275 // remove all unused livethroughs that are remembered for this loop from child loops and blocks
276 for(i = 0; i < get_loop_n_elements(loop); ++i) {
277 const loop_element elem = get_loop_element(loop, i);
279 if(*elem.kind == k_ir_loop) {
280 loop_attr_t *son_attr = get_loop_attr(env, elem.son);
281 bitset_andnot(son_attr->livethrough_unused, loop_attr->livethrough_unused);
// NOTE(review): the message prints loop->loop_nr (the parent loop) although the set
// shown next belongs to elem.son - confirm which loop number is intended.
283 DBG((dbg, DBG_LIVE, "Livethroughs for loop %d:\n", loop->loop_nr));
284 show_nodebitset(env->irg, son_attr->livethrough_unused);
285 } else if(*elem.kind == k_ir_node) {
286 block_attr_t *block_attr = get_block_attr(env, elem.node);
287 bitset_andnot(block_attr->livethrough_unused, loop_attr->livethrough_unused);
289 DBG((dbg, DBG_LIVE, "Livethroughs for block %+F\n", elem.node));
290 show_nodebitset(env->irg, block_attr->livethrough_unused);
296 return loop_attr->livethrough_unused;
299 //---------------------------------------------------------------------------
// Determine the maximum register pressure of a block by walking its schedule
// backwards, starting from the live set at the end of the block, and place reloads
// for unused livethrough values of the block when the spills offered by the
// enclosing loops do not suffice.
//
// @param env                          spiller environment
// @param block                        block to process
// @param loop_unused_spills_possible  number of unused-livethrough spills the enclosing loops can provide
// @return number of those loop-level spills this block wants to use: 0 when the
//         pressure fits, at most loop_unused_spills_possible otherwise
301 static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, int loop_unused_spills_possible) {
304 int max_pressure = 0;
306 int loop_unused_spills_needed;
307 block_attr_t *block_attr = get_block_attr(env, block);
308 int block_unused_spills_possible = bitset_popcnt(block_attr->livethrough_unused);
309 int unused_spills_possible = loop_unused_spills_possible + block_unused_spills_possible;
310 pset *live_nodes = pset_new_ptr_default();
// start with the values that are live at the end of the block
312 be_liveness_end_of_block(env->arch, env->cls, block, live_nodes);
313 pressure = pset_count(live_nodes);
315 DBG((dbg, DBG_LIVE, "Reduce pressure to %d In Block %+F:\n", env->registers_available, block));
318 * Walk over all irns in the schedule and check register pressure for each of them
320 sched_foreach_reverse(block, irn) {
321 // do we need more spills than possible with unused livethroughs?
// NOTE(review): this declaration appears to shadow the spills_needed variable that is
// assigned after the walk; its declaration is not visible in this excerpt.
322 int spills_needed = pressure - unused_spills_possible - env->registers_available;
323 if(spills_needed > 0) {
324 DBG((dbg, DBG_PRESSURE, "\tWARNING %d more spills needed at %+F\n", spills_needed, irn));
325 // TODO further spills needed
// remember the highest pressure seen so far
328 if(pressure > max_pressure) {
329 max_pressure = pressure;
332 /* Register pressure is only important until we reach the first phi (the rest of the block
333 * will only be phis.)
340 int pressure_old = pressure;
341 be_liveness_transfer(env->arch, env->cls, irn, live_nodes);
342 pressure = pset_count(live_nodes);
343 DBG((dbg, DBG_PRESSURE, "\tPressure at %+F - before: %d after: %d\n", irn, pressure_old, pressure));
348 * Calculate number of spills from loop_unused_spills_possible that we want to use,
349 * and spill unused livethroughs from the block if we still don't have enough registers
351 spills_needed = max_pressure - env->registers_available;
352 if(spills_needed < 0) {
353 loop_unused_spills_needed = 0;
354 } else if(spills_needed > loop_unused_spills_possible) {
356 int block_unused_spills_needed;
// use everything the loops offer; the rest comes from the block, capped at what the block has
358 loop_unused_spills_needed = loop_unused_spills_possible;
359 block_unused_spills_needed = spills_needed - loop_unused_spills_possible;
360 if(block_unused_spills_needed > block_unused_spills_possible) {
361 block_unused_spills_needed = block_unused_spills_possible;
366 * Spill/Reload unused livethroughs from the block
368 bitset_foreach(block_attr->livethrough_unused, i) {
370 const ir_edge_t *edge;
// `spills` is declared and updated on lines that are not visible in this excerpt
372 if(spills >= block_unused_spills_needed)
375 to_spill = get_idx_irn(env->irg, i);
// a reload is requested on every successor edge of the block
376 foreach_block_succ(block, edge) {
// NOTE(review): the message sits inside the edge loop, so it is printed once per successor edge
377 DBG((dbg, DBG_PRESSURE, "Spilling node %+F around block %+F\n", to_spill, block));
378 be_add_reload_on_edge(env->senv, to_spill, edge->src, edge->pos);
382 loop_unused_spills_needed = spills_needed;
385 del_pset(live_nodes);
387 DBG((dbg, DBG_PRESSURE, "Unused spills for Block %+F needed: %d\n", block, loop_unused_spills_needed));
388 return loop_unused_spills_needed;
392 * Reduce register pressure in a loop
394 * @param outer_spills_possible Number of spills from livethrough_unused variables possible in outer loops
395 * @return Number of spills of livethrough_unused variables needed in outer loops
// Reduce the register pressure in all elements (blocks and sub-loops) of a loop.
// Each element is told how many unused-livethrough spills are available (those of
// outer loops plus those of this loop); the largest number any element asks for
// decides what this loop has to provide itself and what it passes on to its parent.
//
// @param env                    spiller environment
// @param loop                   loop to process
// @param outer_spills_possible  number of unused-livethrough spills possible in outer loops
// @return number of unused-livethrough spills needed from outer loops
397 static int reduce_register_pressure_in_loop(morgan_env_t *env, ir_loop *loop, int outer_spills_possible) {
399 loop_attr_t* loop_attr = get_loop_attr(env, loop);
400 int spills_needed = 0;
401 int spills_possible = outer_spills_possible + bitset_popcnt(loop_attr->livethrough_unused);
402 int outer_spills_needed;
404 DBG((dbg, DBG_PRESSURE, "Reducing Pressure in loop %d\n", loop->loop_nr));
405 for(i = 0; i < get_loop_n_elements(loop); ++i) {
406 loop_element elem = get_loop_element(loop, i);
407 switch (*elem.kind) {
// element is a block
410 assert(is_Block(elem.node));
411 needed = reduce_register_pressure_in_block(env, elem.node, spills_possible);
// an element may never ask for more than it was offered
412 assert(needed <= spills_possible);
413 if(needed > spills_needed)
414 spills_needed = needed;
// element is a sub-loop: recurse
418 int needed = reduce_register_pressure_in_loop(env, elem.son, spills_possible);
419 assert(needed <= spills_possible);
420 if(needed > spills_needed)
421 spills_needed = needed;
430 // calculate number of spills needed in outer loop and spill
431 // unused livethrough nodes around this loop
432 if(spills_needed > outer_spills_possible) {
// outer loops cannot cover the demand: take all they offer, the rest comes from this loop
433 outer_spills_needed = outer_spills_possible;
434 spills_needed -= outer_spills_possible;
// NOTE(review): the visible loop walks every bit of livethrough_unused; a limit to
// spills_needed values is not visible in this excerpt - confirm in the full file.
436 bitset_foreach(loop_attr->livethrough_unused, i) {
437 loop_out_edge_t *edge;
438 ir_node *to_spill = get_idx_irn(env->irg, i);
// request a reload of the value on every edge recorded in this loop's out-edge set
440 for(edge = set_first(loop_attr->out_edges); edge != NULL; edge = set_next(loop_attr->out_edges)) {
441 be_add_reload_on_edge(env->senv, to_spill, edge->block, edge->pos);
// otherwise the whole demand is passed on to the outer loops
445 outer_spills_needed = spills_needed;
448 return outer_spills_needed;
// Callback passed to phase_init() in be_spill_morgan(); its body is not part of this excerpt.
451 static void *init_phase_data(phase_t *phase, ir_node *irn, void *old) {
455 void be_spill_morgan(const be_chordal_env_t *chordal_env) {
458 FIRM_DBG_REGISTER(dbg, "ir.be.spillmorgan");
460 env.arch = chordal_env->birg->main_env->arch_env;
461 env.irg = chordal_env->irg;
462 env.cls = chordal_env->cls;
463 env.senv = be_new_spill_env(chordal_env, is_mem_phi, NULL);
464 DEBUG_ONLY(be_set_spill_env_dbg_module(env.senv, dbg);)
465 env.uses = be_begin_uses(env.irg, env.arch, env.cls);
467 phase_init(&env.phase, "spillmorgan", env.irg, PHASE_DEFAULT_GROWTH, init_phase_data);
469 env.registers_available = arch_count_non_ignore_regs(env.arch, env.cls);
471 be_insn_env_init(&env.insn_env, chordal_env->birg, chordal_env->cls, &env.phase.obst);
473 env.loop_attr_set = new_set(loop_attr_cmp, 5);
474 env.block_attr_set = new_set(block_attr_cmp, 20);
476 /*-- Part1: Analysis --*/
477 be_liveness(env.irg);
479 // construct control flow loop tree
480 construct_cf_backedges(chordal_env->irg);
482 // construct loop out edges and livethrough_unused sets for loops and blocks
483 irg_block_walk_graph(chordal_env->irg, construct_loop_out_edges, NULL, &env);
484 construct_loop_livethrough_unused(&env, get_irg_loop(env.irg));
486 /*-- Part2: Transformation --*/
488 // reduce register pressure to number of available registers
489 reduce_register_pressure_in_loop(&env, get_irg_loop(env.irg), 0);
491 be_insert_spills_reloads(env.senv);
492 if (chordal_env->opts->vrfy_option == BE_CH_VRFY_WARN)
493 be_verify_schedule(env.irg);
494 else if (chordal_env->opts->vrfy_option == BE_CH_VRFY_ASSERT)
495 assert(be_verify_schedule(env.irg));
498 be_end_uses(env.uses);
499 be_dump(env.irg, "-spillmorgan", dump_ir_block_graph_sched);
500 free_loop_out_edges(&env);
501 del_set(env.loop_attr_set);
502 del_set(env.block_attr_set);
504 // fix the remaining places with too high register pressure with beladies algorithm
505 be_remove_dead_nodes_from_schedule(env.irg);
506 be_liveness(env.irg);
507 be_spill_belady_spill_env(chordal_env, env.senv);
509 be_delete_spill_env(env.senv);
510 phase_free(&env.phase);