X-Git-Url: http://nsz.repo.hu/git/?a=blobdiff_plain;f=ir%2Fbe%2Fbespillmorgan.c;h=cdb5ca7897128a176179f08a86a7172a811cb50d;hb=6ae2d84d2d3e245249b5a9baec13895838d22b64;hp=1656645062b110dd951e0b0466aa891b3bb44f22;hpb=f436f72951577e35b60e0ea1f2e6a536e4f479bb;p=libfirm diff --git a/ir/be/bespillmorgan.c b/ir/be/bespillmorgan.c index 165664506..cdb5ca789 100644 --- a/ir/be/bespillmorgan.c +++ b/ir/be/bespillmorgan.c @@ -2,7 +2,7 @@ * Author: Matthias Braun * Date: 05.05.2006 * Copyright: (c) Universitaet Karlsruhe - * License: This file protected by GPL - GNU GENERAL PUBLIC LICENSE. + * License: This file is protected by GPL - GNU GENERAL PUBLIC LICENSE. * */ #ifdef HAVE_CONFIG_H @@ -11,82 +11,75 @@ #include "bespillmorgan.h" -#include "bechordal.h" #include "bechordal_t.h" #include "bespill.h" -#include "belive.h" #include "belive_t.h" -#include "beinsn_t.h" #include "irgwalk.h" #include "besched.h" #include "beutil.h" -#include "beuses.h" -#include "interval_analysis.h" -#include "irloop.h" #include "irloop_t.h" -#include "irgraph.h" #include "irgraph_t.h" -#include "irphase.h" -#include "irphase_t.h" #include "irprintf.h" +#include "obstack.h" -// remove me later #include "bespillbelady.h" +#include "beverify.h" #define DBG_LIVE 1 -#define DBG_PRESSURE 2 +#define DBG_LOOPANA 2 +#define DBG_PRESSURE 4 DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;) -typedef struct _morgan_env_t { +typedef struct morgan_env { const arch_env_t *arch; const arch_register_class_t *cls; ir_graph *irg; - phase_t phase; - // maximum safe register pressure + struct obstack obst; + /** maximum safe register pressure */ int registers_available; - be_insn_env_t insn_env; spill_env_t *senv; - be_uses_t *uses; set *loop_attr_set; set *block_attr_set; } morgan_env_t; -typedef struct _loop_out_edge_t { +typedef struct loop_edge { ir_node *block; int pos; -} loop_out_edge_t; +} loop_edge_t; -typedef struct _loop_attr_t { - ir_loop *loop; +typedef struct loop_attr { + const ir_loop *loop; set *out_edges; - /// The set of all values that live through the loop and are not used + set *in_edges; + /** The set of all values that are live in the loop but not used in the loop */ bitset_t *livethrough_unused; } loop_attr_t; -typedef struct _block_attr_t { - ir_node *block; +typedef struct block_attr { + const ir_node *block; + /** set of all values that are live in the block but not used in the block */ bitset_t *livethrough_unused; } block_attr_t; //--------------------------------------------------------------------------- -int loop_out_edge_cmp(const void* p1, const void* p2, size_t s) { - loop_out_edge_t *e1 = (loop_out_edge_t*) p1; - loop_out_edge_t *e2 = (loop_out_edge_t*) p2; +static int loop_edge_cmp(const void* p1, const void* p2, size_t s) { + loop_edge_t *e1 = (loop_edge_t*) p1; + loop_edge_t *e2 = (loop_edge_t*) p2; return e1->block != e2->block || e1->pos != e2->pos; } -int loop_attr_cmp(const void *e1, const void *e2, size_t s) { +static int loop_attr_cmp(const void *e1, const void *e2, size_t s) { loop_attr_t *la1 = (loop_attr_t*) e1; loop_attr_t *la2 = (loop_attr_t*) e2; return la1->loop != la2->loop; } -int block_attr_cmp(const void *e1, const void *e2, size_t s) { +static int block_attr_cmp(const void *e1, const void *e2, size_t s) { block_attr_t *b1 = (block_attr_t*) e1; block_attr_t *b2 = (block_attr_t*) e2; @@ -101,11 +94,11 @@ static INLINE int block_attr_hash(const block_attr_t *b) { return HASH_PTR(b->block); } -static INLINE int loop_out_edge_hash(const loop_out_edge_t *e) { +static INLINE int loop_edge_hash(const loop_edge_t *e) { return HASH_PTR(e->block) ^ (e->pos * 31); } -static INLINE loop_attr_t *get_loop_attr(morgan_env_t *env, ir_loop *loop) { +static INLINE loop_attr_t *get_loop_attr(morgan_env_t *env, const ir_loop *loop) { loop_attr_t l_attr, *res; int hash; l_attr.loop = loop; @@ -114,16 +107,17 @@ static INLINE loop_attr_t *get_loop_attr(morgan_env_t *env, ir_loop *loop) { res = set_find(env->loop_attr_set, &l_attr, sizeof(l_attr), hash); // create new loop_attr if none exists yet - if (!res) { - l_attr.out_edges = new_set(loop_out_edge_cmp, 1); - l_attr.livethrough_unused = bitset_obstack_alloc(&env->phase.obst, get_irg_last_idx(env->irg)); + if (res == NULL) { + l_attr.out_edges = new_set(loop_edge_cmp, 1); + l_attr.in_edges = new_set(loop_edge_cmp, 1); + l_attr.livethrough_unused = bitset_obstack_alloc(&env->obst, get_irg_last_idx(env->irg)); res = set_insert(env->loop_attr_set, &l_attr, sizeof(l_attr), hash); } return res; } -static INLINE block_attr_t *get_block_attr(morgan_env_t *env, ir_node *block) { +static INLINE block_attr_t *get_block_attr(morgan_env_t *env, const ir_node *block) { block_attr_t b_attr, *res; int hash; b_attr.block = block; @@ -131,30 +125,34 @@ static INLINE block_attr_t *get_block_attr(morgan_env_t *env, ir_node *block) { hash = block_attr_hash(&b_attr); res = set_find(env->block_attr_set, &b_attr, sizeof(b_attr), hash); - if(!res) { - b_attr.livethrough_unused = bitset_obstack_alloc(&env->phase.obst, get_irg_last_idx(env->irg)); + if(res == NULL) { + b_attr.livethrough_unused = bitset_obstack_alloc(&env->obst, get_irg_last_idx(env->irg)); res = set_insert(env->block_attr_set, &b_attr, sizeof(b_attr), hash); } return res; } -static int is_mem_phi(const ir_node *irn, void *data) { - // TODO what is this for? - return 0; -} - //--------------------------------------------------------------------------- +static INLINE int consider_for_spilling(const arch_env_t *env, const arch_register_class_t *cls, const ir_node *node) { + if(!arch_irn_has_reg_class(env, node, -1, cls)) + return 0; + + return !(arch_irn_get_flags(env, node) & (arch_irn_flags_ignore | arch_irn_flags_dont_spill)); +} + /** * Determine edges going out of a loop (= edges that go to a block that is not inside * the loop or one of its subloops) */ -static INLINE void construct_loop_out_edges(ir_node* block, void* e) { +static INLINE void construct_loop_edges(ir_node* block, void* e) { morgan_env_t *env = (morgan_env_t*) e; int n_cfgpreds = get_Block_n_cfgpreds(block); int i; ir_loop* loop = get_irn_loop(block); + loop_attr_t *loop_attr = get_loop_attr(env, loop); + DBG((dbg, DBG_LOOPANA, "Loop for %+F: %d (depth %d)\n", block, loop->loop_nr, loop->depth)); for(i = 0; i < n_cfgpreds; ++i) { ir_node* cfgpred = get_Block_cfgpred(block, i); @@ -162,35 +160,95 @@ static INLINE void construct_loop_out_edges(ir_node* block, void* e) { ir_loop* cfgpred_loop = get_irn_loop(cfgpred_block); loop_attr_t *outedges = get_loop_attr(env, cfgpred_loop); - if(cfgpred_loop != loop && get_loop_depth(cfgpred_loop) >= get_loop_depth(loop)) { - loop_out_edge_t edge; + if(cfgpred_loop == loop) + continue; + + // is it an edge into the loop? + if(get_loop_depth(loop) > get_loop_depth(cfgpred_loop)) { + loop_edge_t edge; + edge.block = block; + edge.pos = i; + DBG((dbg, DBG_LOOPANA, "Loop in edge from %+F (loop %d) to %+F (loop %d)\n", cfgpred_block, get_loop_loop_nr(cfgpred_loop), block, get_loop_loop_nr(loop))); + set_insert(loop_attr->in_edges, &edge, sizeof(edge), loop_edge_hash(&edge)); + } else { + ir_loop *p_loop = cfgpred_loop; + while(get_loop_depth(p_loop) > get_loop_depth(loop)) { + p_loop = get_loop_outer_loop(p_loop); + } + if(p_loop != loop) { + loop_edge_t edge; + edge.block = block; + edge.pos = i; + DBG((dbg, DBG_LOOPANA, "Loop in edge from %+F (loop %d) to %+F (loop %d)\n", cfgpred_block, get_loop_loop_nr(cfgpred_loop), block, get_loop_loop_nr(loop))); + set_insert(loop_attr->in_edges, &edge, sizeof(edge), loop_edge_hash(&edge)); + } + } + + // an edge out of the loop? + if(get_loop_depth(cfgpred_loop) >= get_loop_depth(loop)) { + loop_edge_t edge; edge.block = block; edge.pos = i; - set_insert(outedges->out_edges, &edge, sizeof(edge), loop_out_edge_hash(&edge)); + DBG((dbg, DBG_LOOPANA, "Loop out edge from %+F (loop %d) to %+F\n", cfgpred_block, cfgpred_loop->loop_nr, block)); + set_insert(outedges->out_edges, &edge, sizeof(edge), loop_edge_hash(&edge)); + } else { + ir_loop *o_loop = loop; + + // we might jump in the middle of another inner loop which is not inside + // our loop (happens for irreducible graphs). This would be a + // real out edge then. + while(get_loop_depth(o_loop) > get_loop_depth(cfgpred_loop)) { + o_loop = get_loop_outer_loop(o_loop); + } + + if(cfgpred_loop != o_loop) { + loop_edge_t edge; + edge.block = block; + edge.pos = i; + DBG((dbg, DBG_LOOPANA, "Loop out edge from %+F (loop %d) to %+F (into jump)\n", cfgpred_block, cfgpred_loop->loop_nr, block)); + set_insert(outedges->out_edges, &edge, sizeof(edge), loop_edge_hash(&edge)); + } } } } +static void free_loop_edges(morgan_env_t *env) { + loop_attr_t *l_attr; + + for(l_attr = set_first(env->loop_attr_set); l_attr != NULL; l_attr = set_next(env->loop_attr_set)) { + del_set(l_attr->out_edges); + del_set(l_attr->in_edges); + } +} + /** - * Construct the livethrough unused information for a block + * Debugging help, shows all nodes in a (node-)bitset */ -static bitset_t *construct_block_livethrough_unused(morgan_env_t* env, ir_node* block) { +static void show_nodebitset(ir_graph* irg, const bitset_t* bitset) { int i; - int node_idx; - ir_node *irn; - block_attr_t *block_attr = get_block_attr(env, block); - /* - * This is the first block in a sequence, all variables that are livethrough this block are potential - * candidates for livethrough_unused - */ + bitset_foreach(bitset, i) { + ir_node* node = get_idx_irn(irg, i); + DBG((dbg, DBG_LIVE, "\t%+F\n", node)); + } +} + +/** + * Construct the livethrough unused set for a block + */ +static bitset_t *construct_block_livethrough_unused(morgan_env_t* env, const ir_node* block) { + block_attr_t *block_attr = get_block_attr(env, block); irn_live_t *li; + ir_node *node; + DBG((dbg, DBG_LIVE, "Processing block %d\n", get_irn_node_nr(block))); // copy all live-outs into the livethrough_unused set live_foreach(block, li) { + int node_idx; + if(!live_is_in(li) || !live_is_out(li)) continue; - if(!arch_irn_consider_in_reg_alloc(env->arch, env->cls, li->irn)) + if(!consider_for_spilling(env->arch, env->cls, li->irn)) continue; node_idx = get_irn_idx(li->irn); @@ -201,32 +259,23 @@ static bitset_t *construct_block_livethrough_unused(morgan_env_t* env, ir_node* * All values that are used within the block are not unused (and therefore not * livethrough_unused) */ - sched_foreach(block, irn) { - be_insn_t *insn = be_scan_insn(&env->insn_env, irn); + sched_foreach(block, node) { + int i, arity; - for(i = insn->use_start; i < insn->n_ops; ++i) { - const be_operand_t *op = &insn->ops[i]; - int idx = get_irn_idx(op->irn); + for(i = 0, arity = get_irn_arity(node); i < arity; ++i) { + int idx = get_irn_idx(get_irn_n(node, i)); bitset_clear(block_attr->livethrough_unused, idx); } } + show_nodebitset(env->irg, block_attr->livethrough_unused); return block_attr->livethrough_unused; } /** - * Debugging help, shows all nodes in a (node-)bitset + * Construct the livethrough unused set for a loop (and all its subloops+blocks) */ -static void show_nodebitset(ir_graph* irg, bitset_t* bitset) { - int i; - - bitset_foreach(bitset, i) { - ir_node* node = get_idx_irn(irg, i); - DBG((dbg, DBG_LIVE, "\t%+F\n", node)); - } -} - -static bitset_t *construct_loop_livethrough_unused(morgan_env_t *env, ir_loop *loop) { +static bitset_t *construct_loop_livethrough_unused(morgan_env_t *env, const ir_loop *loop) { int i; loop_attr_t* loop_attr = get_loop_attr(env, loop); @@ -262,6 +311,7 @@ static bitset_t *construct_loop_livethrough_unused(morgan_env_t *env, ir_loop *l break; } } + DBG((dbg, DBG_LIVE, "Done with loop %d\n", loop->loop_nr)); // remove all unused livethroughs that are remembered for this loop from child loops and blocks for(i = 0; i < get_loop_n_elements(loop); ++i) { @@ -287,9 +337,9 @@ static bitset_t *construct_loop_livethrough_unused(morgan_env_t *env, ir_loop *l return loop_attr->livethrough_unused; } -//--------------------------------------------------------------------------- +/*---------------------------------------------------------------------------*/ -static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, int loop_unused_spills_possible) { +static int reduce_register_pressure_in_block(morgan_env_t *env, const ir_node* block, int loop_unused_spills_possible) { int pressure; ir_node *irn; int max_pressure = 0; @@ -310,7 +360,7 @@ static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, */ sched_foreach_reverse(block, irn) { // do we need more spills than possible with unused libethroughs? - int spills_needed = pressure - unused_spills_possible - env->registers_available; + int spills_needed = pressure - env->registers_available - unused_spills_possible; if(spills_needed > 0) { DBG((dbg, DBG_PRESSURE, "\tWARNING %d more spills needed at %+F\n", spills_needed, irn)); // TODO further spills needed @@ -327,14 +377,12 @@ static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, break; // update pressure - { - int pressure_old = pressure; - be_liveness_transfer(env->arch, env->cls, irn, live_nodes); - pressure = pset_count(live_nodes); - DBG((dbg, DBG_PRESSURE, "\tPressure at %+F - before: %d after: %d\n", irn, pressure_old, pressure)); - } + be_liveness_transfer(env->arch, env->cls, irn, live_nodes); + pressure = pset_count(live_nodes); } + DBG((dbg, DBG_PRESSURE, "\tMax Pressure in %+F: %d\n", block, max_pressure)); + /* * Calculate number of spills from loop_unused_spills_possible that we want to use, * and spill unused livethroughs from the block if we still don't have enough registers @@ -368,6 +416,7 @@ static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, DBG((dbg, DBG_PRESSURE, "Spilling node %+F around block %+F\n", to_spill, block)); be_add_reload_on_edge(env->senv, to_spill, edge->src, edge->pos); } + spills++; } } else { loop_unused_spills_needed = spills_needed; @@ -385,7 +434,7 @@ static int reduce_register_pressure_in_block(morgan_env_t *env, ir_node* block, * @param unused_spills_possible Number of spills from livethrough_unused variables possible in outer loops * @return Number of spills of livethrough_unused variables needed in outer loops */ -static int reduce_register_pressure_in_loop(morgan_env_t *env, ir_loop *loop, int outer_spills_possible) { +static int reduce_register_pressure_in_loop(morgan_env_t *env, const ir_loop *loop, int outer_spills_possible) { int i; loop_attr_t* loop_attr = get_loop_attr(env, loop); int spills_needed = 0; @@ -418,19 +467,29 @@ static int reduce_register_pressure_in_loop(morgan_env_t *env, ir_loop *loop, in } } - // calculate number of spills needed in outer loop and spill - // unused livethrough nodes around this loop + /* calculate number of spills needed in outer loop and spill + * unused livethrough nodes around this loop + */ if(spills_needed > outer_spills_possible) { + int spills_to_place; outer_spills_needed = outer_spills_possible; spills_needed -= outer_spills_possible; + spills_to_place = spills_needed; + bitset_foreach(loop_attr->livethrough_unused, i) { - loop_out_edge_t *edge; + loop_edge_t *edge; ir_node *to_spill = get_idx_irn(env->irg, i); for(edge = set_first(loop_attr->out_edges); edge != NULL; edge = set_next(loop_attr->out_edges)) { + DBG((dbg, DBG_PRESSURE, "Spilling node %+F around loop %d\n", to_spill, loop->loop_nr)); be_add_reload_on_edge(env->senv, to_spill, edge->block, edge->pos); } + + spills_to_place--; + if(spills_to_place <= 0) { + break; + } } } else { outer_spills_needed = spills_needed; @@ -439,143 +498,70 @@ static int reduce_register_pressure_in_loop(morgan_env_t *env, ir_loop *loop, in return outer_spills_needed; } -static void *init_phase_data(phase_t *phase, ir_node *irn, void *old) { - return old; -} - -typedef struct _liveness_dump_env_t { - const be_chordal_env_t *chordal_env; - FILE *f; -} liveness_dump_env_t; - -/** - * Pre-walker: dump liveness data to a file - */ -static void dump_liveness_walker(ir_node *bl, void *data) -{ - liveness_dump_env_t *env = (liveness_dump_env_t*) data; - FILE *f = env->f; - const irn_live_t *li; - ir_node* irn; - int in = 0, end = 0, out = 0; - int max_pressure = 0; - pset *live_nodes; - - // collect some statistics - live_foreach(bl, li) { - const ir_node* irn = li->irn; - if(!arch_irn_consider_in_reg_alloc(env->chordal_env->birg->main_env->arch_env, env->chordal_env->cls, irn)) - continue; - - if(live_is_in(li)) - in++; - if(live_is_end(li)) - end++; - if(live_is_out(li)) - out++; - } - - // collect register pressure info - live_nodes = pset_new_ptr_default(); - be_liveness_end_of_block(env->chordal_env->birg->main_env->arch_env, env->chordal_env->cls, bl, live_nodes); - max_pressure = pset_count(live_nodes); - sched_foreach_reverse(bl, irn) { - int pressure; - - if(is_Phi(irn)) - break; - - be_liveness_transfer(env->chordal_env->birg->main_env->arch_env, env->chordal_env->cls, irn, live_nodes); - pressure = pset_count(live_nodes); - if(pressure > max_pressure) - max_pressure = pressure; - } - del_pset(live_nodes); - - ir_fprintf(f, "%+20F (%d in) (%d end) (%d out) (max_pressure %d)\n", bl, in, end, out, max_pressure); - live_foreach(bl, li) { - const ir_node* irn = li->irn; - if(!arch_irn_consider_in_reg_alloc(env->chordal_env->birg->main_env->arch_env, env->chordal_env->cls, irn)) - continue; - - ir_fprintf(f, "\t%+30F %4s %4s %4s\n", - irn, - live_is_in(li) ? "in" : "", - live_is_end(li) ? "end" : "", - live_is_out(li) ? "out" : ""); - } -} - -static void dump_liveness_info(const be_chordal_env_t *chordal_env, const char* name) { - char buf[128]; - liveness_dump_env_t env; - - env.chordal_env = chordal_env; - ir_snprintf(buf, sizeof(buf), "%F_%s_%s-live.txt", chordal_env->irg, chordal_env->cls->name, name); - env.f = fopen(buf, "wt"); - if(env.f == NULL) - return; - - irg_block_walk_graph(chordal_env->irg, dump_liveness_walker, NULL, &env); - fclose(env.f); -} - - void be_spill_morgan(const be_chordal_env_t *chordal_env) { morgan_env_t env; FIRM_DBG_REGISTER(dbg, "ir.be.spillmorgan"); - //firm_dbg_set_mask(dbg, DBG_LIVE | DBG_PRESSURE); + //firm_dbg_set_mask(dbg, DBG_LOOPANA | DBG_PRESSURE); env.arch = chordal_env->birg->main_env->arch_env; env.irg = chordal_env->irg; env.cls = chordal_env->cls; - env.senv = be_new_spill_env(chordal_env, is_mem_phi, NULL); + env.senv = be_new_spill_env(chordal_env); DEBUG_ONLY(be_set_spill_env_dbg_module(env.senv, dbg);) - env.uses = be_begin_uses(env.irg, env.arch, env.cls); - phase_init(&env.phase, "spillmorgan", env.irg, PHASE_DEFAULT_GROWTH, init_phase_data); + obstack_init(&env.obst); env.registers_available = arch_count_non_ignore_regs(env.arch, env.cls); - be_insn_env_init(&env.insn_env, chordal_env->birg, chordal_env->cls, &env.phase.obst); - env.loop_attr_set = new_set(loop_attr_cmp, 5); env.block_attr_set = new_set(block_attr_cmp, 20); - /*-- Part1: Analysis --*/ be_liveness(env.irg); - // construct control flow loop tree + /* construct control flow loop tree */ construct_cf_backedges(chordal_env->irg); - // construct loop out edges and livethrough_unused sets for loops and blocks - irg_block_walk_graph(chordal_env->irg, construct_loop_out_edges, NULL, &env); + /* construct loop out edges and livethrough_unused sets for loops and blocks */ + irg_block_walk_graph(chordal_env->irg, NULL, construct_loop_edges, &env); construct_loop_livethrough_unused(&env, get_irg_loop(env.irg)); /*-- Part2: Transformation --*/ - // reduce register pressure to number of available registers + /* spill unused livethrough values around loops and blocks where + * the pressure is too high + */ reduce_register_pressure_in_loop(&env, get_irg_loop(env.irg), 0); - be_insert_spills_reloads(env.senv, NULL); + /* Place copies for spilled phis */ + be_place_copies(env.senv); + /* Insert real spill/reload nodes and fix usages */ + be_insert_spills_reloads(env.senv); - // cleanup - be_end_uses(env.uses); - be_dump(env.irg, "-spillmorgan", dump_ir_block_graph_sched); + /* Verify the result */ + if (chordal_env->opts->vrfy_option == BE_CH_VRFY_WARN) { + be_verify_schedule(env.irg); + } else if (chordal_env->opts->vrfy_option == BE_CH_VRFY_ASSERT) { + assert(be_verify_schedule(env.irg)); + } + + if (chordal_env->opts->dump_flags & BE_CH_DUMP_SPILL) + be_dump(env.irg, "-spillmorgan", dump_ir_block_graph_sched); + + /* cleanup */ + free_loop_edges(&env); del_set(env.loop_attr_set); del_set(env.block_attr_set); + /* fix the remaining places with too high register pressure with beladies algorithm */ + + /* we have to remove dead nodes from schedule to not confuse liveness calculation */ + be_remove_dead_nodes_from_schedule(env.irg); be_liveness(env.irg); - dump_liveness_info(chordal_env, "spillmorgan"); - // fix the remaining places with too high register pressure with beladies algorithm be_spill_belady_spill_env(chordal_env, env.senv); - be_liveness(env.irg); - dump_liveness_info(chordal_env, "spillcomplete"); - be_delete_spill_env(env.senv); - phase_free(&env.phase); + obstack_free(&env.obst, NULL); }