X-Git-Url: http://nsz.repo.hu/git/?a=blobdiff_plain;f=ir%2Fana%2Fexecution_frequency.c;h=a005f4dcd1fef5c0ac0dcd05e06895c333520968;hb=e775a978fff2841e0722c47f13545b54d48b8f98;hp=5d42de84498948587a0e1fb1be28006e1040d253;hpb=6c165ecbc0725a21b7f68a31f8624c218e7d1288;p=libfirm diff --git a/ir/ana/execution_frequency.c b/ir/ana/execution_frequency.c index 5d42de844..a005f4dcd 100644 --- a/ir/ana/execution_frequency.c +++ b/ir/ana/execution_frequency.c @@ -1,29 +1,48 @@ /* - * Project: libFIRM - * File name: ir/ana/execution_frequency.c - * Purpose: Compute an estimate of basic block executions. - * Author: Goetz Lindenmaier - * Modified by: - * Created: 5.11.2004 - * CVS-ID: $Id$ - * Copyright: (c) 2004 Universität Karlsruhe - * Licence: This file protected by GPL - GNU GENERAL PUBLIC LICENSE. + * Copyright (C) 1995-2008 University of Karlsruhe. All right reserved. + * + * This file is part of libFirm. + * + * This file may be distributed and/or modified under the terms of the + * GNU General Public License version 2 as published by the Free Software + * Foundation and appearing in the file LICENSE.GPL included in the + * packaging of this file. + * + * Licensees holding valid libFirm Professional Edition licenses may use + * this file in accordance with the libFirm Commercial License. + * Agreement provided with the Software. + * + * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE + * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR + * PURPOSE. + */ + +/** + * @file + * @brief Compute an estimate of basic block executions. + * @author Goetz Lindenmaier + * @date 5.11.2004 + * @version $Id$ */ -#ifdef HAVE_CONFIG_H #include "config.h" -#endif #include "execution_frequency.h" -#include "firm_common_t.h" #include "set.h" #include "pdeq.h" +#include "hashptr.h" +#include "error.h" -#include "irprog.h" +#include "irprog_t.h" +#include "irgraph_t.h" +#include "irnode_t.h" #include "irloop.h" +#include "irgwalk.h" #include "interval_analysis.h" +void set_irp_exec_freq_state(exec_freq_state s); + /*------------------------------------------------------------------*/ /* A hashmap mapping the frequency to block and loop nodes. Block * and loop nodes are regions. */ @@ -32,46 +51,254 @@ typedef struct { void *reg; double freq; + int prob; } reg_exec_freq; /* We use this set for all nodes in all irgraphs. */ static set *exec_freq_set = NULL; -static int exec_freq_cmp(const void *e1, const void *e2, size_t size) { +static int exec_freq_cmp(const void *e1, const void *e2, size_t size) +{ reg_exec_freq *ef1 = (reg_exec_freq *)e1; reg_exec_freq *ef2 = (reg_exec_freq *)e2; + (void) size; + return (ef1->reg != ef2->reg); } -static INLINE unsigned int exec_freq_hash(void *e) { - unsigned int v = (unsigned int) ((reg_exec_freq *)e)->reg; - return v ^ (v>>8); +static inline unsigned int exec_freq_hash(reg_exec_freq *e) +{ + return HASH_PTR(e->reg); } -static INLINE void set_region_exec_freq(void *reg, double freq) { +static inline void set_region_exec_freq(void *reg, double freq) +{ reg_exec_freq ef; ef.reg = reg; ef.freq = freq; set_insert(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); } -INLINE double get_region_exec_freq(void *reg) { +double get_region_exec_freq(void *reg) +{ reg_exec_freq ef, *found; ef.reg = reg; + assert(exec_freq_set); - found = set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); - assert(found); - return found->freq; + found = (reg_exec_freq*) set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); + + /* Not found if information is invalid. */ + if (found) + return found->freq; + else + return 0; } /* Returns the number of times the block is executed. */ -double get_Block_exec_freq(ir_node *b) { +double get_Block_exec_freq(ir_node *b) +{ return get_region_exec_freq((void *)b); } +double get_irn_exec_freq(ir_node *n) +{ + if (!is_Block(n)) n = get_nodes_block(n); + return get_Block_exec_freq(n); +} + +/*------------------------------------------------------------------*/ +/* A algorithm that precomputes whether Conds lead to an exception. + * Computes a field for all Projs from Conds that says the following: + * - The Proj projs from a normal dual Cond with probability 50:50 + * - This Proj of the Cond leads to an exception, i.e., a raise node. + * It is taken with exception probability. + * - The Proj of the Cond avoids an exception. It is taken with + * 1 - exception probability. */ /*------------------------------------------------------------------*/ -/* The algorithm to compute the execution freqencies. + +#include "irouts.h" + +typedef enum { + Cond_prob_none, + Cond_prob_normal, + Cond_prob_avoid_exception, + Cond_prob_exception_taken, + Cond_prob_was_exception_taken, +} Cond_prob; + +static int just_passed_a_Raise = 0; +static ir_node *Cond_list = NULL; + +/* We do not use an extra set, as Projs are not yet in the existing one. */ +static void set_ProjX_probability(ir_node *n, Cond_prob prob) +{ + reg_exec_freq ef; + ef.reg = n; + ef.prob = prob; + set_insert(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); +} + +static Cond_prob get_ProjX_probability(ir_node *n) +{ + reg_exec_freq ef, *found; + ef.reg = n; + + found = (reg_exec_freq*) set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); + + if (found) + return (Cond_prob)found->prob; + else + return Cond_prob_none; +} + +/* A walker that only visits the nodes we want to see. */ + +static void my_irg_walk_2_both(ir_node *node, irg_walk_func *pre, irg_walk_func *post, void * env) +{ + int i; + set_irn_visited(node, current_ir_graph->visited); + + pre(node, env); + + if (!is_Block(node)) { + ir_node *pred; + if (is_Proj(node)) + pred = get_irn_n(node, 0); + else + pred = get_irn_n(node, -1); + if (pred->visited < current_ir_graph->visited) + my_irg_walk_2_both(pred, pre, post, env); + } + + else { /* a Block */ + for (i = get_irn_arity(node) - 1; i >= 0; --i) { + ir_node *pred = get_irn_n(node, i); + if (pred->visited < current_ir_graph->visited) + my_irg_walk_2_both(pred, pre, post, env); + } + } + + if (is_End(node)) { + for (i = get_irn_arity(node) - 1; i >= 0; --i) { + ir_node *pred = get_irn_n(node, i); + if ((pred->op == op_Block) && (pred->visited < current_ir_graph->visited)) + my_irg_walk_2_both(pred, pre, post, env); + } + } + + post(node, env); +} +static void my_irg_walk_current_graph(irg_walk_func *pre, irg_walk_func *post, void *env) +{ + inc_irg_visited(current_ir_graph); + my_irg_walk_2_both(get_irg_end(current_ir_graph), pre, post, env); +} + + +static void walk_pre(ir_node *n, void *env) +{ + (void) env; + if (is_Raise(n)) + just_passed_a_Raise = 1; + + if (get_irn_op(n) == op_Proj && + is_Cond(get_Proj_pred(n)) && + just_passed_a_Raise) { + ir_node *other_proj; + ir_node *c = get_Proj_pred(n); + + /* If we already visited the other Proj, and it also leads to a Raise, + we are in the middle of something. Continue searching. */ + assert(get_irn_n_outs(c) == 2 && "encountered a switch cond"); + other_proj = get_irn_out(c, 0); + if (other_proj == n) other_proj = get_irn_out(c, 1); + if (get_ProjX_probability(other_proj) == Cond_prob_exception_taken) { + set_ProjX_probability(other_proj, Cond_prob_was_exception_taken); + /* Keep searching for the Proj, so keep just_passed_a_Raise. */ + } else { + set_ProjX_probability(n, Cond_prob_exception_taken); + just_passed_a_Raise = 0; + } + } + + if (is_Cond(n)) { + set_irn_link(n, Cond_list); + Cond_list = n; + } +} + +static void walk_post(ir_node *n, void *env) +{ + (void) env; + if (is_Raise(n)) + just_passed_a_Raise = 0; + + if (get_irn_op(n) == op_Proj && + is_Cond(get_Proj_pred(n)) && ( + get_ProjX_probability(n) == Cond_prob_exception_taken || + get_ProjX_probability(n) == Cond_prob_was_exception_taken + )) { + just_passed_a_Raise = 1; + } +} + +/** Precompute which Conds test for an exception. + * + * Operates on current_ir_graph. */ +static void precompute_cond_evaluation(void) +{ + ir_node *c; + + compute_irg_outs(current_ir_graph); + + just_passed_a_Raise = 0; + Cond_list = NULL; + my_irg_walk_current_graph(walk_pre, walk_post, NULL); + + for (c = Cond_list; c; c = (ir_node*)get_irn_link(c)) { + ir_node *p0, *p1; + + assert(get_irn_n_outs(c) == 2 && "encountered a switch cond"); + p0 = get_irn_out(c, 0); + p1 = get_irn_out(c, 1); + + /* both are exceptions */ + if ((get_ProjX_probability(p0) == Cond_prob_exception_taken) && + (get_ProjX_probability(p1) == Cond_prob_exception_taken) ) { + panic("I tried to avoid these!"); +#if 0 + /* It's a */ + set_ProjX_probability(p0, Cond_prob_normal); + set_ProjX_probability(p1, Cond_prob_normal); +#endif + } + + /* p0 is exception */ + else if (get_ProjX_probability(p0) == Cond_prob_exception_taken) { + set_ProjX_probability(p1, Cond_prob_avoid_exception); + } + + /* p1 is exception */ + else if (get_ProjX_probability(p1) == Cond_prob_exception_taken) { + set_ProjX_probability(p0, Cond_prob_avoid_exception); + } + + /* none is exception */ + else { + set_ProjX_probability(p0, Cond_prob_normal); + set_ProjX_probability(p1, Cond_prob_normal); + } + } +} + +int is_fragile_Proj(ir_node *n) +{ + return is_Proj(n) && (get_ProjX_probability(n) == Cond_prob_exception_taken); +} + +/*------------------------------------------------------------------*/ +/* The algorithm to compute the execution frequencies. * * Walk the control flow loop tree which we consider the interval * tree. Compute the execution for the lowest loop, add inner loops @@ -81,25 +308,34 @@ double get_Block_exec_freq(ir_node *b) { static double exception_prob = 0.001; -static INLINE int is_loop_head(ir_node *cond) { - return false; +static inline int is_loop_head(ir_node *cond) +{ + (void) cond; + return 0; } -static INLINE double get_weighted_region_exec_freq(void *reg, int pos) { - void *pred_reg = get_region_in(reg, pos); - double res, full_freq = get_region_exec_freq(pred_reg); - int n_outs = get_region_n_outs (pred_reg); - int n_exc_outs = get_region_n_exc_outs(pred_reg); +/** Weight a single region in edge. + * + * Given all outs of the predecessor region, we can compute the weight of + * this single edge. */ +static inline double get_weighted_region_exec_freq(void *reg, int pos) +{ + void *pred_reg = get_region_in(reg, pos); + double res, full_freq = get_region_exec_freq (pred_reg); + int n_outs = get_region_n_outs (pred_reg); + int n_exc_outs = get_region_n_exc_outs(pred_reg); ir_node *cfop; if (is_ir_node(reg)) { - cfop = skip_Proj(get_Block_cfgpred((ir_node *)reg, pos)); + cfop = get_Block_cfgpred((ir_node *)reg, pos); + if (is_Proj(cfop) && !is_Cond(get_Proj_pred(cfop))) + cfop = skip_Proj(cfop); } else { assert(is_ir_loop(reg)); - cfop = get_loop_cfop(reg, pos); + cfop = (ir_node*)get_loop_cfop(reg, pos); } - if (is_fragile_op(cfop)) { + if (is_fragile_op(cfop) || is_fragile_Proj(cfop)) { res = full_freq * exception_prob; } else { @@ -110,23 +346,17 @@ static INLINE double get_weighted_region_exec_freq(void *reg, int pos) { return res; } -static INLINE void compute_region_freqency(void *reg, double head_weight) { +static inline void compute_region_freqency(void *reg, double head_weight) +{ int i, n_ins = get_region_n_ins(reg); double my_freq = 0; - //printf("head weight %lf: ", head_weight); DDMR(reg); - for (i = 0; i < n_ins; ++i) { void *pred_reg = get_region_in(reg, i); if (pred_reg) { - if (is_ir_node(reg) && get_irn_node_nr((ir_node *)reg) == 50573) - printf(" + %lf", get_weighted_region_exec_freq(reg, i)); my_freq += get_weighted_region_exec_freq(reg, i); } } - if (is_ir_node(reg) && get_irn_node_nr(reg) == 50573) { - printf(" myfreq %lf", my_freq); DDMN((ir_node *)reg); - } if (my_freq == 0.0) { /* All preds are from outer loop. We are a head or so. */ @@ -135,25 +365,30 @@ static INLINE void compute_region_freqency(void *reg, double head_weight) { set_region_exec_freq(reg, my_freq); } -static void check_proper_head(ir_loop *l, void *reg) { +static void check_proper_head(ir_loop *l, void *reg) +{ int i, n_ins = get_region_n_ins(reg); + (void) l; for (i = 0; i < n_ins; ++i) { assert(!get_region_in(reg, i)); } } /* Compute the ex freq for current_ir_graph */ -static void compute_frequency(int default_loop_weight) { +static void compute_frequency(int default_loop_weight) +{ ir_loop *outermost_l = get_irg_loop(current_ir_graph); pdeq *block_worklist = new_pdeq1(outermost_l); - set_region_exec_freq(outermost_l, 1.0/default_loop_weight); /* outermost start is considered a loop head. */ + /* Outermost start is considered a loop head. We will soon multiply + by default_loop_weight. */ + set_region_exec_freq(outermost_l, 1.0/default_loop_weight); while (!pdeq_empty(block_worklist)) { ir_loop *l = (ir_loop *)pdeq_getl(block_worklist); - int i, n_elems = get_loop_n_elements(l); + size_t i, n_elems = get_loop_n_elements(l); - /* The header is initialized with the freqency of the full loop times the iteration weight. */ + /* The header is initialized with the frequency of the full loop times the iteration weight. */ check_proper_head(l, get_loop_element(l, 0).son); for (i = 0; i < n_elems; ++i) { @@ -171,35 +406,92 @@ static void compute_frequency(int default_loop_weight) { * irg: The graph to be analyzed. * default_loop_weight: The number of executions of a loop. */ -void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double exception_probability) { +void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double exception_probability) +{ ir_graph *rem = current_ir_graph; current_ir_graph = irg; exception_prob = exception_probability; if (!exec_freq_set) exec_freq_set = new_set(exec_freq_cmp, 256); + precompute_cond_evaluation(); construct_intervals(current_ir_graph); compute_frequency(default_loop_weight); + set_irg_exec_freq_state(irg, exec_freq_consistent); + if (get_irp_exec_freq_state() == exec_freq_none) + set_irp_exec_freq_state(exec_freq_inconsistent); + /* - dump_loop_tree (current_ir_graph, "-execfreq"); - dump_ir_block_graph(current_ir_graph, "-execfreq"); - dump_interval_graph(current_ir_graph, "-execfreq"); + dump_loop_tree (current_ir_graph, "-execfreq"); + dump_ir_block_graph(current_ir_graph, "-execfreq"); + dump_interval_graph(current_ir_graph, "-execfreq"); */ current_ir_graph = rem; } -void compute_execution_frequencies(int default_loop_weight, double exception_probability) { - int i, n_irgs = get_irp_n_irgs(); +void compute_execution_frequencies(int default_loop_weight, double exception_probability) +{ + size_t i, n_irgs = get_irp_n_irgs(); free_intervals(); for (i = 0; i < n_irgs; ++i) { compute_execution_frequency(get_irp_irg(i), default_loop_weight, exception_probability); } + set_irp_exec_freq_state(exec_freq_consistent); } /** free occupied memory, reset */ -void free_execution_frequency(void) { +void free_execution_frequency(void) +{ + size_t i, n_irgs = get_irp_n_irgs(); free_intervals(); del_set(exec_freq_set); + + for (i = 0; i < n_irgs; ++i) + set_irg_exec_freq_state(get_irp_irg(i), exec_freq_none); + set_irp_exec_freq_state(exec_freq_none); +} + +exec_freq_state get_irg_exec_freq_state(ir_graph *irg) +{ + return irg->execfreq_state; +} +void set_irg_exec_freq_state(ir_graph *irg, exec_freq_state s) +{ + if ((get_irp_exec_freq_state() == exec_freq_consistent && s != exec_freq_consistent) || + (get_irp_exec_freq_state() == exec_freq_none && s != exec_freq_none)) + irp->execfreq_state = exec_freq_inconsistent; + irg->execfreq_state = s; +} + +/* Sets irg and irp exec freq state to inconsistent if it is set to consistent. */ +void set_irg_exec_freq_state_inconsistent(ir_graph *irg) +{ + if (get_irg_exec_freq_state(irg) == exec_freq_consistent) + set_irg_exec_freq_state(irg, exec_freq_inconsistent); +} + +void set_irp_exec_freq_state(exec_freq_state s) +{ + irp->execfreq_state = s; +} + +exec_freq_state get_irp_exec_freq_state(void) +{ + return irp->execfreq_state; +} + +/* Sets irp and all irg exec freq states to inconsistent if it is set to consistent. */ +void set_irp_exec_freq_state_inconsistent(void) +{ + if (get_irp_exec_freq_state() != exec_freq_none) { + size_t i, n_irgs = get_irp_n_irgs(); + set_irp_exec_freq_state(exec_freq_inconsistent); + for (i = 0; i < n_irgs; ++i) { + ir_graph *irg = get_irp_irg(i); + if (get_irg_exec_freq_state(irg) != exec_freq_none) + irg->execfreq_state = exec_freq_inconsistent; + } + } }