X-Git-Url: http://nsz.repo.hu/git/?a=blobdiff_plain;f=ir%2Fana%2Fexecution_frequency.c;h=a005f4dcd1fef5c0ac0dcd05e06895c333520968;hb=e775a978fff2841e0722c47f13545b54d48b8f98;hp=e740c0bf0483b46060ad66f53be6c1d9efcdcc1a;hpb=c19953ed6384686c23fb9d720a7cfdda3d443d19;p=libfirm diff --git a/ir/ana/execution_frequency.c b/ir/ana/execution_frequency.c index e740c0bf0..a005f4dcd 100644 --- a/ir/ana/execution_frequency.c +++ b/ir/ana/execution_frequency.c @@ -1,31 +1,48 @@ /* - * Project: libFIRM - * File name: ir/ana/execution_frequency.c - * Purpose: Compute an estimate of basic block executions. - * Author: Goetz Lindenmaier - * Modified by: - * Created: 5.11.2004 - * CVS-ID: $Id$ - * Copyright: (c) 2004 Universität Karlsruhe - * Licence: This file protected by GPL - GNU GENERAL PUBLIC LICENSE. + * Copyright (C) 1995-2008 University of Karlsruhe. All right reserved. + * + * This file is part of libFirm. + * + * This file may be distributed and/or modified under the terms of the + * GNU General Public License version 2 as published by the Free Software + * Foundation and appearing in the file LICENSE.GPL included in the + * packaging of this file. + * + * Licensees holding valid libFirm Professional Edition licenses may use + * this file in accordance with the libFirm Commercial License. + * Agreement provided with the Software. + * + * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE + * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR + * PURPOSE. + */ + +/** + * @file + * @brief Compute an estimate of basic block executions. + * @author Goetz Lindenmaier + * @date 5.11.2004 + * @version $Id$ */ -#ifdef HAVE_CONFIG_H #include "config.h" -#endif #include "execution_frequency.h" -#include "firm_common_t.h" #include "set.h" #include "pdeq.h" +#include "hashptr.h" +#include "error.h" -#include "irprog.h" +#include "irprog_t.h" +#include "irgraph_t.h" #include "irnode_t.h" #include "irloop.h" #include "irgwalk.h" #include "interval_analysis.h" +void set_irp_exec_freq_state(exec_freq_state s); + /*------------------------------------------------------------------*/ /* A hashmap mapping the frequency to block and loop nodes. Block * and loop nodes are regions. */ @@ -40,30 +57,35 @@ typedef struct { /* We use this set for all nodes in all irgraphs. */ static set *exec_freq_set = NULL; -static int exec_freq_cmp(const void *e1, const void *e2, size_t size) { +static int exec_freq_cmp(const void *e1, const void *e2, size_t size) +{ reg_exec_freq *ef1 = (reg_exec_freq *)e1; reg_exec_freq *ef2 = (reg_exec_freq *)e2; + (void) size; + return (ef1->reg != ef2->reg); } -static INLINE unsigned int exec_freq_hash(void *e) { - unsigned int v = (unsigned int) ((reg_exec_freq *)e)->reg; - return v ^ (v>>8); +static inline unsigned int exec_freq_hash(reg_exec_freq *e) +{ + return HASH_PTR(e->reg); } -static INLINE void set_region_exec_freq(void *reg, double freq) { +static inline void set_region_exec_freq(void *reg, double freq) +{ reg_exec_freq ef; ef.reg = reg; ef.freq = freq; set_insert(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); } -INLINE double get_region_exec_freq(void *reg) { +double get_region_exec_freq(void *reg) +{ reg_exec_freq ef, *found; ef.reg = reg; assert(exec_freq_set); - found = set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); + found = (reg_exec_freq*) set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); /* Not found if information is invalid. */ if (found) @@ -73,11 +95,13 @@ INLINE double get_region_exec_freq(void *reg) { } /* Returns the number of times the block is executed. */ -double get_Block_exec_freq(ir_node *b) { +double get_Block_exec_freq(ir_node *b) +{ return get_region_exec_freq((void *)b); } -double get_irn_exec_freq(ir_node *n) { +double get_irn_exec_freq(ir_node *n) +{ if (!is_Block(n)) n = get_nodes_block(n); return get_Block_exec_freq(n); } @@ -107,18 +131,20 @@ static int just_passed_a_Raise = 0; static ir_node *Cond_list = NULL; /* We do not use an extra set, as Projs are not yet in the existing one. */ -void set_ProjX_probability(ir_node *n, Cond_prob prob) { +static void set_ProjX_probability(ir_node *n, Cond_prob prob) +{ reg_exec_freq ef; ef.reg = n; ef.prob = prob; set_insert(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); } -Cond_prob get_ProjX_probability(ir_node *n) { +static Cond_prob get_ProjX_probability(ir_node *n) +{ reg_exec_freq ef, *found; ef.reg = n; - found = set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); + found = (reg_exec_freq*) set_find(exec_freq_set, &ef, sizeof(ef), exec_freq_hash(&ef)); if (found) return (Cond_prob)found->prob; @@ -128,16 +154,16 @@ Cond_prob get_ProjX_probability(ir_node *n) { /* A walker that only visits the nodes we want to see. */ -static void -my_irg_walk_2_both(ir_node *node, irg_walk_func *pre, irg_walk_func *post, void * env) { +static void my_irg_walk_2_both(ir_node *node, irg_walk_func *pre, irg_walk_func *post, void * env) +{ int i; set_irn_visited(node, current_ir_graph->visited); pre(node, env); - if (node->op != op_Block) { + if (!is_Block(node)) { ir_node *pred; - if (node->op == op_Proj) + if (is_Proj(node)) pred = get_irn_n(node, 0); else pred = get_irn_n(node, -1); @@ -149,40 +175,43 @@ my_irg_walk_2_both(ir_node *node, irg_walk_func *pre, irg_walk_func *post, void for (i = get_irn_arity(node) - 1; i >= 0; --i) { ir_node *pred = get_irn_n(node, i); if (pred->visited < current_ir_graph->visited) - my_irg_walk_2_both(pred, pre, post, env); + my_irg_walk_2_both(pred, pre, post, env); } } - if (node->op == op_End) { + if (is_End(node)) { for (i = get_irn_arity(node) - 1; i >= 0; --i) { ir_node *pred = get_irn_n(node, i); if ((pred->op == op_Block) && (pred->visited < current_ir_graph->visited)) - my_irg_walk_2_both(pred, pre, post, env); + my_irg_walk_2_both(pred, pre, post, env); } } post(node, env); } -static void my_irg_walk_current_graph(irg_walk_func *pre, irg_walk_func *post, void *env) { +static void my_irg_walk_current_graph(irg_walk_func *pre, irg_walk_func *post, void *env) +{ inc_irg_visited(current_ir_graph); my_irg_walk_2_both(get_irg_end(current_ir_graph), pre, post, env); } -static void walk_pre(ir_node *n, void *env) { - - if (get_irn_op(n) == op_Raise) +static void walk_pre(ir_node *n, void *env) +{ + (void) env; + if (is_Raise(n)) just_passed_a_Raise = 1; - if ( (get_irn_op(n) == op_Proj) - && (get_irn_op(get_Proj_pred(n)) == op_Cond) - && (just_passed_a_Raise)) { + if (get_irn_op(n) == op_Proj && + is_Cond(get_Proj_pred(n)) && + just_passed_a_Raise) { + ir_node *other_proj; ir_node *c = get_Proj_pred(n); /* If we already visited the other Proj, and it also leads to a Raise, we are in the middle of something. Continue searching. */ assert(get_irn_n_outs(c) == 2 && "encountered a switch cond"); - ir_node *other_proj = get_irn_out(c, 0); + other_proj = get_irn_out(c, 0); if (other_proj == n) other_proj = get_irn_out(c, 1); if (get_ProjX_probability(other_proj) == Cond_prob_exception_taken) { set_ProjX_probability(other_proj, Cond_prob_was_exception_taken); @@ -193,21 +222,23 @@ static void walk_pre(ir_node *n, void *env) { } } - if (get_irn_op(n) == op_Cond) { + if (is_Cond(n)) { set_irn_link(n, Cond_list); Cond_list = n; } } -static void walk_post(ir_node *n, void *env) { - - if (get_irn_op(n) == op_Raise) +static void walk_post(ir_node *n, void *env) +{ + (void) env; + if (is_Raise(n)) just_passed_a_Raise = 0; - if ( (get_irn_op(n) == op_Proj) - && (get_irn_op(get_Proj_pred(n)) == op_Cond) - && ((get_ProjX_probability(n) == Cond_prob_exception_taken) || - (get_ProjX_probability(n) == Cond_prob_was_exception_taken) )) { + if (get_irn_op(n) == op_Proj && + is_Cond(get_Proj_pred(n)) && ( + get_ProjX_probability(n) == Cond_prob_exception_taken || + get_ProjX_probability(n) == Cond_prob_was_exception_taken + )) { just_passed_a_Raise = 1; } } @@ -215,27 +246,32 @@ static void walk_post(ir_node *n, void *env) { /** Precompute which Conds test for an exception. * * Operates on current_ir_graph. */ -void precompute_cond_evaluation(void) { +static void precompute_cond_evaluation(void) +{ ir_node *c; - compute_outs(current_ir_graph); + compute_irg_outs(current_ir_graph); just_passed_a_Raise = 0; Cond_list = NULL; my_irg_walk_current_graph(walk_pre, walk_post, NULL); - for (c = Cond_list; c; c = get_irn_link(c)) { + for (c = Cond_list; c; c = (ir_node*)get_irn_link(c)) { + ir_node *p0, *p1; + assert(get_irn_n_outs(c) == 2 && "encountered a switch cond"); - ir_node *p0 = get_irn_out(c, 0); - ir_node *p1 = get_irn_out(c, 1); + p0 = get_irn_out(c, 0); + p1 = get_irn_out(c, 1); /* both are exceptions */ if ((get_ProjX_probability(p0) == Cond_prob_exception_taken) && - (get_ProjX_probability(p1) == Cond_prob_exception_taken) ) { - assert(0 && "I tried to avoid these!"); + (get_ProjX_probability(p1) == Cond_prob_exception_taken) ) { + panic("I tried to avoid these!"); +#if 0 /* It's a */ set_ProjX_probability(p0, Cond_prob_normal); set_ProjX_probability(p1, Cond_prob_normal); +#endif } /* p0 is exception */ @@ -256,12 +292,13 @@ void precompute_cond_evaluation(void) { } } -int is_fragile_Proj(ir_node *n) { +int is_fragile_Proj(ir_node *n) +{ return is_Proj(n) && (get_ProjX_probability(n) == Cond_prob_exception_taken); } /*------------------------------------------------------------------*/ -/* The algorithm to compute the execution freqencies. +/* The algorithm to compute the execution frequencies. * * Walk the control flow loop tree which we consider the interval * tree. Compute the execution for the lowest loop, add inner loops @@ -271,15 +308,18 @@ int is_fragile_Proj(ir_node *n) { static double exception_prob = 0.001; -static INLINE int is_loop_head(ir_node *cond) { - return false; +static inline int is_loop_head(ir_node *cond) +{ + (void) cond; + return 0; } /** Weight a single region in edge. * * Given all outs of the predecessor region, we can compute the weight of * this single edge. */ -static INLINE double get_weighted_region_exec_freq(void *reg, int pos) { +static inline double get_weighted_region_exec_freq(void *reg, int pos) +{ void *pred_reg = get_region_in(reg, pos); double res, full_freq = get_region_exec_freq (pred_reg); int n_outs = get_region_n_outs (pred_reg); @@ -288,11 +328,11 @@ static INLINE double get_weighted_region_exec_freq(void *reg, int pos) { ir_node *cfop; if (is_ir_node(reg)) { cfop = get_Block_cfgpred((ir_node *)reg, pos); - if (is_Proj(cfop) && (get_irn_op(get_Proj_pred(cfop)) != op_Cond)) + if (is_Proj(cfop) && !is_Cond(get_Proj_pred(cfop))) cfop = skip_Proj(cfop); } else { assert(is_ir_loop(reg)); - cfop = get_loop_cfop(reg, pos); + cfop = (ir_node*)get_loop_cfop(reg, pos); } if (is_fragile_op(cfop) || is_fragile_Proj(cfop)) { @@ -306,12 +346,11 @@ static INLINE double get_weighted_region_exec_freq(void *reg, int pos) { return res; } -static INLINE void compute_region_freqency(void *reg, double head_weight) { +static inline void compute_region_freqency(void *reg, double head_weight) +{ int i, n_ins = get_region_n_ins(reg); double my_freq = 0; - //printf("head weight %lf: ", head_weight); DDMR(reg); - for (i = 0; i < n_ins; ++i) { void *pred_reg = get_region_in(reg, i); if (pred_reg) { @@ -326,15 +365,18 @@ static INLINE void compute_region_freqency(void *reg, double head_weight) { set_region_exec_freq(reg, my_freq); } -static void check_proper_head(ir_loop *l, void *reg) { +static void check_proper_head(ir_loop *l, void *reg) +{ int i, n_ins = get_region_n_ins(reg); + (void) l; for (i = 0; i < n_ins; ++i) { assert(!get_region_in(reg, i)); } } /* Compute the ex freq for current_ir_graph */ -static void compute_frequency(int default_loop_weight) { +static void compute_frequency(int default_loop_weight) +{ ir_loop *outermost_l = get_irg_loop(current_ir_graph); pdeq *block_worklist = new_pdeq1(outermost_l); @@ -344,9 +386,9 @@ static void compute_frequency(int default_loop_weight) { while (!pdeq_empty(block_worklist)) { ir_loop *l = (ir_loop *)pdeq_getl(block_worklist); - int i, n_elems = get_loop_n_elements(l); + size_t i, n_elems = get_loop_n_elements(l); - /* The header is initialized with the freqency of the full loop times the iteration weight. */ + /* The header is initialized with the frequency of the full loop times the iteration weight. */ check_proper_head(l, get_loop_element(l, 0).son); for (i = 0; i < n_elems; ++i) { @@ -364,7 +406,8 @@ static void compute_frequency(int default_loop_weight) { * irg: The graph to be analyzed. * default_loop_weight: The number of executions of a loop. */ -void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double exception_probability) { +void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double exception_probability) +{ ir_graph *rem = current_ir_graph; current_ir_graph = irg; exception_prob = exception_probability; @@ -374,6 +417,10 @@ void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double construct_intervals(current_ir_graph); compute_frequency(default_loop_weight); + set_irg_exec_freq_state(irg, exec_freq_consistent); + if (get_irp_exec_freq_state() == exec_freq_none) + set_irp_exec_freq_state(exec_freq_inconsistent); + /* dump_loop_tree (current_ir_graph, "-execfreq"); dump_ir_block_graph(current_ir_graph, "-execfreq"); @@ -384,16 +431,67 @@ void compute_execution_frequency(ir_graph *irg, int default_loop_weight, double } -void compute_execution_frequencies(int default_loop_weight, double exception_probability) { - int i, n_irgs = get_irp_n_irgs(); +void compute_execution_frequencies(int default_loop_weight, double exception_probability) +{ + size_t i, n_irgs = get_irp_n_irgs(); free_intervals(); for (i = 0; i < n_irgs; ++i) { compute_execution_frequency(get_irp_irg(i), default_loop_weight, exception_probability); } + set_irp_exec_freq_state(exec_freq_consistent); } /** free occupied memory, reset */ -void free_execution_frequency(void) { +void free_execution_frequency(void) +{ + size_t i, n_irgs = get_irp_n_irgs(); free_intervals(); del_set(exec_freq_set); + + for (i = 0; i < n_irgs; ++i) + set_irg_exec_freq_state(get_irp_irg(i), exec_freq_none); + set_irp_exec_freq_state(exec_freq_none); +} + +exec_freq_state get_irg_exec_freq_state(ir_graph *irg) +{ + return irg->execfreq_state; +} +void set_irg_exec_freq_state(ir_graph *irg, exec_freq_state s) +{ + if ((get_irp_exec_freq_state() == exec_freq_consistent && s != exec_freq_consistent) || + (get_irp_exec_freq_state() == exec_freq_none && s != exec_freq_none)) + irp->execfreq_state = exec_freq_inconsistent; + irg->execfreq_state = s; +} + +/* Sets irg and irp exec freq state to inconsistent if it is set to consistent. */ +void set_irg_exec_freq_state_inconsistent(ir_graph *irg) +{ + if (get_irg_exec_freq_state(irg) == exec_freq_consistent) + set_irg_exec_freq_state(irg, exec_freq_inconsistent); +} + +void set_irp_exec_freq_state(exec_freq_state s) +{ + irp->execfreq_state = s; +} + +exec_freq_state get_irp_exec_freq_state(void) +{ + return irp->execfreq_state; +} + +/* Sets irp and all irg exec freq states to inconsistent if it is set to consistent. */ +void set_irp_exec_freq_state_inconsistent(void) +{ + if (get_irp_exec_freq_state() != exec_freq_none) { + size_t i, n_irgs = get_irp_n_irgs(); + set_irp_exec_freq_state(exec_freq_inconsistent); + for (i = 0; i < n_irgs; ++i) { + ir_graph *irg = get_irp_irg(i); + if (get_irg_exec_freq_state(irg) != exec_freq_none) + irg->execfreq_state = exec_freq_inconsistent; + } + } }