nsz Git - libfirm/blob - include/libfirm/iroptimize.h

   1 /*
   2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
   3  *
   4  * This file is part of libFirm.
   5  *
   6  * This file may be distributed and/or modified under the terms of the
   7  * GNU General Public License version 2 as published by the Free Software
   8  * Foundation and appearing in the file LICENSE.GPL included in the
   9  * packaging of this file.
  10  *
  11  * Licensees holding valid libFirm Professional Edition licenses may use
  12  * this file in accordance with the libFirm Commercial License.
  13  * Agreement provided with the Software.
  14  *
  15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  17  * PURPOSE.
  18  */
  19
  20 /**
  21  * @file
  22  * @brief   Available Optimisations of libFirm.
  23  * @version $Id: cfopt.h 13543 2007-04-29 19:29:02Z beck $
  24  */
  25 #ifndef FIRM_IROPTIMIZE_H
  26 #define FIRM_IROPTIMIZE_H
  27
  28 #include "firm_types.h"
  29
  30 /**
  31  * Control flow optimization.
  32  *
  33  * Removes empty blocks, doing if simplifications and loop simplifications.
  34  * A block is empty if it contains only a Jmp node and Phi nodes.
  35  * Merges single entry single exit blocks with their predecessor
  36  * and propagates dead control flow by calling equivalent_node().
  37  * Independent of compiler flags, it removes Tuples from cf edges,
  38  * Bad predecessors from Blocks and Phis, and unnecessary predecessors of End.
  39  *
  40  * @bug So far destroys backedge information.
  41  * @bug Chokes on Id nodes if called in a certain order with other
  42  *      optimizations.  Call local_optimize_graph() before to remove
  43  *      Ids.
  44  */
  45 void optimize_cf(ir_graph *irg);
  46
  47 /**
  48  * Performs partial conditional evaluation on the given graph.
  49  *
  50  * @param irg  the graph to optimize
  51  */
  52 void opt_cond_eval(ir_graph* irg);
  53
  54 /**
  55  * Tries to simplify boolean expressions in the given IR graph,
  56  * e.g. x < 5 && x < 6 becomes x < 5.
  57  *
  58  * @param irg  the graph
  59  */
  60 void opt_bool(ir_graph *irg);
  61
  62 /**
  63  * Tries to reduce the number of Conv nodes in the given IR graph.
  64  *
  65  * @param irg  the graph
  66  */
  67 void conv_opt(ir_graph *irg);
  68
  69 /**
  70  * Do the scalar replacement optimization.
  71  * Performs a data flow analysis and splits the
  72  * data flow edges.
  73  *
  74  * @param irg  the graph which should be optimized
  75  */
  76 void data_flow_scalar_replacement_opt(ir_graph *irg);
  77
  78 /**
  79  * A callback that checks whether an entity is an allocation
  80  * routine.
  81  */
  82 typedef int (*check_alloc_entity_func)(ir_entity *ent);
  83
  84 /**
  85  * Do simple and fast escape analysis for one graph.
  86  *
  87  * @param irg       the graph
  88  * @param callback  a callback function to check whether a
  89  *                  given entity is an allocation call
  90  */
  91 void escape_enalysis_irg(ir_graph *irg, check_alloc_entity_func callback);
  92
  93 /**
  94  * Do simple and fast escape analysis for all graphs.
  95  *
  96  * This optimization implements a simple and fast but inexact
  97  * escape analysis. Some addresses might be marked as 'escaped' even
  98  * if they are not.
  99  * The advantage is a low memory footprint and fast speed.
 100  *
 101  * @param run_scalar_replace  if this flag is non-zero, scalar
 102  *                            replacement optimization is run on graphs with removed
 103  *                            allocations
 104  * @param callback            a callback function to check whether a
 105  *                            given entity is an allocation call
 106  *
 107  * This optimization removes allocations which are not used (rare) and replaces
 108  * allocations that can be proved dead at the end of the graph with stack variables.
 109  *
 110  * The creation of stack variables allows scalar replacement to be run only
 111  * on those graphs that have been changed.
 112  *
 113  * This is most effective on Java where no other stack variables exist.
 114  */
 115 void escape_analysis(int run_scalar_replace, check_alloc_entity_func callback);
 116
 117 /**
 118  * Optimize function calls by handling const functions.
 119  *
 120  * This optimization first detects all "const functions", i.e.,
 121  * IR graphs that neither read nor write memory (and hence do
 122  * not create exceptions, as these use memory in Firm).
 123  *
 124  * The result of calls to such functions depends only on its
 125  * arguments, hence those calls are no longer pinned.
 126  *
 127  * This is a rather strong criterion, so do not expect that a
 128  * lot of functions will be found. Moreover, all of them might
 129  * already be inlined if inlining is activated.
 130  * Anyway, it might be good for handling builtins or pseudo-graphs,
 131  * even if the latter read/write memory (but we know how).
 132  *
 133  * This optimization reads the irg_const_function property of
 134  * entities and sets the irg_const_function property of
 135  * graphs.
 136  *
 137  * If callee information is valid, we also optimize polymorphic Calls.
 138  *
 139  * @param force_run  if non-zero, an optimization run is started even
 140  *                   if no const function graph was detected.
 141  *                   Else calls are only optimized if at least one
 142  *                   const function graph was detected.
 143  * @param callback   a callback function to check whether a
 144  *                   given entity is an allocation call
 145  *
 146  * If the frontend created external entities with the irg_const_function
 147  * property set, the force_run parameter should be set, else it
 148  * should be unset.
 149  *
 150  * @note This optimization destroys the link fields of nodes.
 151  */
 152 void optimize_funccalls(int force_run, check_alloc_entity_func callback);
 153
 154 /**
 155  * Does Partial Redundancy Elimination combined with
 156  * Global Value Numbering.
 157  * Can be used to replace place_code() completely.
 158  *
 159  * Based on VanDrunen and Hosking 2004.
 160  *
 161  * @param irg  the graph
 162  *
 163  * @note
 164  * Currently completely broken because the used sets do NOT
 165  * preserve the topological sort of their elements.
 166  */
 167 void do_gvn_pre(ir_graph *irg);
 168
 169 /**
 170  * This function is called to evaluate whether a mux can be built
 171  * on the current architecture.
 172  * If it returns non-zero, a mux is created, else the code
 173  * is not modified.
 174  * @param sel        A selector of a Cond.
 175  * @param phi_list   List of Phi nodes about to be converted (linked via link field)
 176  * @param i          First data predecessor involved in if conversion
 177  * @param j          Second data predecessor involved in if conversion
 178  */
 179 typedef int (*arch_allow_ifconv_func)(ir_node *sel, ir_node* phi_list, int i, int j);
 180
 181 /**
 182  * The parameters structure for the if conversion, see opt_if_conv().
 183  */
 184 struct ir_settings_if_conv_t {
 185         int                 max_depth;       /**< The maximum depth up to which expressions
 186                                                are examined when it has to be decided if they
 187                                                can be placed into another block. */
 188         arch_allow_ifconv_func allow_ifconv; /**< Evaluator function, if not set all possible Psi
 189                                                nodes will be created. */
 190 };
 191
 192 /**
 193  * Perform If conversion on a graph.
 194  *
 195  * @param irg     The graph.
 196  * @param params  The parameters for the if conversion.
 197  *
 198  * Cannot handle blocks with Bad control predecessors, so call it after control
 199  * flow optimization.
 200  */
 201 void opt_if_conv(ir_graph *irg, const ir_settings_if_conv_t *params);
 202
 203 void opt_ldst2(ir_graph *irg); /* NOTE(review): undocumented in this header; presumably an alternative Load/Store optimization -- confirm against the implementation. */
 204
 205 /**
 206  * Load/Store optimization.
 207  *
 208  * Removes redundant non-volatile Loads and Stores.
 209  * May introduce Bad nodes if exceptional control flow
 210  * is removed. The following cases are optimized:
 211  *
 212  * Load without result: A Load which has only a memory use
 213  *   is removed.
 214  *
 215  * Load after Store: A Load after a Store is removed if
 216  *   the Load doesn't have an exception handler OR is in
 217  *   the same block as the Store.
 218  *
 219  * Load after Load: A Load after a Load is removed if the
 220  *   Load doesn't have an exception handler OR is in the
 221  *   same block as the previous Load.
 222  *
 223  * Store before Store: A Store immediately before another
 224  *   Store in the same block is removed if the Store doesn't
 225  *   have an exception handler.
 226  *
 227  * Store after Load: A Store after a Load is removed if the
 228  *   Store doesn't have an exception handler.
 229  */
 230 void optimize_load_store(ir_graph *irg);
 231
 232 /**
 233  * Performs loop unrolling on the given graph.
 234  */
 235 void optimize_loop_unrolling(ir_graph *irg);
 236
 237 /**
 238  * Optimize the frame type of an irg by removing
 239  * never touched entities.
 240  *
 241  * @param irg  The graph whose frame type will be optimized
 242  *
 243  * This function does not change the graph, only its frame type.
 244  * The layout state of the frame type will be set to layout_undefined
 245  * if entities were removed.
 246  */
 247 void opt_frame_irg(ir_graph *irg);
 248
 249 /** Possible flags for the Operator Strength Reduction. */
 250 typedef enum osr_flags {
 251         osr_flag_none               = 0,  /**< no additional flags */
 252         osr_flag_lftr_with_ov_check = 1,  /**< do linear function test replacement
 253                                                only if no overflow can occur. */
 254         osr_flag_ignore_x86_shift   = 2,  /**< ignore Multiplications by 2, 4, 8 */
 255         osr_flag_keep_reg_pressure  = 4   /**< do NOT increase register pressure by introducing new
 256                                                induction variables. */
 257 } osr_flags;
 258
 259 /* FirmJNI cannot handle identical enum values, hence the default is a macro and not an enumerator. */
 260
 261 /** default setting */
 262 #define osr_flag_default osr_flag_lftr_with_ov_check
 263
 264 /**
 265  * Do the Operator Strength Reduction optimization and linear
 266  * function test replacement for loop control.
 267  * Can be switched off using the set_opt_strength_red() flag.
 268  * In that case, only remove_phi_cycles() is executed.
 269  *
 270  * @param irg    the graph which should be optimized
 271  * @param flags  set of osr_flags
 272  *
 273  * The linear function test replacement is controlled by the flags.
 274  * If the osr_flag_lftr_with_ov_check is set, the replacement is only
 275  * done if no overflow can occur.
 276  * Otherwise it is ALWAYS done which might be insecure.
 277  *
 278  * For instance:
 279  *
 280  * for (i = 0; i < 100; ++i)
 281  *
 282  * might be replaced by
 283  *
 284  * for (i = 0; i < 400; i += 4)
 285  *
 286  * But
 287  *
 288  * for (i = 0; i < 0x7FFFFFFF; ++i)
 289  *
 290  * will not be replaced by
 291  *
 292  * for (i = 0; i < 0xFFFFFFFC; i += 4)
 293  *
 294  * because of overflow.
 295  *
 296  * More bad cases:
 297  *
 298  * for (i = 0; i <= 0xF; ++i)
 299  *
 300  * will NOT be transformed into
 301  *
 302  * for (i = 0xFFFFFFF0; i <= 0xFFFFFFFF; ++i)
 303  *
 304  * although there is no direct overflow. The OV occurs when the ++i
 305  * is executed (and would create an endless loop here!).
 306  *
 307  * For the same reason, a loop
 308  *
 309  * for (i = 0; i <= 9; i += x)
 310  *
 311  * will NOT be transformed because we cannot estimate whether an overflow
 312  * might happen adding x.
 313  *
 314  * Note that i < a + 400 is also not possible with the current implementation
 315  * although this might be allowed by other compilers...
 316  *
 317  * Note further that tests for equality can be handled more simply (but are not
 318  * implemented yet).
 319  *
 320  * This algorithm destroys the link field of nodes.
 321  */
 322 void opt_osr(ir_graph *irg, unsigned flags);
 323
 324 /**
 325  * Removes useless Phi cycles, i.e. cycles of Phi nodes with only one
 326  * non-Phi node.
 327  * This is automatically done in opt_osr(), so there is no need to call it
 328  * additionally.
 329  *
 330  * @param irg    the graph which should be optimized
 331  *
 332  * This algorithm destroys the link field of nodes.
 333  */
 334 void remove_phi_cycles(ir_graph *irg);
 335
 336 /** A default cloning threshold, see proc_cloning(). */
 337 #define DEFAULT_CLONE_THRESHOLD 300
 338
 339 /**
 340  * Do procedure cloning. Evaluate a heuristic weight for every
 341  * Call(..., Const, ...). If the weight is bigger than the threshold,
 342  * clone the entity and fix the calls.
 343  *
 344  * @param threshold   the threshold for cloning
 345  *
 346  * The threshold is an estimation of how many instructions are saved
 347  * when executing a cloned method. If threshold is 0.0, every possible
 348  * call is cloned.
 349  */
 350 void proc_cloning(float threshold);
 351
 352 /**
 353  * Reassociation.
 354  *
 355  * Applies Reassociation rules to integer expressions.
 356  * Beware: Works only if integer overflow might be ignored, as for C, Java
 357  * and for address expressions.
 358  * Works only if Constant folding is activated.
 359  *
 360  * Uses loop information to detect loop-invariant (i.e. constant
 361  * inside the loop) values.
 362  *
 363  * See Muchnick 12.3.1 Algebraic Simplification and Reassociation of
 364  * Addressing Expressions.
 365  *
 366  *
 367  * @param irg  the graph
 368  */
 368 void optimize_reassociation(ir_graph *irg);
 369
 370 /**
 371  * Normalize the Returns of a graph by creating a new End block
 372  * with one Return(Phi).
 373  * This is the preferred input for the if-conversion.
 374  *
 375  * In pseudocode, it means:
 376  *
 377  * if (a)
 378  *   return b;
 379  * else
 380  *   return c;
 381  *
 382  * is transformed into
 383  *
 384  * if (a)
 385  *   res = b;
 386  * else
 387  *   res = c;
 388  * return res;
 389  */
 390 void normalize_one_return(ir_graph *irg);
 391
 392 /**
 393  * Normalize the Returns of a graph by moving
 394  * the Returns upwards as far as possible.
 395  * This might be preferred for code generation.
 396  *
 397  * In pseudocode, it means:
 398  *
 399  * if (a)
 400  *   res = b;
 401  * else
 402  *   res = c;
 403  * return res;
 404  *
 405  * is transformed into
 406  *
 407  * if (a)
 408  *   return b;
 409  * else
 410  *   return c;
 411  */
 412 void normalize_n_returns(ir_graph *irg);
 413
 414 /**
 415  * Performs the scalar replacement optimization.
 416  * Replaces local compound entities (like structures and arrays)
 417  * with atomic values if possible. Does not handle classes yet.
 418  *
 419  * @param irg  the graph which should be optimized
 420  */
 421 void scalar_replacement_opt(ir_graph *irg);
 422
 423 /** Performs strength reduction on the given graph. */
 424 void reduce_strength(ir_graph *irg);
 425
 426 /**
 427  * Optimizes simple tail-recursion calls by
 428  * converting them into loops. Depends on the flag opt_tail_recursion.
 429  *
 430  * Does not work for Calls that use exception handling.
 431  *
 432  * @param irg   the graph to be optimized
 433  *
 434  * @return non-zero if the optimization could be applied, 0 otherwise
 435  */
 436 int opt_tail_rec_irg(ir_graph *irg);
 437
 438 /**
 439  * Optimize tail-recursion calls for all IR-Graphs.
 440  * Depends on the flag opt_tail_recursion.
 441  */
 442 void opt_tail_recursion(void);
 443
 444 /** This is the type of a function that returns a pointer type to
 445  *  tp.  This is needed in the normalization. */
 446 typedef ir_type *(*gen_pointer_type_to_func)(ir_type *tp);
 447
 448 /**  Insert Casts so that class type casts conform exactly with the type hierarchy.
 449  *
 450  *  Formulated in Java, this achieves the following:
 451  *
 452  *  For a class hierarchy
 453  *    class A {}
 454  *    class B extends A {}
 455  *    class C extends B {}
 456  *  we transform a cast
 457  *    (A)new C()
 458  *  to
 459  *    (A)((B)new C()).
 460  *
 461  *  The algorithm works for Casts with class types, but also for Casts
 462  *  with all pointer types that point (over several indirections,
 463  *  i.e. ***A) to a class type.  Normalizes all graphs.  Computes type
 464  *  information (@see irtypeinfo.h) if not available.
 465  *  Invalidates trout information as new casts are generated.
 466  *
 467  *  @param gppt_fct A function that returns a pointer type that points
 468  *    to the type given as argument.  If this parameter is NULL, a default
 469  *    function is used that either uses trout information or performs an O(n)
 470  *    search to find an existing pointer type.  If it cannot find a type,
 471  *    generates a pointer type with mode_P_mach and suffix "cc_ptr_tp".
 472  */
 473 void normalize_irp_class_casts(gen_pointer_type_to_func gppt_fct);
 474
 475
 476 /**  Insert Casts so that class type casts conform exactly with the type hierarchy
 477  *   in the given graph.
 478  *
 479  *   For more details see normalize_irp_class_casts().
 480  *
 481  *  This transformation requires that type information is computed. @see irtypeinfo.h.
 482  */
 483 void normalize_irg_class_casts(ir_graph *irg, gen_pointer_type_to_func gppt_fct);
 484
 485
 486 /** Optimize casting between class types.
 487  *
 488  *    class A { m(); }
 489  *    class B extends A { }
 490  *    class C extends B {}
 491  *  Performs the following transformations:
 492  *    C c = (C)(B)(A)(B)new C()  --> C c = (C)(B)new C() --> C c = new C()
 493  *    (Optimizing downcasts as A a = (A)(B)(new A()) --> A a = new A() can
 494  *     be suppressed by setting the flag opt_suppress_downcast_optimization.
 495  *     Downcasting A to B might cause an exception.  It is not clear
 496  *     whether this is modeled by the Firm Cast node, as it has no exception
 497  *     outputs.)
 498  *  If there is inh_m() that overwrites m() in B:
 499  *    ((A) new B()).m()  --> (new B()).inh_m()
 500  *  Phi((A)x, (A)y)  --> (A) Phi (x, y)  if (A) is an upcast.
 501  *
 502  *  Computes type information if not available. @see irtypeinfo.h.
 503  *  Type information is valid after optimization.
 504  *  Invalidates trout information.
 505  */
 506 void optimize_class_casts(void);
 507
 508 #endif