nsz Git - libfirm/blob - include/libfirm/iroptimize.h

   1 /*
   2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
   3  *
   4  * This file is part of libFirm.
   5  *
   6  * This file may be distributed and/or modified under the terms of the
   7  * GNU General Public License version 2 as published by the Free Software
   8  * Foundation and appearing in the file LICENSE.GPL included in the
   9  * packaging of this file.
  10  *
  11  * Licensees holding valid libFirm Professional Edition licenses may use
  12  * this file in accordance with the libFirm Commercial License.
  13  * Agreement provided with the Software.
  14  *
  15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  17  * PURPOSE.
  18  */
  19
  20 /**
  21  * @file
  22  * @brief   Available Optimisations of libFirm.
  23  * @version $Id$
  24  */
  25 #ifndef FIRM_IROPTIMIZE_H
  26 #define FIRM_IROPTIMIZE_H
  27
  28 #include "firm_types.h"
  29 #include "begin.h"
  30
  31 /**
  32  * Control flow optimization.
  33  *
  34  * Removes empty blocks doing if simplifications and loop simplifications.
  35  * A block is empty if it contains only a Jmp node and Phi nodes.
  36  * Merges single entry single exit blocks with their predecessor
  37  * and propagates dead control flow by calling equivalent_node().
  38  * Independent of compiler flag it removes Tuples from cf edges,
  39  * Bad predecessors from Blocks and Phis, and unnecessary predecessors of End.
  40  * Destroys backedge information.
  41  *
  42  * @bug Chokes on Id nodes if called in a certain order with other
  43  *      optimizations.  Call local_optimize_graph() before to remove
  44  *      Ids.
  45  */
  46 FIRM_API void optimize_cf(ir_graph *irg);
  47
  48 /**
  49  * Creates an ir_graph pass for optimize_cf().
  50  *
  51  * @param name     the name of this pass or NULL
  52  *
  53  * @return  the newly created ir_graph pass
  54  */
  55 FIRM_API ir_graph_pass_t *optimize_cf_pass(const char *name);
  56
  57 /**
  58  * Perform path-sensitive jump threading on the given graph.
  59  *
  60  * @param irg  the graph
  61  */
  62 FIRM_API void opt_jumpthreading(ir_graph* irg);
  63
  64 /**
  65  * Creates an ir_graph pass for opt_jumpthreading().
  66  *
  67  * @param name     the name of this pass or NULL
  68  *
  69  * @return  the newly created ir_graph pass
  70  */
  71 FIRM_API ir_graph_pass_t *opt_jumpthreading_pass(const char *name);
  72
  73 /**
  74  * Creates an ir_graph pass for opt_loopunroll().
  75  *
  76  * @param name     the name of this pass or NULL
  77  *
  78  * @return  the newly created ir_graph pass
  79  */
  80 FIRM_API ir_graph_pass_t *opt_loopunroll_pass(const char *name);
  81
  82
  83 /**
  84  * Try to simplify boolean expression in the given ir graph.
  85  * eg. x < 5 && x < 6 becomes x < 5
  86  *
  87  * @param irg  the graph
  88  */
  89 FIRM_API void opt_bool(ir_graph *irg);
  90
  91 /**
  92  * Creates an ir_graph pass for opt_bool().
  93  *
  94  * @param name     the name of this pass or NULL
  95  *
  96  * @return  the newly created ir_graph pass
  97  */
  98 FIRM_API ir_graph_pass_t *opt_bool_pass(const char *name);
  99
 100 /**
 101  * Try to reduce the number of conv nodes in the given ir graph.
 102  *
 103  * @param irg  the graph
 104  *
 105  * @return non-zero if the optimization could be applied, 0 else
 106  */
 107 FIRM_API int conv_opt(ir_graph *irg);
 108
 109 /**
 110  * Creates an ir_graph pass for conv_opt().
 111  *
 112  * @param name     the name of this pass or NULL
 113  *
 114  * @return  the newly created ir_graph pass
 115  */
 116 FIRM_API ir_graph_pass_t *conv_opt_pass(const char *name);
 117
 118 /**
 119  * Do the scalar replacement optimization.
 120  * Performs a data flow analysis and splits the
 121  * data flow edges.
 122  *
 123  * @param irg  the graph which should be optimized
 124  */
 125 FIRM_API void data_flow_scalar_replacement_opt(ir_graph *irg);
 126
 127 /**
 128  * A callback that checks whether an entity is an allocation
 129  * routine.
 130  */
 131 typedef int (*check_alloc_entity_func)(ir_entity *ent);
 132
 133 /**
 134  * Do simple and fast escape analysis for one graph.
 135  *
 136  * @param irg       the graph
 137  * @param callback  a callback function to check whether a
 138  *                  given entity is an allocation call
 139  */
 140 FIRM_API void escape_enalysis_irg(ir_graph *irg,
 141                                   check_alloc_entity_func callback);
 142
 143 /**
 144  * Do simple and fast escape analysis for all graphs.
 145  *
 146  * This optimization implements a simple and fast but inexact
 147  * escape analysis. Some addresses might be marked as 'escaped' even
 148  * if they are not.
 149  * The advantage is a low memory footprint and fast speed.
 150  *
 151  * @param run_scalar_replace  if this flag is non-zero, scalar
 152  *                            replacement optimization is run on graphs with removed
 153  *                            allocation
 154  * @param callback            a callback function to check whether a
 155  *                            given entity is an allocation call
 156  *
 157  * This optimization removes allocations which are not used (rare) and replaces
 158  * allocations that can be proved dead at the end of the graph with stack variables.
 159  *
 160  * The creation of stack variables allows scalar replacement to be run only
 161  * on those graphs that have been changed.
 162  *
 163  * This is most effective on Java where no other stack variables exist.
 164  */
 165 FIRM_API void escape_analysis(int run_scalar_replace,
 166                               check_alloc_entity_func callback);
 167
 168 /**
 169  * Optimize function calls by handling const functions.
 170  *
 171  * This optimization first detects all "const functions", i.e.,
 172  * IR graphs that neither read nor write memory (and hence do
 173  * not create exceptions, as these use memory in Firm).
 174  *
 175  * The result of a call to such a function depends only on its
 176  * arguments, hence those calls are no longer pinned.
 177  *
 178  * This is a rather strong criterion, so do not expect that a
 179  * lot of functions will be found. Moreover, all of them might
 180  * already be inlined if inlining is activated.
 181  * Anyway, it might be good for handling builtins
 182  * even if the latter read/write memory (but we know how).
 183  *
 184  * This optimization reads the irg_const_function property of
 185  * entities and sets the irg_const_function property of
 186  * graphs.
 187  *
 188  * If callee information is valid, we also optimize polymorphic Calls.
 189  *
 190  * @param force_run  if non-zero, an optimization run is started even
 191  *                   if no const function graph was detected.
 192  *                   Else calls are only optimized if at least one
 193  *                   const function graph was detected.
 194  * @param callback   a callback function to check whether a
 195  *                   given entity is an allocation call
 196  *
 197  * If the frontend created external entities with the irg_const_function
 198  * property set, the force_run parameter should be set, else
 199  * it should be unset.
 200  *
 201  * @note This optimization destroys the link fields of nodes.
 202  */
 203 FIRM_API void optimize_funccalls(int force_run,
 204                                  check_alloc_entity_func callback);
 205
 206 /**
 207  * Creates an ir_prog pass for optimize_funccalls().
 208  *
 209  * @param name       the name of this pass or NULL
 210  * @param force_run  if non-zero, an optimization run is started even
 211  *                   if no const function graph was detected.
 212  *                   Else calls are only optimized if at least one
 213  *                   const function graph was detected.
 214  * @param callback   a callback function to check whether a
 215  *                   given entity is an allocation call
 216  *
 217  * @return  the newly created ir_prog pass
 218  */
 219 FIRM_API ir_prog_pass_t *optimize_funccalls_pass(const char *name,
 220                                                  int force_run,
 221                                                  check_alloc_entity_func callback);
 222
 223 /**
 224  * Does Partial Redundancy Elimination combined with
 225  * Global Value Numbering.
 226  * Can be used to replace place_code() completely.
 227  *
 228  * Based on VanDrunen and Hosking 2004.
 229  *
 230  * @param irg  the graph
 231  */
 232 FIRM_API void do_gvn_pre(ir_graph *irg);
 233
 234 /**
 235  * Creates an ir_graph pass for do_gvn_pre().
 236  *
 237  * @param name     the name of this pass or NULL
 238  *
 239  * @return  the newly created ir_graph pass
 240  */
 241 FIRM_API ir_graph_pass_t *do_gvn_pre_pass(const char *name);
 242
 243 /**
 244  * This function is called to evaluate whether a
 245  * mux(@p sel, @p mux_false, @p mux_true) should be built for the current
 246  * architecture.
 247  * If it returns non-zero, a mux is created, else the code
 248  * is not modified.
 249  * @param sel        A selector of a Cond.
 250  * @param mux_false  The mux_false operand of the prospective mux.
 251  * @param mux_true   The mux_true operand of the prospective mux.
 252  * @return non-zero to have the mux created; otherwise the code is left unmodified
 253  */
 254 typedef int (*arch_allow_ifconv_func)(ir_node *sel, ir_node *mux_false,
 255                                       ir_node *mux_true);
 256
 257 /**
 258  * Perform If conversion on a graph.
 259  *
 260  * @param irg The graph.
 261  *
 262  * Cannot handle blocks with Bad control predecessors, so call it after control
 263  * flow optimization.
 264  */
 265 FIRM_API void opt_if_conv(ir_graph *irg);
 266
 267 /**
 268  * Creates an ir_graph pass for opt_if_conv().
 269  *
 270  * @param name     the name of this pass or NULL
 271  *
 272  * @return  the newly created ir_graph pass
 273  */
 274 FIRM_API ir_graph_pass_t *opt_if_conv_pass(const char *name);
 275
 276 /**
 277  * Tries to reduce dependencies for memory nodes where possible by parallelizing
 278  * them and synchronising with Sync nodes.
 279  * @param irg   the graph where memory operations should be parallelised
 280  */
 281 FIRM_API void opt_parallelize_mem(ir_graph *irg);
 282
 283 /**
 284  * Creates an ir_graph pass for opt_parallelize_mem().
 285  *
 286  * @param name     the name of this pass or NULL
 287  *
 288  * @return  the newly created ir_graph pass
 289  */
 290 FIRM_API ir_graph_pass_t *opt_parallelize_mem_pass(const char *name);
 291
 292 /**
 293  * Check if we can replace the load by a given const from
 294  * the const code irg.
 295  *
 296  * @param load   the load to replace
 297  * @param c      the constant
 298  *
 299  * @return if the modes match or can be transformed using a reinterpret cast
 300  *         returns a copy of the constant (possibly Conv'ed) on the
 301  *         current_ir_graph
 302  */
 303 FIRM_API ir_node *can_replace_load_by_const(const ir_node *load, ir_node *c);
 304
 305 /**
 306  * Load/Store optimization.
 307  *
 308  * Removes redundant non-volatile Loads and Stores.
 309  * May introduce Bad nodes if exceptional control flow
 310  * is removed. The following cases are optimized:
 311  *
 312  * Load without result: A Load which has only a memory use
 313  *   is removed.
 314  *
 315  * Load after Store: A Load after a Store is removed, if
 316  *   the Load doesn't have an exception handler OR is in
 317  *   the same block as the Store.
 318  *
 319  * Load after Load: A Load after a Load is removed, if the
 320  *   Load doesn't have an exception handler OR is in the
 321  *   same block as the previous Load.
 322  *
 323  * Store before Store: A Store immediately before another
 324  *   Store in the same block is removed, if the Store doesn't
 325  *   have an exception handler.
 326  *
 327  * Store after Load: A Store after a Load is removed, if the
 328  *   Store doesn't have an exception handler.
 329  *
 330  * @return non-zero if the optimization could be applied, 0 else
 331  */
 332 FIRM_API int optimize_load_store(ir_graph *irg);
 333
 334 /**
 335  * Creates an ir_graph pass for optimize_load_store().
 336  *
 337  * @param name     the name of this pass or NULL
 338  *
 339  * @return  the newly created ir_graph pass
 340  */
 341 FIRM_API ir_graph_pass_t *optimize_load_store_pass(const char *name);
 342
 343 /**
 344  * New experimental alternative to optimize_load_store.
 345  * Based on a dataflow analysis, so load/stores are moved out of loops
 346  * where possible
 347  */
 348 FIRM_API int opt_ldst(ir_graph *irg);
 349
 350 /**
 351  * Creates an ir_graph pass for opt_ldst().
 352  *
 353  * @param name     the name of this pass or NULL
 354  *
 355  * @return  the newly created ir_graph pass
 356  */
 357 FIRM_API ir_graph_pass_t *opt_ldst_pass(const char *name);
 358
 359 /**
 360  * Optimize loops by peeling or unrolling them if beneficial.
 361  *
 362  * @param irg  The graph whose loops will be processed
 363  *
 364  * NOTE(review): peeling or unrolling presumably modifies the graph itself,
 365  * unlike opt_frame_irg(), which only changes the frame type. The resulting
 366  * graph state is not specified here -- confirm against the implementation.
 367  */
 368 FIRM_API void loop_optimization(ir_graph *irg);
 369
 370 /**
 371  * Optimize the frame type of an irg by removing
 372  * never touched entities.
 373  *
 374  * @param irg  The graph whose frame type will be optimized
 375  *
 376  * This function does not change the graph, only its frame type.
 377  * The layout state of the frame type will be set to layout_undefined
 378  * if entities were removed.
 379  */
 380 FIRM_API void opt_frame_irg(ir_graph *irg);
 381
 382 /**
 383  * Creates an ir_graph pass for opt_frame_irg().
 384  *
 385  * @param name     the name of this pass or NULL
 386  *
 387  * @return  the newly created ir_graph pass
 388  */
 389 FIRM_API ir_graph_pass_t *opt_frame_irg_pass(const char *name);
 390
 391 /** Possible flags for the Operator Strength Reduction (OSR). */
 392 typedef enum osr_flags {
 393         osr_flag_none               = 0,  /**< no additional flags */
 394         osr_flag_lftr_with_ov_check = 1,  /**< do linear function test replacement
 395                                                only if no overflow can occur. */
 396         osr_flag_ignore_x86_shift   = 2,  /**< ignore Multiplications by 2, 4, 8 */
 397         osr_flag_keep_reg_pressure  = 4   /**< do NOT increase register pressure by introducing new
 398                                                induction variables. */
 399 } osr_flags;
 400
 401 /* FirmJNI cannot handle identical enum values... */
 402
 403 /** default setting */
 404 #define osr_flag_default osr_flag_lftr_with_ov_check
 405
 406 /**
 407  * Do the Operator Strength Reduction (OSR) optimization and linear
 408  * function test replacement for loop control.
 409  * Can be switched off using the set_opt_strength_red() flag.
 410  * In that case, only remove_phi_cycles() is executed.
 411  *
 412  * @param irg    the graph which should be optimized
 413  * @param flags  set of osr_flags
 414  *
 415  * The linear function test replacement is controlled by the flags.
 416  * If the osr_flag_lftr_with_ov_check is set, the replacement is only
 417  * done if no overflow can occur.
 418  * Otherwise it is ALWAYS done which might be unsafe.
 419  *
 420  * For instance:
 421  *
 422  * for (i = 0; i < 100; ++i)
 423  *
 424  * might be replaced by
 425  *
 426  * for (i = 0; i < 400; i += 4)
 427  *
 428  * But
 429  *
 430  * for (i = 0; i < 0x7FFFFFFF; ++i)
 431  *
 432  * will not be replaced by
 433  *
 434  * for (i = 0; i < 0xFFFFFFFC; i += 4)
 435  *
 436  * because of overflow.
 437  *
 438  * More bad cases:
 439  *
 440  * for (i = 0; i <= 0xF; ++i)
 441  *
 442  * will NOT be transformed into
 443  *
 444  * for (i = 0xFFFFFFF0; i <= 0xFFFFFFFF; ++i)
 445  *
 446  * although there is no direct overflow. The OV occurs when the ++i
 447  * is executed (and would create an endless loop here!).
 448  *
 449  * For the same reason, a loop
 450  *
 451  * for (i = 0; i <= 9; i += x)
 452  *
 453  * will NOT be transformed because we cannot estimate whether an overflow
 454  * might happen adding x.
 455  *
 456  * Note that i < a + 400 is also not possible with the current implementation
 457  * although this might be allowed by other compilers...
 458  *
 459  * Note further that tests for equality can be handled more simply (but are not
 460  * implemented yet).
 461  *
 462  * This algorithm destroys the link field of nodes.
 463  */
 464 FIRM_API void opt_osr(ir_graph *irg, unsigned flags);
 465
 466 /**
 467  * Creates an ir_graph pass for opt_osr().
 468  *
 469  * @param name     the name of this pass or NULL
 470  * @param flags    set of osr_flags
 471  *
 472  * @return  the newly created ir_graph pass
 473  */
 474 FIRM_API ir_graph_pass_t *opt_osr_pass(const char *name, unsigned flags);
 475
 476 /**
 477  * Removes useless Phi cycles, i.e cycles of Phi nodes with only one
 478  * non-Phi node.
 479  * This is automatically done in opt_osr(), so there is no need to call it
 480  * additionally.
 481  *
 482  * @param irg    the graph which should be optimized
 483  *
 484  * This algorithm destroys the link field of nodes.
 485  */
 486 FIRM_API void remove_phi_cycles(ir_graph *irg);
 487
 488 /**
 489  * Creates an ir_graph pass for remove_phi_cycles().
 490  *
 491  * @param name     the name of this pass or NULL
 492  *
 493  * @return  the newly created ir_graph pass
 494  */
 495 FIRM_API ir_graph_pass_t *remove_phi_cycles_pass(const char *name);
 496
 497
 498 /** A default threshold. */
 499 #define DEFAULT_CLONE_THRESHOLD 20
 500
 501 /**
 502  * Do procedure cloning. Evaluate a heuristic weight for every
 503  * Call(..., Const, ...). If the weight is bigger than threshold,
 504  * clone the entity and fix the calls.
 505  *
 506  * @param threshold   the threshold for cloning
 507  *
 508  * The threshold is an estimation of how many instructions are saved
 509  * when executing a cloned method. If threshold is 0.0, every possible
 510  * call is cloned.
 511  */
 512 FIRM_API void proc_cloning(float threshold);
 513
 514 /**
 515  * Creates an ir_prog pass for proc_cloning().
 516  *
 517  * @param name        the name of this pass or NULL
 518  * @param threshold   the threshold for cloning
 519  *
 520  * @return  the newly created ir_prog pass
 521  */
 522 FIRM_API ir_prog_pass_t *proc_cloning_pass(const char *name, float threshold);
 523
 524 /**
 525  * Reassociation.
 526  *
 527  * Applies Reassociation rules to integer expressions.
 528  * Beware: Works only if integer overflow might be ignored, as for C, Java
 529  * and for address expressions.
 530  * Works only if Constant folding is activated.
 531  *
 532  * Uses loop information to detect loop-invariant (i.e. constant
 533  * inside the loop) values.
 534  *
 535  * See Muchnick 12.3.1 Algebraic Simplification and Reassociation of
 536  * Addressing Expressions.
 537  *
 538  * @return non-zero if the optimization could be applied, 0 else
 539  */
 540 FIRM_API int optimize_reassociation(ir_graph *irg);
 541
 542 /**
 543  * Creates an ir_graph pass for optimize_reassociation().
 544  *
 545  * @param name     the name of this pass or NULL
 546  *
 547  * @return  the newly created ir_graph pass
 548  */
 549 FIRM_API ir_graph_pass_t *optimize_reassociation_pass(const char *name);
 550
 551 /**
 552  * Normalize the Returns of a graph by creating a new End block
 553  * with One Return(Phi).
 554  * This is the preferred input for the if-conversion.
 555  *
 556  * In pseudocode, it means:
 557  *
 558  * if (a)
 559  *   return b;
 560  * else
 561  *   return c;
 562  *
 563  * is transformed into
 564  *
 565  * if (a)
 566  *   res = b;
 567  * else
 568  *   res = c;
 569  * return res;
 570  */
 571 FIRM_API void normalize_one_return(ir_graph *irg);
 572
 573 /**
 574  * Creates an ir_graph pass for normalize_one_return().
 575  *
 576  * @param name     the name of this pass or NULL
 577  *
 578  * @return  the newly created ir_graph pass
 579  */
 580 FIRM_API ir_graph_pass_t *normalize_one_return_pass(const char *name);
 581
 582 /**
 583  * Normalize the Returns of a graph by moving
 584  * the Returns upwards as much as possible.
 585  * This might be preferred for code generation.
 586  *
 587  * In pseudocode, it means:
 588  *
 589  * if (a)
 590  *   res = b;
 591  * else
 592  *   res = c;
 593  * return res;
 594  *
 595  * is transformed into
 596  *
 597  * if (a)
 598  *   return b;
 599  * else
 600  *   return c;
 601  */
 602 FIRM_API void normalize_n_returns(ir_graph *irg);
 603
 604 /**
 605  * Creates an ir_graph pass for normalize_n_returns().
 606  *
 607  * @param name     the name of this pass or NULL
 608  *
 609  * @return  the newly created ir_graph pass
 610  */
 611 FIRM_API ir_graph_pass_t *normalize_n_returns_pass(const char *name);
 612
 613 /**
 614  * Do the scalar replacement optimization.
 615  * Replace local compound entities (like structures and arrays)
 616  * with atomic values if possible. Does not handle classes yet.
 617  *
 618  * @param irg  the graph which should be optimized
 619  *
 620  * @return non-zero, if at least one entity was replaced
 621  */
 622 FIRM_API int scalar_replacement_opt(ir_graph *irg);
 623
 624 /**
 625  * Creates an ir_graph pass for scalar_replacement_opt().
 626  *
 627  * @param name     the name of this pass or NULL
 628  *
 629  * @return  the newly created ir_graph pass
 630  */
 631 FIRM_API ir_graph_pass_t *scalar_replacement_opt_pass(const char *name);
 632
 633 /** Performs strength reduction for the passed graph. */
 634 FIRM_API void reduce_strength(ir_graph *irg);
 635
 636 /**
 637  * Optimizes tail-recursion calls by converting them into loops.
 638  * Depends on the flag opt_tail_recursion.
 639  * Currently supports the following forms:
 640  *  - return func();
 641  *  - return x + func();
 642  *  - return func() - x;
 643  *  - return x * func();
 644  *  - return -func();
 645  *
 646  * Does not work for Calls that use the exception stuff.
 647  *
 648  * @param irg   the graph to be optimized
 649  *
 650  * @return non-zero if the optimization could be applied, 0 else
 651  */
 652 FIRM_API int opt_tail_rec_irg(ir_graph *irg);
 653
 654 /**
 655  * Creates an ir_graph pass for opt_tail_rec_irg().
 656  *
 657  * @param name     the name of this pass or NULL
 658  *
 659  * @return  the newly created ir_graph pass
 660  */
 661 FIRM_API ir_graph_pass_t *opt_tail_rec_irg_pass(const char *name);
 662
 663 /**
 664  * Optimize tail-recursion calls for all IR-Graphs.
 665  * Can currently handle:
 666  * - direct return value, i.e. return func().
 667  * - additive return value, i.e. return x +/- func()
 668  * - multiplicative return value, i.e. return x * func() or return -func()
 669  *
 670  * The current implementation must be run before optimize_funccalls(),
 671  * because it expects the memory edges pointing to calls, which might be
 672  * removed by optimize_funccalls().
 673  */
 674 FIRM_API void opt_tail_recursion(void);
 675
 676 /**
 677  * Creates an ir_prog pass for opt_tail_recursion().
 678  *
 679  * @param name     the name of this pass or NULL
 680  *
 681  * @return  the newly created ir_prog pass
 682  */
 683 FIRM_API ir_prog_pass_t *opt_tail_recursion_pass(const char *name);
 684
 685 /** This is the type for a method, that returns a pointer type to
 686  *  tp.  This is needed in the normalization. */
 687 typedef ir_type *(*gen_pointer_type_to_func)(ir_type *tp);
 688
 689 /**  Insert Casts so that class type casts conform exactly with the type hierarchy.
 690  *
 691  *  Formulated in Java, this achieves the following:
 692  *
 693  *  For a class hierarchy
 694  *    class A {}
 695  *    class B extends A {}
 696  *    class C extends B {}
 697  *  we transform a cast
 698  *    (A)new C()
 699  *  to
 700  *    (A)((B)new C()).
 701  *
 702  *  The algorithm works for Casts with class types, but also for Casts
 703  *  with all pointer types that point (over several indirections,
 704  *  i.e. ***A) to a class type.  Normalizes all graphs.  Computes type
 705  *  information (@see irtypeinfo.h) if not available.
 706  *  Invalidates trout information as new casts are generated.
 707  *
 708  *  @param gppt_fct A function that returns a pointer type that points
 709  *    to the type given as argument.  If this parameter is NULL, a default
 710  *    function is used that either uses trout information or performs a O(n)
 711  *    search to find an existing pointer type.  If it can not find a type,
 712  *    generates a pointer type with mode_P_mach and suffix "cc_ptr_tp".
 713  */
 714 FIRM_API void normalize_irp_class_casts(gen_pointer_type_to_func gppt_fct);
 715
 716 /**  Insert Casts so that class type casts conform exactly with the type hierarchy
 717  *   in given graph.
 718  *
 719  *   For more details see normalize_irp_class_casts().
 720  *
 721  *  This transformation requires that type information is computed. @see irtypeinfo.h.
 722  */
 723 FIRM_API void normalize_irg_class_casts(ir_graph *irg,
 724                                         gen_pointer_type_to_func gppt_fct);
 725
 726 /** Optimize casting between class types.
 727  *
 728  *    class A { m(); }
 729  *    class B extends A { }
 730  *    class C extends B {}
 731  *  Performs the following transformations:
 732  *    C c = (C)(B)(A)(B)new C()  --> C c = (C)(B)new C() --> C c = new C()
 733  *    (Optimizing downcasts as A a = (A)(B)(new A()) --> A a = new A() can
 734  *     be suppressed by setting the flag opt_suppress_downcast_optimization.
 735  *     Downcasting A to B might cause an exception.  It is not clear
 736  *     whether this is modeled by the Firm Cast node, as it has no exception
 737  *     outputs.);
 738  *  If there is inh_m() that overwrites m() in B:
 739  *    ((A) new B()).m()  --> (new B()).inh_m()
 740  *  Phi((A)x, (A)y)  --> (A) Phi (x, y)  if (A) is an upcast.
 741  *
 742  *  Computes type information if not available. @see irtypeinfo.h.
 743  *  Type information is valid after optimization.
 744  *  Invalidates trout information.
 745  */
 746 FIRM_API void optimize_class_casts(void);
 747
 748 /**
 749  * Cliff Click's combo algorithm from
 750  *   "Combining Analyses, combining Optimizations".
 751  *
 752  * Does conditional constant propagation, unreachable code elimination and
 753  * optimistic global value numbering at once.
 754  *
 755  * @param irg  the graph to run on
 756  */
 757 FIRM_API void combo(ir_graph *irg);
 758
 759 /**
 760  * Creates an ir_graph pass for combo.
 761  *
 762  * @param name     the name of this pass or NULL
 763  *
 764  * @return  the newly created ir_graph pass
 765  */
 766 FIRM_API ir_graph_pass_t *combo_pass(const char *name);
 767
 768 /**
 769  * Inlines all small methods at call sites where the called address comes
 770  * from a SymConst node that references the entity representing the called
 771  * method.
 772  *
 773  * @param irg  the graph
 774  * @param size maximum function size
 775  *
 776  * The size argument is a rough measure for the code size of the method:
 777  * Methods where the obstack containing the firm graph is smaller than
 778  * size are inlined.  Further only a limited number of calls are inlined.
 779  * If the method contains more than 1024 inlineable calls none will be
 780  * inlined.
 781  * Inlining is only performed if flags `optimize' and `inlineing' are set.
 782  * The graph may not be in state phase_building.
 783  * It is recommended to call local_optimize_graph() after inlining as this
 784  * function leaves a set of obscure Tuple nodes, e.g. a Proj-Tuple-Jmp
 785  * combination as control flow operation.
 786  */
 787 FIRM_API void inline_small_irgs(ir_graph *irg, int size);
 788
 789 /**
 790  * Creates an ir_graph pass for inline_small_irgs().
 791  *
 792  * @param name   the name of this pass or NULL
 793  * @param size   maximum function size
 794  *
 795  * @return  the newly created ir_graph pass
 796  */
 797 FIRM_API ir_graph_pass_t *inline_small_irgs_pass(const char *name, int size);
 798
 799 /**
 800  * Inlining with a different heuristic than inline_small_irgs().
 801  *
 802  * Inlines leaf functions.  If inlining creates new leaf
 803  * functions, inlines these, too. (If g calls f, and f calls leaf h,
 804  * h is first inlined in f and then f in g.)
 805  *
 806  * Then inlines all small functions (this is not recursive).
 807  *
 808  * For a heuristic this inlining uses firm node counts.  It does
 809  * not count auxiliary nodes as Proj, Tuple, End, Start, Id, Sync.
 810  * If the ignore_runtime flag is set, calls to functions marked with the
 811  * mtp_property_runtime property are ignored.
 812  *
 813  * @param maxsize         Do not inline any calls if a method has more than
 814  *                        maxsize firm nodes.  It may reach this limit by
 815  *                        inlining.
 816  * @param leavesize       Inline leaf functions if they have less than leavesize
 817  *                        nodes.
 818  * @param size            Inline all functions smaller than size.
 819  * @param ignore_runtime  count a function only calling runtime functions as
 820  *                        leaf
 821  */
 822 FIRM_API void inline_leave_functions(unsigned maxsize, unsigned leavesize,
 823                                      unsigned size, int ignore_runtime);
 824
 825 /**
 826  * Creates an ir_prog pass for inline_leave_functions().
 827  *
 828  * @param name            the name of this pass or NULL
 829  * @param maxsize         Do not inline any calls if a method has more than
 830  *                        maxsize firm nodes.  It may reach this limit by
 831  *                        inlining.
 832  * @param leavesize       Inline leaf functions if they have less than leavesize
 833  *                        nodes.
 834  * @param size            Inline all functions smaller than size.
 835  * @param ignore_runtime  count a function only calling runtime functions as
 836  *                        leaf
 837  *
 838  * @return  the newly created ir_prog pass
 839  */
 840 FIRM_API ir_prog_pass_t *inline_leave_functions_pass(const char *name,
 841                 unsigned maxsize, unsigned leavesize, unsigned size,
 842                 int ignore_runtime);
 843
 844 typedef void (*opt_ptr)(ir_graph *irg); /**< Per-graph callback; used as the after_inline_opt argument of inline_functions(). */
 845
 846 /**
 847  * Heuristic inliner. Calculates a benefit value for every call and inlines
 848  * those calls with a value higher than the threshold.
 849  *
 850  * @param maxsize             Do not inline any calls if a method has more than
 851  *                            maxsize firm nodes.  It may reach this limit by
 852  *                            inlining.
 853  * @param inline_threshold    inlining threshold
 854  * @param after_inline_opt    optimizations performed immediately after inlining
 855  *                            some calls
 856  */
 857 FIRM_API void inline_functions(unsigned maxsize, int inline_threshold,
 858                                opt_ptr after_inline_opt);
 859
 860 /**
 861  * Creates an ir_prog pass for inline_functions().
 862  *
 863  * @param name               the name of this pass or NULL
 864  * @param maxsize            Do not inline any calls if a method has more than
 865  *                           maxsize firm nodes.  It may reach this limit by
 866  *                           inlining.
 867  * @param inline_threshold   inlining threshold
 868  * @param after_inline_opt   a function that is called after inlining a
 869  *                           procedure. You should run fast local optimisations
 870  *                           here which cleanup the graph before further
 871  *                           inlining
 872  *
 873  * @return  the newly created ir_prog pass
 874  */
 875 FIRM_API ir_prog_pass_t *inline_functions_pass(const char *name,
 876                 unsigned maxsize, int inline_threshold, opt_ptr after_inline_opt);
 877
 878 /**
 879  * Combines congruent blocks into one.
 880  *
 881  * @param irg   The IR-graph to optimize.
 882  *
 883  * @return non-zero if the graph was transformed
 884  */
 885 FIRM_API int shape_blocks(ir_graph *irg);
 886
 887 /**
 888  * Creates an ir_graph pass for shape_blocks().
 889  *
 890  * @param name   the name of this pass or NULL
 891  *
 892  * @return  the newly created ir_graph pass
 893  */
 894 FIRM_API ir_graph_pass_t *shape_blocks_pass(const char *name);
 895
 896 /**
 897  * Perform loop inversion on a given graph.
 898  * Loop inversion transforms a head controlled loop (like while(...) {} and
 899  * for(...) {}) into a foot controlled loop (do {} while(...)).
 900  */
 901 FIRM_API void do_loop_inversion(ir_graph *irg);
 902
 903 /**
 904  * Perform loop unrolling on a given graph.
 905  * Loop unrolling duplicates the complete loop body a number of times found
 906  * through a heuristic.
 907  */
 908 FIRM_API void do_loop_unrolling(ir_graph *irg);
 909
 910 /**
 911  * Perform loop peeling on a given graph.
 912  */
 913 FIRM_API void do_loop_peeling(ir_graph *irg);
 914
 915 /**
 916  * Creates an ir_graph pass for loop inversion.
 917  *
 918  * @param name     the name of this pass or NULL
 919  *
 920  * @return  the newly created ir_graph pass
 921  */
 922 FIRM_API ir_graph_pass_t *loop_inversion_pass(const char *name);
 923
 924 /**
 925  * Creates an ir_graph pass for loop unrolling.
 926  *
 927  * @param name     the name of this pass or NULL
 928  *
 929  * @return  the newly created ir_graph pass
 930  */
 931 FIRM_API ir_graph_pass_t *loop_unroll_pass(const char *name);
 932
 933 /**
 934  * Creates an ir_graph pass for loop peeling.
 935  *
 936  * @param name     the name of this pass or NULL
 937  *
 938  * @return  the newly created ir_graph pass
 939  */
 940 FIRM_API ir_graph_pass_t *loop_peeling_pass(const char *name);
 941
 942 typedef ir_type *(*get_Alloc_func)(ir_node *n);
 943 /** Sets a new get_Alloc_func and returns the old one. */
 944 FIRM_API get_Alloc_func firm_set_Alloc_func(get_Alloc_func newf);
 945
 946 /**
 947  * Creates an ir_graph pass for set_vrp_data()
 948  *
 949  * @param name The name of this pass or NULL
 950  *
 951  * @return the newly created ir_graph pass
 952  */
 953 FIRM_API ir_graph_pass_t *set_vrp_pass(const char *name);
 954
 955 /**
 956  * Removes all entities which are unused.
 957  *
 958  * Unused entities have ir_visibility_local and are not used directly or
 959  * indirectly through entities/code visible outside the compilation unit.
 960  * This is usually more conservative than gc_irgs, but does not respect properties
 961  * of object-oriented programs.
 962  */
 963 FIRM_API void garbage_collect_entities(void);
 964
 965 /** Creates an ir_prog pass for garbage_collect_entities(). */
 966 FIRM_API ir_prog_pass_t *garbage_collect_entities_pass(const char *name);
 967
 968 /**
 969  * Performs dead node elimination by copying the ir graph to a new obstack.
 970  *
 971  *  The major intention of this pass is to free memory occupied by
 972  *  dead nodes and outdated analysis information.  Further this
 973  *  function removes Bad predecessors from Blocks and the corresponding
 974  *  inputs to Phi nodes.  This opens optimization potential for other
 975  *  optimizations.  Further this phase reduces dead Block<->Jmp
 976  *  self-cycles to Bad nodes.
 977  *
 978  *  Dead_node_elimination is only performed if options `optimize' and
 979  *  `opt_dead_node_elimination' are set.  The graph may
 980  *  not be in state phase_building.  The outs data structure is freed,
 981  *  the outs state set to outs_none.  Backedge information is conserved.
 982  *  Removes old attributes of nodes.  Sets link field to NULL.
 983  *  Callee information must be freed (irg_callee_info_none).
 984  *
 985  * @param irg  The graph to be optimized.
 986  */
 987 FIRM_API void dead_node_elimination(ir_graph *irg);
 988
 989 /**
 990  * Creates an ir_graph pass for dead_node_elimination().
 991  *
 992  * @param name     the name of this pass or NULL
 993  *
 994  * @return  the newly created ir_graph pass
 995  */
 996 FIRM_API ir_graph_pass_t *dead_node_elimination_pass(const char *name);
 997
 998 /**
 999  * Inlines a method at the given call site.
1000  *
1001  *  Removes the call node and splits the basic block the call node
1002  *  belongs to.  Inserts a copy of the called graph between these nodes.
1003  *  Assumes that call is a Call node in current_ir_graph and that
1004  *  the type in the Call nodes type attribute is the same as the
1005  *  type of the called graph.
1006  *  Further it assumes that all Phi nodes in a block of current_ir_graph
1007  *  are assembled in a "link" list in the link field of the corresponding
1008  *  block nodes.  Further assumes that all Proj nodes are in a "link" list
1009  *  in the nodes producing the tuple.  (This is only an optical feature
1010  *  for the graph.)  Conserves this feature for the old
1011  *  nodes of the graph.  This precondition can be established by a call to
1012  *  collect_phiprojs(), see irgmod.h.
1013  *  Like dead_node_elimination(), this function reduces dead Block<->Jmp
1014  *  self-cycles to Bad nodes.
1015  *
1016  *  Called_graph must be unequal to current_ir_graph.   Will not inline
1017  *  if they are equal.
1018  *  Sets visited masterflag in current_ir_graph to the max of the flag in
1019  *  current and called graph.
1020  *  Assumes that both the called and the calling graph are in state
1021  *  "op_pin_state_pinned".
1022  *  It is recommended to call local_optimize_graph() after inlining as this
1023  *  function leaves a set of obscure Tuple nodes, e.g. a Proj-Tuple-Jmp
1024  *  combination as control flow operation.
1025  *
1026  *  @param call          the call node that should be inlined
1027  *  @param called_graph  the IR-graph that is called at call
1028  *
1029  *  @return zero if method could not be inlined (recursion for instance),
1030  *          non-zero if all went ok
1031  */
1032 FIRM_API int inline_method(ir_node *call, ir_graph *called_graph);
1033
1034 /**
1035  * Code Placement.
1036  *
1037  * Pins all floating nodes to a block where they
1038  * will be executed only if needed.   Depends on the flag opt_global_cse.
1039  * Graph may not be in phase_building.  Does not schedule control dead
1040  * code.  Uses dominator information which it computes if the irg is not
1041  * in state dom_consistent.  Destroys the out information as it moves nodes
1042  * to other blocks.  Optimizes Tuples in Control edges.
1043  *
1044  * Call remove_critical_cf_edges() before place_code().  This normalizes
1045  * the control flow graph so that for all operations a basic block exists
1046  * where they can be optimally placed.
1047  */
1048 FIRM_API void place_code(ir_graph *irg);
1049
1050 /**
1051  * Creates an ir_graph pass for place_code().
1052  * This pass enables GCSE, runs optimize_graph_df() and finally
1053  * place_code().
1054  *
1055  * @param name     the name of this pass or NULL
1056  *
1057  * @return  the newly created ir_graph pass
1058  */
1059 FIRM_API ir_graph_pass_t *place_code_pass(const char *name);
1060
1061 /**
1062  * Determine information about the values of nodes and perform simplifications
1063  * using this information; a data-flow analysis finds the minimal fixpoint.
1064  * @param irg  The graph to be optimized.
1065  */
1066 FIRM_API void fixpoint_vrp(ir_graph *irg);
1067
1068 /**
1069  * Creates an ir_graph pass for fixpoint_vrp().
1070  * This pass determines information about the values of nodes
1071  * and performs simplifications using this information.
1072  * This optimization performs a data-flow analysis to
1073  * find the minimal fixpoint.
1074  *
1075  * @param name     the name of this pass or NULL
1076  *
1077  * @return  the newly created ir_graph pass
1078  */
1079 FIRM_API ir_graph_pass_t *fixpoint_vrp_irg_pass(const char *name);
1080
1081 #include "end.h"
1082
1083 #endif