2 * Copyright (C) 1995-2007 University of Karlsruhe. All rights reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief Available Optimisations of libFirm.
23 * @version $Id: cfopt.h 13543 2007-04-29 19:29:02Z beck $
25 #ifndef FIRM_IROPTIMIZE_H
26 #define FIRM_IROPTIMIZE_H
28 #include "firm_types.h"
31 * Control flow optimization.
33 * Removes empty blocks doing if simplifications and loop simplifications.
34 * A block is empty if it contains only a Jmp node and Phi nodes.
35 * Merges single entry single exit blocks with their predecessor
36 * and propagates dead control flow by calling equivalent_node().
37 * Independent of compiler flag it removes Tuples from cf edges,
38 * Bad predecessors from Blocks and Phis, and unnecessary predecessors of End.
40 * @bug So far destroys backedge information.
41 * @bug Chokes on Id nodes if called in a certain order with other
42 * optimizations. Call local_optimize_graph() before to remove
45 void optimize_cf(ir_graph *irg);
48 * Perform partial conditional evaluation on the given graph.
50 * @param irg the graph
52 void opt_cond_eval(ir_graph* irg);
55 * Try to reduce the number of conv nodes in the given ir graph.
57 * @param irg the graph
59 void conv_opt(ir_graph *irg);
62 * Do the scalar replacement optimization.
63 * Perform a data flow analysis and split the
66 * @param irg the graph which should be optimized
68 void data_flow_scalar_replacement_opt(ir_graph *irg);
71 * A callback that checks whether an entity is an allocation
74 typedef int (*check_alloc_entity_func)(ir_entity *ent);
77 * Do simple and fast escape analysis for one graph.
79 * @param irg the graph
80 * @param callback a callback function to check whether a
81 * given entity is an allocation call
83 void escape_enalysis_irg(ir_graph *irg, check_alloc_entity_func callback);
86 * Do simple and fast escape analysis for all graphs.
88 * This optimization implements a simple and fast but inexact
89 * escape analysis. Some addresses might be marked as 'escaped' even
91 * The advantage is a low memory footprint and fast speed.
93 * @param run_scalar_replace if this flag is non-zero, scalar
94 * replacement optimization is run on graphs with removed
96 * @param callback a callback function to check whether a
97 * given entity is an allocation call
99 * This optimization removes allocations which are not used (rare) and replaces
100 * allocations that can be proved dead at the end of the graph with stack variables.
102 * The creation of stack variables allows scalar replacement to be run only
103 * on those graphs that have been changed.
105 * This is most effective on Java where no other stack variables exist.
107 void escape_analysis(int run_scalar_replace, check_alloc_entity_func callback);
110 * Optimize function calls by handling const functions.
112 * This optimization first detects all "const functions", i.e.,
113 * IR graphs that neither read nor write memory (and hence do
114 * not create exceptions, as these use memory in Firm).
116 * The result of calls to such functions depends only on its
117 * arguments, hence those calls are no longer pinned.
119 * This is a rather strong criterion, so do not expect that a
120 * lot of functions will be found. Moreover, all of them might
121 * already be inlined if inlining is activated.
122 * Anyway, it might be good for handling builtins or pseudo-graphs,
123 * even if the latter read/write memory (but we know how).
125 * This optimization reads the irg_const_function property of
126 * entities and sets the irg_const_function property of
129 * If callee information is valid, we also optimize polymorphic Calls.
131 * @param force_run if non-zero, an optimization run is started even
132 * if no const function graph was detected.
133 * Else calls are only optimized if at least one
134 * const function graph was detected.
136 * If the frontend created external entities with the irg_const_function
137 * property set, the force_run parameter should be set, else
140 * @note This optimization destroys the link fields of nodes.
142 void optimize_funccalls(int force_run);
145 * Does Partial Redundancy Elimination combined with
146 * Global Value Numbering.
147 * Can be used to replace place_code() completely.
149 * Based on VanDrunen and Hosking 2004.
151 * @param irg the graph
154 * Currently completely broken because the used sets do NOT
155 * preserve the topological sort of their elements.
157 void do_gvn_pre(ir_graph *irg);
160 * This function is called to evaluate whether a mux can be built
161 * on the current architecture.
162 * If it returns non-zero, a mux is created, else the code
164 * @param sel A selector of a Cond.
165 * @param phi_list List of Phi nodes about to be converted (linked via link field)
166 * @param i First data predecessor involved in if conversion
167 * @param j Second data predecessor involved in if conversion
169 typedef int (*arch_allow_ifconv_func)(ir_node *sel, ir_node* phi_list, int i, int j);
172 * The parameters structure.
174 typedef struct _opt_if_conv_info_t {
175 int max_depth; /**< The maximum depth up to which expressions
176 are examined when deciding whether they
177 can be placed into another block. */
178 arch_allow_ifconv_func allow_ifconv; /**< Evaluator callback; if it is not set, all possible Psi
179 nodes will be created. */
180 } opt_if_conv_info_t;
183 * Perform If conversion on a graph.
185 * @param irg The graph.
186 * @param params The parameters for the if conversion.
188 * Cannot handle blocks with Bad control predecessors, so call it after control
191 void opt_if_conv(ir_graph *irg, const opt_if_conv_info_t *params);
193 void opt_ldst2(ir_graph *irg);
196 * Load/Store optimization.
198 * Removes redundant non-volatile Loads and Stores.
199 * May introduce Bad nodes if exceptional control flow
200 * is removed. The following cases are optimized:
202 * Load without result: A Load which has only a memory use
205 * Load after Store: A Load after a Store is removed, if
206 * the Load doesn't have an exception handler OR is in
207 * the same block as the Store.
209 * Load after Load: A Load after a Load is removed, if the
210 * Load doesn't have an exception handler OR is in the
211 * same block as the previous Load.
213 * Store before Store: A Store immediately before another
214 * Store in the same block is removed, if the Store doesn't
215 * have an exception handler.
217 * Store after Load: A Store after a Load is removed, if the
218 * Store doesn't have an exception handler.
220 void optimize_load_store(ir_graph *irg);
223 * Do Loop unrolling in the given graph.
225 void optimize_loop_unrolling(ir_graph *irg);
228 * Optimize the frame type of an irg by removing
229 * never touched entities.
231 * @param irg The graph whose frame type will be optimized
233 * This function does not change the graph, only its frame type.
234 * The layout state of the frame type will be set to layout_undefined
235 * if entities were removed.
237 void opt_frame_irg(ir_graph *irg);
239 /** Possible flags for the Operator Strength Reduction. */
240 typedef enum osr_flags {
241 osr_flag_none = 0, /**< no additional flags */
242 osr_flag_lftr_with_ov_check = 1, /**< do linear function test replacement
243 only if no overflow can occur. */
244 osr_flag_ignore_x86_shift = 2 /**< ignore Multiplications by 2, 4, 8 */
247 /* FirmJNI cannot handle identical enum values... */
249 /** default setting */
250 #define osr_flag_default osr_flag_lftr_with_ov_check
253 * Do the Operator Strength Reduction optimization and linear
254 * function test replacement for loop control.
255 * Can be switched off using the set_opt_strength_red() flag.
256 * In that case, only remove_phi_cycles() is executed.
258 * @param irg the graph which should be optimized
259 * @param flags set of osr_flags
261 * The linear function replacement test is controlled by the flags.
262 * If the osr_flag_lftr_with_ov_check is set, the replacement is only
263 * done if no overflow can occur.
264 * Otherwise it is ALWAYS done which might be insecure.
268 * for (i = 0; i < 100; ++i)
270 * might be replaced by
272 * for (i = 0; i < 400; i += 4)
276 * for (i = 0; i < 0x7FFFFFFF; ++i)
278 * will not be replaced by
280 * for (i = 0; i < 0xFFFFFFFC; i += 4)
282 * because of overflow.
286 * for (i = 0; i <= 0xF; ++i)
288 * will NOT be transformed into
290 * for (i = 0xFFFFFFF0; i <= 0xFFFFFFFF; ++i)
292 * although there is no direct overflow. The overflow occurs when the ++i
293 * is executed (and would create an endless loop here!).
295 * For the same reason, a loop
297 * for (i = 0; i <= 9; i += x)
299 * will NOT be transformed because we cannot estimate whether an overflow
300 * might happen adding x.
302 * Note that i < a + 400 is also not possible with the current implementation
303 * although this might be allowed by other compilers...
305 * Note further that tests for equality can be handled somewhat more simply (but are not
308 * This algorithm destroys the link field of nodes.
310 void opt_osr(ir_graph *irg, unsigned flags);
313 * Removes useless Phi cycles, i.e. cycles of Phi nodes with only one
315 * This is automatically done in opt_osr(), so there is no need to call it
318 * @param irg the graph which should be optimized
320 * This algorithm destroys the link field of nodes.
322 void remove_phi_cycles(ir_graph *irg);
324 /** A default threshold. */
325 #define DEFAULT_CLONE_THRESHOLD 300
328 * Do procedure cloning. Evaluate a heuristic weight for every
329 * Call(..., Const, ...). If the weight is bigger than threshold,
330 * clone the entity and fix the calls.
332 * @param threshold the threshold for cloning
334 * The threshold is an estimation of how many instructions are saved
335 * when executing a cloned method. If threshold is 0.0, every possible
338 void proc_cloning(float threshold);
343 * Applies Reassociation rules to integer expressions.
344 * Beware: Works only if integer overflow might be ignored, as for C, Java
345 * and for address expressions.
346 * Works only if Constant folding is activated.
348 * Uses loop information to detect loop-invariant (i.e. constant
349 * inside the loop) values.
351 * See Muchnick 12.3.1 Algebraic Simplification and Reassociation of
352 * Addressing Expressions.
356 void optimize_reassociation(ir_graph *irg);
359 * Normalize the Returns of a graph by creating a new End block
360 * with One Return(Phi).
361 * This is the preferred input for the if-conversion.
363 * In pseudocode, it means:
370 * is transformed into
378 void normalize_one_return(ir_graph *irg);
381 * Normalize the Returns of a graph by moving
382 * the Returns upwards as much as possible.
383 * This might be preferred for code generation.
385 * In pseudocode, it means:
393 * is transformed into
400 void normalize_n_returns(ir_graph *irg);
403 * Do the scalar replacement optimization.
404 * Replace local compound entities (like structures and arrays)
405 * with atomic values if possible. Does not handle classes yet.
407 * @param irg the graph which should be optimized
409 void scalar_replacement_opt(ir_graph *irg);
411 /** Performs strength reduction for the passed graph. */
412 void reduce_strength(ir_graph *irg);
415 * Optimizes simple tail-recursion calls by
416 * converting them into loops. Depends on the flag opt_tail_recursion.
418 * Does not work for Calls that use the exception stuff.
420 * @param irg the graph to be optimized
422 * @return non-zero if the optimization could be applied, 0 else
424 int opt_tail_rec_irg(ir_graph *irg);
427 * Optimize tail-recursion calls for all IR-Graphs.
428 * Depends on the flag opt_tail_recursion.
430 void opt_tail_recursion(void);
432 /** This is the type for a method, that returns a pointer type to
433 * tp. This is needed in the normalization. */
434 typedef ir_type *(*gen_pointer_type_to_func)(ir_type *tp);
436 /** Insert Casts so that class type casts conform exactly with the type hierarchy.
438 * Formulated in Java, this achieves the following:
440 * For a class hierarchy
442 * class B extends A {}
443 * class C extends B {}
444 * we transform a cast
449 * The algorithm works for Casts with class types, but also for Casts
450 * with all pointer types that point (over several indirections,
451 * i.e. ***A) to a class type. Normalizes all graphs. Computes type
452 * information (@see irtypeinfo.h) if not available.
453 * Invalidates trout information as new casts are generated.
455 * @param gppt_fct A function that returns a pointer type that points
456 * to the type given as argument. If this parameter is NULL, a default
457 * function is used that either uses trout information or performs an O(n)
458 * search to find an existing pointer type. If it can not find a type,
459 * generates a pointer type with mode_P_mach and suffix "cc_ptr_tp".
461 void normalize_irp_class_casts(gen_pointer_type_to_func gppt_fct);
464 /** Insert Casts so that class type casts conform exactly with the type hierarchy
467 * For more details see normalize_irp_class_casts().
469 * This transformation requires that type information is computed. @see irtypeinfo.h.
471 void normalize_irg_class_casts(ir_graph *irg, gen_pointer_type_to_func gppt_fct);
474 /** Optimize casting between class types.
477 * class B extends A { }
478 * class C extends B {}
479 * Performs the following transformations:
480 * C c = (C)(B)(A)(B)new C() --> C c = (C)(B)new C() --> C c = new C()
481 * (Optimizing downcasts as A a = (A)(B)(new A()) --> A a = new A() can
482 * be suppressed by setting the flag opt_suppress_downcast_optimization.
483 * Downcasting A to B might cause an exception. It is not clear
484 * whether this is modeled by the Firm Cast node, as it has no exception
486 * If there is inh_m() that overwrites m() in B:
487 * ((A) new B()).m() --> (new B()).inh_m()
488 * Phi((A)x, (A)y) --> (A) Phi (x, y) if (A) is an upcast.
490 * Computes type information if not available. @see irtypeinfo.h.
491 * Type information is valid after optimization.
492 * Invalidates trout information.
494 void optimize_class_casts(void);
497 * Change the calling conventions for all local methods.
499 * @param cc new calling convention
501 void opt_change_calling_conventions(unsigned cc);