/*
- * Copyright (C) 1995-2007 University of Karlsruhe. All right reserved.
+ * Copyright (C) 1995-2008 University of Karlsruhe. All rights reserved.
*
* This file is part of libFirm.
*
#include "irbackedge_t.h"
#include "cgana.h"
#include "trouts.h"
-
+#include "error.h"
#include "irflag_t.h"
#include "irhooks.h"
/* Applies local optimizations to all nodes in the graph until fixpoint. */
void optimize_graph_df(ir_graph *irg) {
pdeq *waitq = new_pdeq();
- int state = edges_activated(irg);
ir_graph *rem = current_ir_graph;
ir_node *end;
- int i;
+ int i, state, n_ka;
current_ir_graph = irg;
- if (! state)
- edges_activate(irg);
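+ /* make sure edges are activated, remembering the previous state so it can be restored later */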
+ state = edges_assure(irg);
if (get_opt_global_cse())
set_irg_pinned(current_ir_graph, op_pin_state_floats);
set_using_irn_link(irg);
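+ /* remember the End node and the current number of keep-alives before the walk (see the comment below) */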
+ end = get_irg_end(irg);
+ n_ka = get_End_n_keepalives(end);
+
/* walk over the graph, but don't touch keep-alives */
irg_walk(get_irg_end_block(irg), NULL, opt_walker, waitq);
- end = get_irg_end(irg);
-
- /* optimize keep-alives by removing superfluous ones */
- for (i = get_End_n_keepalives(end) - 1; i >= 0; --i) {
+ /*
+ * Optimize keep-alives by removing superfluous ones.
+ * Beware: the last transformation might add new keep-alives
+ * that keep blocks that were visited! So, check only the
+ * "old" keep-alives, not the new ones!
+ *
+ * FIXME: it might be better to completely remove this
+ * optimization here ...
+ */
+ for (i = n_ka - 1; i >= 0; --i) {
ir_node *ka = get_End_keepalive(end, i);
if (irn_visited(ka) && !is_irn_keep(ka)) {
/* compute the number of good predecessors */
res = irn_arity = get_irn_arity(b);
for (i = 0; i < irn_arity; i++)
- if (get_irn_opcode(get_irn_n(b, i)) == iro_Bad) res--;
+ if (is_Bad(get_irn_n(b, i))) res--;
/* save it in the flag. */
set_Block_block_visited(b, irg_v + res);
return res;
ir_node *nn, *block;
int new_arity;
ir_op *op = get_irn_op(n);
+ (void) env;
/* The End node loses its flexible "in" array. This doesn't matter,
as dead node elimination builds End by hand; inlining doesn't use
get_irn_mode(n),
new_arity,
get_irn_in(n) + 1);
- /* Copy the attributes. These might point to additional data. If this
- was allocated on the old obstack the pointers now are dangling. This
- frees e.g. the memory of the graph_arr allocated in new_immBlock. */
+ /* Copy the attributes. These might point to additional data. If this
+ was allocated on the old obstack the pointers now are dangling. This
+ frees e.g. the memory of the graph_arr allocated in new_immBlock. */
+ if (op == op_Block) {
+ /* we cannot allow blocks WITHOUT macroblock input */
+ set_Block_MacroBlock(nn, get_Block_MacroBlock(n));
+ }
copy_node_attr(n, nn);
#ifdef DEBUG_libfirm
nn = get_new_node(n);
if (is_Block(n)) {
+ /* copy the macro block header */
+ ir_node *mbh = get_Block_MacroBlock(n);
+
+ if (mbh == n) {
+ /* this block is a macroblock header */
+ set_Block_MacroBlock(nn, nn);
+ } else {
+ /* get the macro block header */
+ ir_node *nmbh = get_new_node(mbh);
+ assert(nmbh != NULL);
+ set_Block_MacroBlock(nn, nmbh);
+ }
+
/* Don't copy Bad nodes. */
j = 0;
irn_arity = get_irn_arity(n);
for (i = 0; i < irn_arity; i++) {
if (! is_Bad(get_irn_n(n, i))) {
- set_irn_n (nn, j, get_new_node(get_irn_n(n, i)));
+ set_irn_n(nn, j, get_new_node(get_irn_n(n, i)));
/*if (is_backedge(n, i)) set_backedge(nn, j);*/
j++;
}
that the fields in ir_graph are set properly. */
if ((get_opt_control_flow_straightening()) &&
(get_Block_n_cfgpreds(nn) == 1) &&
- (get_irn_op(get_Block_cfgpred(nn, 0)) == op_Jmp)) {
+ is_Jmp(get_Block_cfgpred(nn, 0))) {
ir_node *old = get_nodes_block(get_Block_cfgpred(nn, 0));
if (nn == old) {
/* Jmp jumps into the block it is in -- handle the self cycle. */
exchange(nn, old);
}
}
- } else if (get_irn_op(n) == op_Phi) {
+ } else if (is_Phi(n) && get_irn_arity(n) > 0) {
/* Don't copy node if corresponding predecessor in block is Bad.
The Block itself should not be Bad. */
block = get_nodes_block(n);
- set_irn_n(nn, -1, get_new_node(block));
+ set_nodes_block(nn, get_new_node(block));
j = 0;
irn_arity = get_irn_arity(n);
for (i = 0; i < irn_arity; i++) {
} else {
irn_arity = get_irn_arity(n);
for (i = -1; i < irn_arity; i++)
- set_irn_n (nn, i, get_new_node(get_irn_n(n, i)));
+ set_irn_n(nn, i, get_new_node(get_irn_n(n, i)));
}
/* Now the new node is complete. We can add it to the hash table for CSE.
@@@ inlining aborts if we identify End. Why? */
- if (get_irn_op(nn) != op_End)
+ if (!is_End(nn))
add_identities(current_ir_graph->value_table, nn);
}
irg->anchor = new_anchor;
/* ensure the new anchor is placed in the endblock */
- set_irn_n(new_anchor, -1, get_irg_end_block(irg));
+ set_nodes_block(new_anchor, get_irg_end_block(irg));
}
/**
* Adds all new nodes to a new hash table for CSE. Does not
* perform CSE, so the hash table might contain common subexpressions.
*/
-void
-dead_node_elimination(ir_graph *irg) {
- if (get_opt_optimize() && get_opt_dead_node_elimination()) {
- ir_graph *rem;
- int rem_ipview = get_interprocedural_view();
- struct obstack *graveyard_obst = NULL;
- struct obstack *rebirth_obst = NULL;
- assert(! edges_activated(irg) && "dead node elimination requires disabled edges");
-
- /* inform statistics that we started a dead-node elimination run */
- hook_dead_node_elim(irg, 1);
-
- /* Remember external state of current_ir_graph. */
- rem = current_ir_graph;
- current_ir_graph = irg;
- set_interprocedural_view(0);
+void dead_node_elimination(ir_graph *irg) {
+ ir_graph *rem;
+#ifdef INTERPROCEDURAL_VIEW
+ int rem_ipview = get_interprocedural_view();
+#endif
+ struct obstack *graveyard_obst = NULL;
+ struct obstack *rebirth_obst = NULL;
+ assert(! edges_activated(irg) && "dead node elimination requires disabled edges");
- assert(get_irg_phase_state(irg) != phase_building);
+ /* inform statistics that we started a dead-node elimination run */
+ hook_dead_node_elim(irg, 1);
- /* Handle graph state */
- free_callee_info(irg);
- free_irg_outs(irg);
- free_trouts();
+ /* Remember external state of current_ir_graph. */
+ rem = current_ir_graph;
+ current_ir_graph = irg;
+#ifdef INTERPROCEDURAL_VIEW
+ set_interprocedural_view(0);
+#endif
- /* @@@ so far we loose loops when copying */
- free_loop_information(irg);
+ assert(get_irg_phase_state(irg) != phase_building);
- set_irg_doms_inconsistent(irg);
+ /* Handle graph state */
+ free_callee_info(irg);
+ free_irg_outs(irg);
+ free_trouts();
- /* A quiet place, where the old obstack can rest in peace,
- until it will be cremated. */
- graveyard_obst = irg->obst;
+ /* @@@ so far we lose loops when copying */
+ free_loop_information(irg);
- /* A new obstack, where the reachable nodes will be copied to. */
- rebirth_obst = xmalloc(sizeof(*rebirth_obst));
- irg->obst = rebirth_obst;
- obstack_init(irg->obst);
- irg->last_node_idx = 0;
+ set_irg_doms_inconsistent(irg);
- /* We also need a new value table for CSE */
- del_identities(irg->value_table);
- irg->value_table = new_identities();
+ /* A quiet place, where the old obstack can rest in peace,
+ until it is cremated. */
+ graveyard_obst = irg->obst;
- /* Copy the graph from the old to the new obstack */
- copy_graph_env(/*copy_node_nr=*/1);
+ /* A new obstack, where the reachable nodes will be copied to. */
+ rebirth_obst = xmalloc(sizeof(*rebirth_obst));
+ irg->obst = rebirth_obst;
+ obstack_init(irg->obst);
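+ /* restart node index allocation for the nodes copied onto the new obstack */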
+ irg->last_node_idx = 0;
- /* Free memory from old unoptimized obstack */
- obstack_free(graveyard_obst, 0); /* First empty the obstack ... */
- xfree (graveyard_obst); /* ... then free it. */
+ /* We also need a new value table for CSE */
+ del_identities(irg->value_table);
+ irg->value_table = new_identities();
- /* inform statistics that the run is over */
- hook_dead_node_elim(irg, 0);
+ /* Copy the graph from the old to the new obstack */
+ copy_graph_env(/*copy_node_nr=*/1);
- current_ir_graph = rem;
- set_interprocedural_view(rem_ipview);
- }
+ /* Free memory from old unoptimized obstack */
+ obstack_free(graveyard_obst, 0); /* First empty the obstack ... */
+ xfree(graveyard_obst); /* ... then free it. */
+
+ /* inform statistics that the run is over */
+ hook_dead_node_elim(irg, 0);
+
+ current_ir_graph = rem;
+#ifdef INTERPROCEDURAL_VIEW
+ set_interprocedural_view(rem_ipview);
+#endif
}
/**
/* if the link field of the block is NULL, look for bad predecessors;
otherwise this has already been done */
- if (get_irn_op(n) == op_Block &&
- get_irn_link(n) == NULL) {
-
+ if (is_Block(n) && get_irn_link(n) == NULL) {
/* save old predecessors in link field (position 0 is the block operand)*/
set_irn_link(n, get_irn_in(n));
int i, old_irn_arity, new_irn_arity;
/* relink bad predecessors of a block */
- if (get_irn_op(n) == op_Block)
+ if (is_Block(n))
relink_bad_block_predecessors(n, env);
/* If n is a Phi node, relink its block and its predecessors */
- if (get_irn_op(n) == op_Phi) {
-
+ if (is_Phi(n)) {
/* Relink predecessors of phi's block */
block = get_nodes_block(n);
if (get_irn_link(block) == NULL)
}
ARR_SETLEN(ir_node *, n->in, new_irn_arity);
- ARR_SETLEN(int, n->attr.phi_backedge, new_irn_arity);
+ ARR_SETLEN(int, n->attr.phi.u.backedge, new_irn_arity);
}
} /* n is a Phi node */
}
* changes).
*/
void remove_bad_predecessors(ir_graph *irg) {
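+ /* currently disabled: the walk below must not run until the backedge handling is fixed */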
+ panic("Fix backedge handling first");
irg_walk_graph(irg, firm_clear_link, relink_bad_predecessors, NULL);
}
ir_type *frame_tp = (ir_type *)env;
copy_node(n, NULL);
- if (get_irn_op(n) == op_Sel) {
+ if (is_Sel(n)) {
nn = get_new_node (n);
assert(is_Sel(nn));
if (get_entity_owner(get_Sel_entity(n)) == frame_tp) {
set_Sel_entity(nn, get_entity_link(get_Sel_entity(n)));
}
- } else if (get_irn_op(n) == op_Block) {
+ } else if (is_Block(n)) {
nn = get_new_node (n);
nn->attr.block.irg = current_ir_graph;
}
*/
static void find_addr(ir_node *node, void *env) {
int *allow_inline = env;
- if (is_Proj(node) && get_irn_op(get_Proj_pred(node)) == op_Start) {
- if (get_Proj_proj(node) == pn_Start_P_value_arg_base)
- *allow_inline = 0;
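+ /* access to the value argument base ties the method to its own frame, so do not inline it */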
+ if (is_Proj(node) &&
+ is_Start(get_Proj_pred(node)) &&
+ get_Proj_proj(node) == pn_Start_P_value_arg_base) {
+ *allow_inline = 0;
}
}
}
enum exc_mode {
- exc_handler = 0, /**< There is a handler. */
- exc_to_end = 1, /**< Branches to End. */
- exc_no_handler = 2 /**< Exception handling not represented. */
+ exc_handler = 0, /**< There is a handler. */
+ exc_to_end = 1, /**< Branches to End. */
+ exc_no_handler = 2 /**< Exception handling not represented. */
};
/* Inlines a method at the given call site. */
ir_node **res_pred;
ir_node **cf_pred;
ir_node *ret, *phi;
- int arity, n_ret, n_exc, n_res, i, j, rem_opt, irn_arity;
+ int arity, n_ret, n_exc, n_res, i, n, j, rem_opt, irn_arity;
enum exc_mode exc_handling;
- ir_type *called_frame;
+ ir_type *called_frame, *curr_frame;
irg_inline_property prop = get_irg_inline_property(called_graph);
+ ir_entity *ent;
+
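+ /* a graph marked as forbidden is never inlined, regardless of any optimization flags */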
+ if (prop == irg_inline_forbidden)
+ return 0;
- if ( (prop < irg_inline_forced) &&
- (!get_opt_optimize() || !get_opt_inline() || (prop == irg_inline_forbidden))) return 0;
+ ent = get_irg_entity(called_graph);
/* Do not inline variadic functions. */
- if (get_method_variadicity(get_entity_type(get_irg_entity(called_graph))) == variadicity_variadic)
+ if (get_method_variadicity(get_entity_type(ent)) == variadicity_variadic)
return 0;
- assert(get_method_n_params(get_entity_type(get_irg_entity(called_graph))) ==
+ assert(get_method_n_params(get_entity_type(ent)) ==
get_method_n_params(get_Call_type(call)));
+ /*
+ * We cannot inline a recursive call. The graph must be copied before
+ * the call to inline_method() using create_irg_copy().
+ */
+ if (called_graph == current_ir_graph)
+ return 0;
+
/*
* currently, we cannot inline two cases:
* - call with compound arguments
/* -- Check preconditions -- */
assert(is_Call(call));
- /* @@@ does not work for InterfaceIII.java after cgana
- assert(get_Call_type(call) == get_entity_type(get_irg_entity(called_graph)));
- assert(smaller_type(get_entity_type(get_irg_entity(called_graph)),
- get_Call_type(call)));
- */
- if (called_graph == current_ir_graph) {
- set_optimize(rem_opt);
- return 0;
- }
/* here we know we WILL inline, so inform the statistics */
hook_inline(call, called_graph);
/* -- Replicate local entities of the called_graph -- */
/* copy the entities. */
called_frame = get_irg_frame_type(called_graph);
- for (i = 0; i < get_class_n_members(called_frame); i++) {
+ curr_frame = get_irg_frame_type(current_ir_graph);
+ for (i = 0, n = get_class_n_members(called_frame); i < n; ++i) {
ir_entity *new_ent, *old_ent;
old_ent = get_class_member(called_frame, i);
- new_ent = copy_entity_own(old_ent, get_cur_frame_type());
+ new_ent = copy_entity_own(old_ent, curr_frame);
set_entity_link(old_ent, new_ent);
}
n_ret = 0;
for (i = 0; i < arity; i++) {
ret = get_irn_n(end_bl, i);
- if (get_irn_op(ret) == op_Return) {
+ if (is_Return(ret)) {
cf_pred[n_ret] = get_Return_res(ret, j);
n_ret++;
}
res_pred[j] = phi;
/* Conserve Phi-list for further inlinings -- but might be optimized */
if (get_nodes_block(phi) == post_bl) {
- set_irn_link(phi, get_irn_link(post_bl));
- set_irn_link(post_bl, phi);
+ set_Phi_next(phi, get_Block_phis(post_bl));
+ set_Block_phis(post_bl, phi);
}
}
set_Tuple_pred(call, pn_Call_T_result, new_Tuple(n_res, res_pred));
} else {
set_Tuple_pred(call, pn_Call_T_result, new_Bad());
}
+ /* handle the regular call */
+ set_Tuple_pred(call, pn_Call_X_regular, new_Jmp());
/* For now, we cannot inline calls with value_base */
set_Tuple_pred(call, pn_Call_P_value_res_base, new_Bad());
ir_node *ret, *irn;
ret = get_irn_n(end_bl, i);
irn = skip_Proj(ret);
- if (is_fragile_op(irn) || (get_irn_op(irn) == op_Raise)) {
+ if (is_fragile_op(irn) || is_Raise(irn)) {
cf_pred[n_exc] = ret;
++n_exc;
}
/* We rely on all cfops having the memory output at the same position. */
cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_block(ret), ret, mode_M, 0);
n_exc++;
- } else if (get_irn_op(ret) == op_Raise) {
+ } else if (is_Raise(ret)) {
cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_block(ret), ret, mode_M, 1);
n_exc++;
}
set_Tuple_pred(call, pn_Call_X_except, new_Bad());
set_Tuple_pred(call, pn_Call_M_except, new_Bad());
}
- set_Tuple_pred(call, pn_Call_X_regular, new_Bad());
} else {
ir_node *main_end_bl;
int main_end_bl_arity;
ir_node *ret = get_irn_n(end_bl, i);
ir_node *irn = skip_Proj(ret);
- if (is_fragile_op(irn) || (get_irn_op(irn) == op_Raise)) {
+ if (is_fragile_op(irn) || is_Raise(irn)) {
cf_pred[n_exc] = ret;
n_exc++;
}
for (i = 0; i < n_exc; ++i)
end_preds[main_end_bl_arity + i] = cf_pred[i];
set_irn_in(main_end_bl, n_exc + main_end_bl_arity, end_preds);
- set_Tuple_pred(call, pn_Call_X_regular, new_Bad());
set_Tuple_pred(call, pn_Call_X_except, new_Bad());
set_Tuple_pred(call, pn_Call_M_except, new_Bad());
free(end_preds);
ir_node *call; /**< the Call */
ir_graph *callee; /**< the callee called here */
call_entry *next; /**< for linking the next one */
+ unsigned weight; /**< the weight of the call */
};
/**
/**
* Returns the irg called from a Call node. If the irg is not
* known, NULL is returned.
+ *
+ * @param call the call node
*/
static ir_graph *get_call_called_irg(ir_node *call) {
ir_node *addr;
- ir_graph *called_irg = NULL;
addr = get_Call_ptr(call);
- if (is_SymConst(addr) && get_SymConst_kind(addr) == symconst_addr_ent) {
- called_irg = get_entity_irg(get_SymConst_entity(addr));
+ if (is_SymConst_addr_ent(addr)) {
+ ir_entity *ent = get_SymConst_entity(addr);
+ return get_entity_irg(ent);
}
- return called_irg;
+ return NULL;
}
/**
static void collect_calls(ir_node *call, void *env) {
if (is_Call(call)) {
ir_graph *called_irg = get_call_called_irg(call);
- if (called_irg) {
+
+ if (called_irg != NULL) {
/* The Call node calls a locally defined method. Remember to inline. */
inline_env_t *ienv = env;
call_entry *entry = obstack_alloc(&ienv->obst, sizeof(*entry));
entry->call = call;
entry->callee = called_irg;
entry->next = NULL;
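+ /* the weight is only initialized here; presumably a later heuristic fills it in */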
+ entry->weight = 0;
if (ienv->tail == NULL)
ienv->head = entry;
call_entry *entry;
DEBUG_ONLY(firm_dbg_module_t *dbg;)
- if (!(get_opt_optimize() && get_opt_inline())) return;
-
FIRM_DBG_REGISTER(dbg, "firm.opt.inline");
current_ir_graph = irg;
typedef struct walker_env {
struct obstack *obst; /**< the obstack for allocations. */
inline_irg_env *x; /**< the inline environment */
- int ignore_runtime; /**< the ignore runtime flag */
+ char ignore_runtime; /**< the ignore runtime flag */
+ char ignore_callers; /**< if set, do not update callers data */
} wenv_t;
/**
static void collect_calls2(ir_node *call, void *ctx) {
wenv_t *env = ctx;
inline_irg_env *x = env->x;
- ir_op *op = get_irn_op(call);
+ ir_opcode code = get_irn_opcode(call);
ir_graph *callee;
call_entry *entry;
/* count meaningful nodes in irg */
- if (op != op_Proj && op != op_Tuple && op != op_Sync) {
+ if (code != iro_Proj && code != iro_Tuple && code != iro_Sync) {
++x->n_nodes;
++x->n_nodes_orig;
}
- if (op != op_Call) return;
+ if (code != iro_Call) return;
/* check whether it's a runtime call */
if (env->ignore_runtime) {
ir_node *symc = get_Call_ptr(call);
- if (is_SymConst(symc) && get_SymConst_kind(symc) == symconst_addr_ent) {
+ if (is_SymConst_addr_ent(symc)) {
ir_entity *ent = get_SymConst_entity(symc);
if (get_entity_additional_properties(ent) & mtp_property_runtime)
++x->n_call_nodes_orig;
callee = get_call_called_irg(call);
- if (callee) {
- inline_irg_env *callee_env = get_irg_link(callee);
- /* count all static callers */
- ++callee_env->n_callers;
- ++callee_env->n_callers_orig;
+ if (callee != NULL) {
+ if (! env->ignore_callers) {
+ inline_irg_env *callee_env = get_irg_link(callee);
+ /* count all static callers */
+ ++callee_env->n_callers;
+ ++callee_env->n_callers_orig;
+ }
/* link it in the list of possible inlinable entries */
entry = obstack_alloc(env->obst, sizeof(*entry));
}
/**
- * Returns TRUE if the number of callers in 0 in the irg's environment,
+ * Returns TRUE if the number of callers is 0 in the irg's environment,
* hence this irg is a leave.
*/
INLINE static int is_leave(ir_graph *irg) {
}
/**
- * Returns TRUE if the number of callers is smaller size in the irg's environment.
+ * Returns TRUE if the number of nodes in the callee is
+ * smaller than size in the irg's environment.
*/
INLINE static int is_smaller(ir_graph *callee, int size) {
inline_irg_env *env = get_irg_link(callee);
call_entry *entry, *tail;
const call_entry *centry;
struct obstack obst;
+ pmap *copied_graphs;
+ pmap_entry *pm_entry;
DEBUG_ONLY(firm_dbg_module_t *dbg;)
- if (!(get_opt_optimize() && get_opt_inline())) return;
-
FIRM_DBG_REGISTER(dbg, "firm.opt.inline");
rem = current_ir_graph;
obstack_init(&obst);
+ /* a map for the copied graphs, used to inline recursive calls */
+ copied_graphs = pmap_create();
+
/* extend all irgs by a temporary data structure for inlining. */
n_irgs = get_irp_n_irgs();
for (i = 0; i < n_irgs; ++i)
/* Precompute information in temporary data structure. */
wenv.obst = &obst;
wenv.ignore_runtime = ignore_runtime;
+ wenv.ignore_callers = 0;
for (i = 0; i < n_irgs; ++i) {
ir_graph *irg = get_irp_irg(i);
call = entry->call;
callee = entry->callee;
- if (is_leave(callee) && is_smaller(callee, leavesize)) {
+ if (is_leave(callee) && (
+ is_smaller(callee, leavesize) || (get_irg_inline_property(callee) >= irg_inline_forced))) {
if (!phiproj_computed) {
phiproj_computed = 1;
collect_phiprojs(current_ir_graph);
did_inline = inline_method(call, callee);
if (did_inline) {
- /* Do some statistics */
inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
+ /* was inlined, must be recomputed */
+ phiproj_computed = 0;
+
+ /* Do some statistics */
env->got_inline = 1;
--env->n_call_nodes;
env->n_nodes += callee_env->n_nodes;
/* note that the list of possible calls is updated during the process */
tail = NULL;
for (entry = env->call_head; entry != NULL; entry = entry->next) {
- ir_graph *callee;
+ ir_graph *callee;
+ pmap_entry *e;
call = entry->call;
callee = entry->callee;
+ e = pmap_find(copied_graphs, callee);
+ if (e != NULL) {
+ /*
+ * Remap callee if we have a copy.
+ * FIXME: Should we do this only for recursive Calls ?
+ */
+ callee = e->value;
+ }
+
if (((is_smaller(callee, size) && (env->n_nodes < maxsize)) || /* small function */
(get_irg_inline_property(callee) >= irg_inline_forced))) {
- if (!phiproj_computed) {
+ if (current_ir_graph == callee) {
+ /*
+ * Recursive call: we cannot directly inline because we cannot walk
+ * the graph and change it. So we have to make a copy of the graph
+ * first.
+ */
+
+ inline_irg_env *callee_env;
+ ir_graph *copy;
+
+ /*
+ * No copy yet, create one.
+ * Note that recursive methods are never leaves, so it is sufficient
+ * to test this condition here.
+ */
+ copy = create_irg_copy(callee);
+
+ /* create_irg_copy() destroys the Proj links, recompute them */
+ phiproj_computed = 0;
+
+ /* allocate new environment */
+ callee_env = alloc_inline_irg_env(&obst);
+ set_irg_link(copy, callee_env);
+
+ wenv.x = callee_env;
+ wenv.ignore_callers = 1;
+ irg_walk_graph(copy, NULL, collect_calls2, &wenv);
+
+ /*
+ * Enter the entity of the original graph. This is needed
+ * for inline_method(). However, note that ent->irg still points
+ * to callee, NOT to copy.
+ */
+ set_irg_entity(copy, get_irg_entity(callee));
+
+ pmap_insert(copied_graphs, callee, copy);
+ callee = copy;
+
+ /* we have only one caller: the original graph */
+ callee_env->n_callers = 1;
+ callee_env->n_callers_orig = 1;
+ }
+ if (! phiproj_computed) {
phiproj_computed = 1;
collect_phiprojs(current_ir_graph);
}
- if (inline_method(call, callee)) {
+ did_inline = inline_method(call, callee);
+ if (did_inline) {
inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
+ /* was inlined, must be recomputed */
+ phiproj_computed = 0;
+
/* callee was inlined. Append its call list. */
env->got_inline = 1;
--env->n_call_nodes;
optimize_graph_df(irg);
optimize_cf(irg);
}
- if (env->got_inline || (env->n_callers_orig != env->n_callers))
+ if (env->got_inline || (env->n_callers_orig != env->n_callers)) {
DB((dbg, SET_LEVEL_1, "Nodes:%3d ->%3d, calls:%3d ->%3d, callers:%3d ->%3d, -- %s\n",
env->n_nodes_orig, env->n_nodes, env->n_call_nodes_orig, env->n_call_nodes,
env->n_callers_orig, env->n_callers,
get_entity_name(get_irg_entity(irg))));
+ }
}
+ /* kill the copied graphs: we don't need them anymore */
+ foreach_pmap(copied_graphs, pm_entry) {
+ ir_graph *copy = pm_entry->value;
+
+ /* reset the entity, otherwise it will be deleted in the next step ... */
+ set_irg_entity(copy, NULL);
+ free_ir_graph(copy);
+ }
+ pmap_destroy(copied_graphs);
+
obstack_free(&obst, NULL);
current_ir_graph = rem;
}
/* Place floating nodes. */
if (get_irn_pinned(n) == op_pin_state_floats) {
- ir_node *curr_block = get_irn_n(n, -1);
+ ir_node *curr_block = get_nodes_block(n);
int in_dead_block = is_Block_unreachable(curr_block);
int depth = 0;
ir_node *b = NULL; /* The block to place this node in */
*/
if (! in_dead_block) {
if (get_irn_pinned(pred) == op_pin_state_floats &&
- is_Block_unreachable(get_irn_n(pred, -1)))
+ is_Block_unreachable(get_nodes_block(pred)))
set_nodes_block(pred, curr_block);
}
place_floats_early(pred, worklist);
/* Because all loops contain at least one op_pin_state_pinned node, now all
our inputs are either op_pin_state_pinned or place_early() has already
been finished on them. We do not have any unfinished inputs! */
- pred_block = get_irn_n(pred, -1);
+ pred_block = get_nodes_block(pred);
if ((!is_Block_dead(pred_block)) &&
(get_Block_dom_depth(pred_block) > depth)) {
b = pred_block;
depth = get_Block_dom_depth(pred_block);
}
/* Avoid placing the node in the Start block */
- if ((depth == 1) && (get_Block_dom_depth(get_irn_n(n, -1)) > 1)
- && get_irg_phase_state(current_ir_graph) != phase_backend) {
+ if (depth == 1 &&
+ get_Block_dom_depth(get_nodes_block(n)) > 1 &&
+ get_irg_phase_state(current_ir_graph) != phase_backend) {
b = get_Block_cfg_out(get_irg_start_block(current_ir_graph), 0);
assert(b != get_irg_start_block(current_ir_graph));
depth = 2;
*/
irn_arity = get_irn_arity(n);
- if (get_irn_op(n) == op_End) {
+ if (is_End(n)) {
/*
* Simplest case: End node. Predecessors are keep-alives,
* no need to move out of dead block.
}
} else if (is_Phi(n)) {
ir_node *pred;
- ir_node *curr_block = get_irn_n(n, -1);
+ ir_node *curr_block = get_nodes_block(n);
int in_dead_block = is_Block_unreachable(curr_block);
/*
* Phi nodes: move nodes from dead blocks into the effective use
* of the Phi-input if the Phi is not in a bad block.
*/
- pred = get_irn_n(n, -1);
+ pred = get_nodes_block(n);
if (irn_not_visited(pred))
waitq_put(worklist, pred);
if (irn_not_visited(pred)) {
if (! in_dead_block &&
get_irn_pinned(pred) == op_pin_state_floats &&
- is_Block_unreachable(get_irn_n(pred, -1))) {
+ is_Block_unreachable(get_nodes_block(pred))) {
set_nodes_block(pred, get_Block_cfgpred_block(curr_block, i));
}
waitq_put(worklist, pred);
}
} else {
ir_node *pred;
- ir_node *curr_block = get_irn_n(n, -1);
+ ir_node *curr_block = get_nodes_block(n);
int in_dead_block = is_Block_unreachable(curr_block);
/*
* All other nodes: move nodes from dead blocks into the same block.
*/
- pred = get_irn_n(n, -1);
+ pred = get_nodes_block(n);
if (irn_not_visited(pred))
waitq_put(worklist, pred);
if (irn_not_visited(pred)) {
if (! in_dead_block &&
get_irn_pinned(pred) == op_pin_state_floats &&
- is_Block_unreachable(get_irn_n(pred, -1))) {
+ is_Block_unreachable(get_nodes_block(pred))) {
set_nodes_block(pred, curr_block);
}
waitq_put(worklist, pred);
* I.e., DCA is the block where we might place PRODUCER.
* A data flow edge points from producer to consumer.
*/
-static ir_node *
-consumer_dom_dca(ir_node *dca, ir_node *consumer, ir_node *producer) {
- ir_node *block = NULL;
-
- /* Compute the latest block into which we can place a node so that it is
+static ir_node *consumer_dom_dca(ir_node *dca, ir_node *consumer, ir_node *producer)
+{
+ /* Compute the last block into which we can place a node so that it is
before consumer. */
- if (get_irn_op(consumer) == op_Phi) {
+ if (is_Phi(consumer)) {
/* our consumer is a Phi-node, the effective use is in all those
blocks through which the Phi-node reaches producer */
- int i, irn_arity;
ir_node *phi_block = get_nodes_block(consumer);
- irn_arity = get_irn_arity(consumer);
+ int arity = get_irn_arity(consumer);
+ int i;
- for (i = 0; i < irn_arity; i++) {
- if (get_irn_n(consumer, i) == producer) {
- ir_node *new_block = get_nodes_block(get_Block_cfgpred(phi_block, i));
+ for (i = 0; i < arity; i++) {
+ if (get_Phi_pred(consumer, i) == producer) {
+ ir_node *new_block = get_Block_cfgpred_block(phi_block, i);
- if (! is_Block_unreachable(new_block))
- block = calc_dca(block, new_block);
+ if (!is_Block_unreachable(new_block))
+ dca = calc_dca(dca, new_block);
}
}
-
- if (! block)
- block = get_irn_n(producer, -1);
} else {
- assert(is_no_Block(consumer));
- block = get_nodes_block(consumer);
+ dca = calc_dca(dca, get_nodes_block(consumer));
}
- /* Compute the deepest common ancestor of block and dca. */
- return calc_dca(dca, block);
+ return dca;
}
/* FIXME: the name clashes here with the function from ana/field_temperature.c
for (i = get_irn_n_outs(node) - 1; i >= 0; --i) {
ir_node *succ = get_irn_out(node, i);
- ir_node *succ_blk;
if (is_End(succ)) {
/*
continue;
}
- if(is_Proj(succ)) {
+ if (is_Proj(succ)) {
dca = get_deepest_common_ancestor(succ, dca);
} else {
/* ignore if succ is in dead code */
- succ_blk = get_irn_n(succ, -1);
+ ir_node *succ_blk = get_nodes_block(succ);
if (is_Block_unreachable(succ_blk))
continue;
dca = consumer_dom_dca(dca, succ, node);
mark_irn_visited(n);
/* no need to place block nodes, control nodes are already placed. */
- if ((get_irn_op(n) != op_Block) &&
+ if (!is_Block(n) &&
(!is_cfop(n)) &&
(get_irn_mode(n) != mode_X)) {
/* Remember the early_blk placement of this block to move it
out of loop no further than the early_blk placement. */
- early_blk = get_irn_n(n, -1);
+ early_blk = get_nodes_block(n);
/*
* BEWARE: Here we also get code, that is live, but
producer of one of their inputs in the same block anyway. */
for (i = get_irn_n_outs(n) - 1; i >= 0; --i) {
ir_node *succ = get_irn_out(n, i);
- if (irn_not_visited(succ) && (get_irn_op(succ) != op_Phi))
+ if (irn_not_visited(succ) && !is_Phi(succ))
place_floats_late(succ, worklist);
}
if (1 || get_irg_loopinfo_state(irg) != loopinfo_consistent) {
free_loop_information(irg);
- construct_backedges(irg);
+ construct_cf_backedges(irg);
}
/* Place all floating nodes as early as possible. This guarantees
current_ir_graph = rem;
}
+typedef struct cf_env {
+ char ignore_exc_edges; /**< set if exception edges should be ignored. */
+ char changed; /**< flag indicates that the cf graphs has changed. */
+} cf_env;
+
/**
* Called by walker of remove_critical_cf_edges().
*
* predecessors and a block of multiple successors.
*
* @param n IR node
- * @param env Environment of walker. The changed field.
+ * @param env Environment of walker.
*/
static void walk_critical_cf_edges(ir_node *n, void *env) {
int arity, i;
ir_node *pre, *block, *jmp;
- int *changed = env;
+ cf_env *cenv = env;
ir_graph *irg = get_irn_irg(n);
/* Block has multiple predecessors */
const ir_op *cfop;
pre = get_irn_n(n, i);
+ /* don't count Bad's */
+ if (is_Bad(pre))
+ continue;
+
cfop = get_irn_op(skip_Proj(pre));
- /* Predecessor has multiple successors. Insert new control flow edge but
- ignore exception edges. */
- if (! is_op_fragile(cfop) && is_op_forking(cfop)) {
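+ /* fragile operations: optionally skip their exception projections, otherwise split the edge */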
+ if (is_op_fragile(cfop)) {
+ if (cenv->ignore_exc_edges && get_Proj_proj(pre) == pn_Generic_X_except)
+ continue;
+ goto insert;
+ }
+ /* we don't want to place nodes in the start block, so handle it like forking */
+ if (is_op_forking(cfop) || cfop == op_Start) {
+ /* Predecessor has multiple successors. Insert new control flow edges. */
+insert:
/* set predecessor of new block */
block = new_r_Block(irg, 1, &pre);
/* insert new jmp node to new block */
jmp = new_r_Jmp(irg, block);
/* set successor of new block */
set_irn_n(n, i, jmp);
- *changed = 1;
+ cenv->changed = 1;
} /* predecessor has multiple successors */
} /* for all predecessors */
} /* n is a multi-entry block */
}
void remove_critical_cf_edges(ir_graph *irg) {
- int changed = 0;
+ cf_env env;
+
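+ /* leave exception edges untouched by default */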
+ env.ignore_exc_edges = 1;
+ env.changed = 0;
- irg_block_walk_graph(irg, NULL, walk_critical_cf_edges, &changed);
- if (changed) {
+ irg_block_walk_graph(irg, NULL, walk_critical_cf_edges, &env);
+ if (env.changed) {
/* control flow changed */
set_irg_outs_inconsistent(irg);
set_irg_extblk_inconsistent(irg);