nsz Git - libfirm/blob - ir/ir/irgopt.c

   1 /*
   2  * Project:     libFIRM
   3  * File name:   ir/ir/irgopt.c
   4  * Purpose:     Optimizations for a whole ir graph, i.e., a procedure.
   5  * Author:      Christian Schaefer, Goetz Lindenmaier
   6  * Modified by: Sebastian Felis
   7  * Created:
   8  * CVS-ID:      $Id$
   9  * Copyright:   (c) 1998-2003 Universität Karlsruhe
  10  * Licence:     This file protected by GPL -  GNU GENERAL PUBLIC LICENSE.
  11  */
  12
  13
  14 #ifdef HAVE_CONFIG_H
  15 # include "config.h"
  16 #endif
  17
  18 #include <assert.h>
  19
  20 #include "irnode_t.h"
  21 #include "irgraph_t.h"
  22 #include "irprog_t.h"
  23
  24 #include "ircons.h"
  25 #include "iropt_t.h"
  26 #include "irgopt.h"
  27 #include "irgmod.h"
  28 #include "irgwalk.h"
  29
  30 #include "array.h"
  31 #include "pset.h"
  32 #include "pmap.h"
  33 #include "eset.h"
  34 #include "pdeq.h"       /* Fuer code placement */
  35 #include "xmalloc.h"
  36
  37 #include "irouts.h"
  38 #include "irloop_t.h"
  39 #include "irbackedge_t.h"
  40 #include "cgana.h"
  41 #include "trouts.h"
  42
  43
  44 #include "irflag_t.h"
  45 #include "irhooks.h"
  46 #include "iredges_t.h"
  47 #include "irtools.h"
  48
/* Defined in iropt.c.  Declared here because this file resets and refills
   the per-graph value table (irg->value_table) that is used for CSE. */
pset *new_identities (void);                              /* obtain a fresh value table */
void  del_identities (pset *value_table);                 /* dispose of a value table */
void  add_identities (pset *value_table, ir_node *node);  /* enter node into the value table */
  53
  54 /*------------------------------------------------------------------*/
  55 /* apply optimizations of iropt to all nodes.                       */
  56 /*------------------------------------------------------------------*/
  57
  58 static void init_link (ir_node *n, void *env) {
  59   set_irn_link(n, NULL);
  60 }
  61
  62 #if 0   /* Old version. Avoids Ids.
  63            This is not necessary:  we do a post walk, and get_irn_n
  64            removes ids anyways.  So it's much cheaper to call the
  65            optimization less often and use the exchange() algorithm. */
  66 static void
  67 optimize_in_place_wrapper (ir_node *n, void *env) {
  68   int i, irn_arity;
  69   ir_node *optimized, *old;
  70
  71   irn_arity = get_irn_arity(n);
  72   for (i = 0; i < irn_arity; i++) {
  73     /* get_irn_n skips Id nodes, so comparison old != optimized does not
  74        show all optimizations. Therefore always set new predecessor. */
  75     old = get_irn_intra_n(n, i);
  76     optimized = optimize_in_place_2(old);
  77     set_irn_n(n, i, optimized);
  78   }
  79
  80   if (get_irn_op(n) == op_Block) {
  81     optimized = optimize_in_place_2(n);
  82     if (optimized != n) exchange (n, optimized);
  83   }
  84 }
  85 #else
  86 static void
  87 optimize_in_place_wrapper (ir_node *n, void *env) {
  88   ir_node *optimized = optimize_in_place_2(n);
  89   if (optimized != n) exchange (n, optimized);
  90 }
  91 #endif
  92
  93
  94 static INLINE void do_local_optimize(ir_node *n) {
  95   /* Handle graph state */
  96   assert(get_irg_phase_state(current_ir_graph) != phase_building);
  97
  98   if (get_opt_global_cse())
  99     set_irg_pinned(current_ir_graph, op_pin_state_floats);
 100   set_irg_outs_inconsistent(current_ir_graph);
 101   set_irg_doms_inconsistent(current_ir_graph);
 102   set_irg_loopinfo_inconsistent(current_ir_graph);
 103
 104   /* Clean the value_table in irg for the CSE. */
 105   del_identities(current_ir_graph->value_table);
 106   current_ir_graph->value_table = new_identities();
 107
 108   /* walk over the graph */
 109   irg_walk(n, init_link, optimize_in_place_wrapper, NULL);
 110 }
 111
 112 void local_optimize_node(ir_node *n) {
 113   ir_graph *rem = current_ir_graph;
 114   current_ir_graph = get_irn_irg(n);
 115
 116   do_local_optimize(n);
 117
 118   current_ir_graph = rem;
 119 }
 120
 121 /**
 122  * Block-Walker: uses dominance depth to mark dead blocks.
 123  */
 124 static void kill_dead_blocks(ir_node *block, void *env)
 125 {
 126   if (get_Block_dom_depth(block) < 0)
 127     set_Block_dead(block);
 128 }
 129
 130 void
 131 local_optimize_graph (ir_graph *irg) {
 132   ir_graph *rem = current_ir_graph;
 133   current_ir_graph = irg;
 134
 135   if (get_irg_dom_state(current_ir_graph) == dom_consistent)
 136     irg_block_walk_graph(irg, NULL, kill_dead_blocks, NULL);
 137
 138   do_local_optimize(irg->end);
 139
 140   current_ir_graph = rem;
 141 }
 142
 143
 144 /*------------------------------------------------------------------*/
 145 /* Routines for dead node elimination / copying garbage collection  */
 146 /* of the obstack.                                                  */
 147 /*------------------------------------------------------------------*/
 148
/**
 * Remember the new node (the copy) in the old node.  The link field is
 * used for this because every node has one.
 */
#define set_new_node(oldn, newn)  set_irn_link(oldn, newn)

/**
 * Get the new node (the copy) that was remembered in the old node's
 * link field.  Must be read before the old node is forgotten.
 */
#define get_new_node(oldn) get_irn_link(oldn)

/**
 * Check whether a new node was set, i.e. whether the link field of n is
 * non-NULL.  Only meaningful if the link was cleared beforehand.
 */
#define has_new_node(n) (get_new_node(n) != NULL)
 163
 164 /**
 165  * We use the block_visited flag to mark that we have computed the
 166  * number of useful predecessors for this block.
 167  * Further we encode the new arity in this flag in the old blocks.
 168  * Remembering the arity is useful, as it saves a lot of pointer
 169  * accesses.  This function is called for all Phi and Block nodes
 170  * in a Block.
 171  */
 172 static INLINE int
 173 compute_new_arity(ir_node *b) {
 174   int i, res, irn_arity;
 175   int irg_v, block_v;
 176
 177   irg_v = get_irg_block_visited(current_ir_graph);
 178   block_v = get_Block_block_visited(b);
 179   if (block_v >= irg_v) {
 180     /* we computed the number of preds for this block and saved it in the
 181        block_v flag */
 182     return block_v - irg_v;
 183   } else {
 184     /* compute the number of good predecessors */
 185     res = irn_arity = get_irn_arity(b);
 186     for (i = 0; i < irn_arity; i++)
 187       if (get_irn_opcode(get_irn_n(b, i)) == iro_Bad) res--;
 188     /* save it in the flag. */
 189     set_Block_block_visited(b, irg_v + res);
 190     return res;
 191   }
 192 }
 193
 194 /**
 195  * Copies the node to the new obstack. The Ins of the new node point to
 196  * the predecessors on the old obstack.  For block/phi nodes not all
 197  * predecessors might be copied.  n->link points to the new node.
 198  * For Phi and Block nodes the function allocates in-arrays with an arity
 199  * only for useful predecessors.  The arity is determined by counting
 200  * the non-bad predecessors of the block.
 201  *
 202  * @param n    The node to be copied
 203  * @param env  if non-NULL, the node number attribute will be copied to the new node
 204  *
 205  * Note: Also used for loop unrolling.
 206  */
 207 static void copy_node(ir_node *n, void *env) {
 208   ir_node *nn, *block;
 209   int new_arity;
 210   ir_op *op = get_irn_op(n);
 211   int copy_node_nr = env != NULL;
 212
 213   /* The end node looses it's flexible in array.  This doesn't matter,
 214      as dead node elimination builds End by hand, inlineing doesn't use
 215      the End node. */
 216   /* assert(op == op_End ||  ((_ARR_DESCR(n->in))->cookie != ARR_F_MAGIC)); */
 217
 218   if (op == op_Bad) {
 219     /* node copied already */
 220     return;
 221   } else if (op == op_Block) {
 222     block = NULL;
 223     new_arity = compute_new_arity(n);
 224     n->attr.block.graph_arr = NULL;
 225   } else {
 226     block = get_nodes_block(n);
 227     if (op == op_Phi) {
 228       new_arity = compute_new_arity(block);
 229     } else {
 230       new_arity = get_irn_arity(n);
 231     }
 232   }
 233   nn = new_ir_node(get_irn_dbg_info(n),
 234            current_ir_graph,
 235            block,
 236            op,
 237            get_irn_mode(n),
 238            new_arity,
 239            get_irn_in(n) + 1);
 240   /* Copy the attributes.  These might point to additional data.  If this
 241      was allocated on the old obstack the pointers now are dangling.  This
 242      frees e.g. the memory of the graph_arr allocated in new_immBlock. */
 243   copy_node_attr(n, nn);
 244   new_backedge_info(nn);
 245
 246 #if DEBUG_libfirm
 247   if (copy_node_nr) {
 248     /* for easier debugging, we want to copy the node numbers too */
 249     nn->node_nr = n->node_nr;
 250   }
 251 #endif
 252
 253   set_new_node(n, nn);
 254   hook_dead_node_elim_subst(current_ir_graph, n, nn);
 255 }
 256
/**
 * Sets the predecessors of the copy of n (remembered in n's link field)
 * to the copies of n's predecessors.
 * Bad predecessors of Blocks, and the Phi inputs that correspond to Bad
 * block predecessors, are left out, so the copy's in-array is compacted.
 * Finally the new node is entered into the value table of
 * current_ir_graph, unless it is an End node.
 *
 * @param n    the old node; its link field must hold the new node
 * @param env  unused
 */
void
copy_preds (ir_node *n, void *env) {
  ir_node *nn, *block;
  int i, j, irn_arity;

  nn = get_new_node(n);

  /* printf("\n old node: "); DDMSG2(n);
     printf(" new node: "); DDMSG2(nn);
     printf(" arities: old: %d, new: %d\n", get_irn_arity(n), get_irn_arity(nn)); */

  if (is_Block(n)) {
    /* Don't copy Bad nodes.  i runs over the old ins, j over the new ones. */
    j = 0;
    irn_arity = get_irn_arity(n);
    for (i = 0; i < irn_arity; i++)
      if (! is_Bad(get_irn_n(n, i))) {
        set_irn_n (nn, j, get_new_node(get_irn_n(n, i)));
        /*if (is_backedge(n, i)) set_backedge(nn, j);*/
        j++;
      }
    /* Repair the block visited flag, which compute_new_arity() misused to
       cache the new arity.  Repair it in both graphs so that the old one
       can still be used. */
    set_Block_block_visited(nn, 0);
    set_Block_block_visited(n, 0);
    /* Local optimization could not merge two subsequent blocks if
       in array contained Bads.  Now it's possible.
       We don't call optimize_in_place as it requires
       that the fields in ir_graph are set properly. */
    if ((get_opt_control_flow_straightening()) &&
        (get_Block_n_cfgpreds(nn) == 1) &&
        (get_irn_op(get_Block_cfgpred(nn, 0)) == op_Jmp)) {
      /* old: the block that contains the single Jmp predecessor */
      ir_node *old = get_nodes_block(get_Block_cfgpred(nn, 0));
      if (nn == old) {
        /* Jmp jumps into the block it is in -- deal with the self cycle
           by replacing the block with the new Bad node. */
        assert(is_Bad(get_new_node(get_irg_bad(current_ir_graph))));
        exchange(nn, get_new_node(get_irg_bad(current_ir_graph)));
      } else {
        /* Merge the new block into the block of the Jmp. */
        exchange(nn, old);
      }
    }
  } else if (get_irn_op(n) == op_Phi) {
    /* Don't copy node if corresponding predecessor in block is Bad.
       The Block itself should not be Bad. */
    block = get_nodes_block(n);
    /* position -1 is the block of the node */
    set_irn_n (nn, -1, get_new_node(block));
    j = 0;
    irn_arity = get_irn_arity(n);
    for (i = 0; i < irn_arity; i++)
      if (! is_Bad(get_irn_n(block, i))) {
        set_irn_n (nn, j, get_new_node(get_irn_n(n, i)));
        /*if (is_backedge(n, i)) set_backedge(nn, j);*/
        j++;
      }
    /* If the pre walker reached this Phi after the post walker visited the
       block block_visited is > 0. */
    set_Block_block_visited(get_nodes_block(n), 0);
    /* Compacting the Phi's ins might generate Phis with only one
       predecessor.  Replace such a Phi by that predecessor. */
    if (get_irn_arity(nn) == 1)
      exchange(nn, get_irn_n(nn, 0));
  } else {
    /* All other nodes: copy every in, starting with the block at -1. */
    irn_arity = get_irn_arity(n);
    for (i = -1; i < irn_arity; i++)
      set_irn_n (nn, i, get_new_node(get_irn_n(n, i)));
  }
  /* Now the new node is complete.  We can add it to the hash table for CSE.
     @@@ inlining aborts if we identify End. Why? */
  if (get_irn_op(nn) != op_End)
    add_identities (current_ir_graph->value_table, nn);
}
 332
/**
 * Copies the graph recursively, compacts the keep-alives of the end node.
 *
 * The End, Bad and NoMem nodes are created by hand; everything else is
 * copied by walking with copy_node() (pre) and copy_preds() (post), first
 * from the block of the old End node and then from every keep-alive that
 * was not reached by an earlier walk.
 *
 * @param irg           the graph to be copied
 * @param copy_node_nr  If non-zero, the node number will be copied
 */
static void copy_graph(ir_graph *irg, int copy_node_nr) {
  ir_node *oe, *ne, *ob, *nb, *om, *nm; /* old end, new end, old bad, new bad, old NoMem, new NoMem */
  ir_node *ka;      /* keep alive */
  int i, irn_arity;

  oe = get_irg_end(irg);
  /* copy the end node by hand, allocate dynamic in array! (arity -1) */
  ne = new_ir_node(get_irn_dbg_info(oe),
           irg,
           NULL,
           op_End,
           mode_X,
           -1,
           NULL);
  /* Copy the attributes.  Well, there might be some in the future... */
  copy_node_attr(oe, ne);
  set_new_node(oe, ne);

  /* copy the Bad node; its block is set at the end of this function */
  ob = get_irg_bad(irg);
  nb = new_ir_node(get_irn_dbg_info(ob),
           irg,
           NULL,
           op_Bad,
           mode_T,
           0,
           NULL);
  set_new_node(ob, nb);

  /* copy the NoMem node; its block is set at the end of this function */
  om = get_irg_no_mem(irg);
  nm = new_ir_node(get_irn_dbg_info(om),
           irg,
           NULL,
           op_NoMem,
           mode_M,
           0,
           NULL);
  set_new_node(om, nm);

  /* copy the live nodes */
  irg_walk(get_nodes_block(oe), copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
  /* copy_preds for the end node ... */
  set_nodes_block(ne, get_new_node(get_nodes_block(oe)));

  /*- ... and now the keep alives. -*/
  /* First pick the not marked block nodes and walk them.  We must pick these
     first as else we will overlook blocks reachable from Phis. */
  irn_arity = get_irn_arity(oe);
  for (i = 0; i < irn_arity; i++) {
    ka = get_irn_intra_n(oe, i);
    if (is_Block(ka) &&
        (get_irn_visited(ka) < get_irg_visited(irg))) {
      /* We must keep the block alive and copy everything reachable */
      /* NOTE(review): the visited counter is decremented first, presumably
         because irg_walk() increments it again, so this walk continues with
         the marker of the previous walks and skips nodes copied already --
         confirm against irg_walk(). */
      set_irg_visited(irg, get_irg_visited(irg)-1);
      irg_walk(ka, copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
      add_End_keepalive(ne, get_new_node(ka));
    }
  }

  /* Now pick other nodes.  Here we will keep all! */
  irn_arity = get_irn_arity(oe);
  for (i = 0; i < irn_arity; i++) {
    ka = get_irn_intra_n(oe, i);
    if (!is_Block(ka)) {
      if (get_irn_visited(ka) < get_irg_visited(irg)) {
        /* We didn't copy the node yet.  */
        set_irg_visited(irg, get_irg_visited(irg)-1);
        irg_walk(ka, copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
      }
      add_End_keepalive(ne, get_new_node(ka));
    }
  }

  /* start block sometimes only reached after keep alives, so the blocks of
     the hand-made Bad and NoMem nodes can only be set now */
  set_nodes_block(nb, get_new_node(get_nodes_block(ob)));
  set_nodes_block(nm, get_new_node(get_nodes_block(om)));
}
 417
 418 /**
 419  * Copies the graph reachable from current_ir_graph->end to the obstack
 420  * in current_ir_graph and fixes the environment.
 421  * Then fixes the fields in current_ir_graph containing nodes of the
 422  * graph.
 423  *
 424  * @param copy_node_nr  If non-zero, the node number will be copied
 425  */
 426 static void
 427 copy_graph_env (int copy_node_nr) {
 428   ir_graph *irg = current_ir_graph;
 429   ir_node *old_end, *n;
 430   /* Not all nodes remembered in irg might be reachable
 431      from the end node.  Assure their link is set to NULL, so that
 432      we can test whether new nodes have been computed. */
 433   set_irn_link(get_irg_frame      (irg), NULL);
 434   set_irn_link(get_irg_globals    (irg), NULL);
 435   set_irn_link(get_irg_args       (irg), NULL);
 436   set_irn_link(get_irg_initial_mem(irg), NULL);
 437   set_irn_link(get_irg_bad        (irg), NULL);
 438   set_irn_link(get_irg_no_mem     (irg), NULL);
 439
 440   /* we use the block walk flag for removing Bads from Blocks ins. */
 441   inc_irg_block_visited(irg);
 442
 443   /* copy the graph */
 444   copy_graph(irg, copy_node_nr);
 445
 446   /* fix the fields in irg */
 447   old_end = get_irg_end(irg);
 448   set_irg_end        (irg, get_new_node(old_end));
 449   set_irg_end_except (irg, get_irg_end(irg));
 450   set_irg_end_reg    (irg, get_irg_end(irg));
 451   free_End(old_end);
 452   set_irg_end_block  (irg, get_new_node(get_irg_end_block(irg)));
 453
 454   n = get_irg_frame(irg);
 455   if (!has_new_node(n)) {
 456     copy_node (n, INT_TO_PTR(copy_node_nr));
 457     copy_preds(n, NULL);
 458   }
 459   n = get_irg_globals(irg);
 460   if (!has_new_node(n)) {
 461     copy_node (n, INT_TO_PTR(copy_node_nr));
 462     copy_preds(n, NULL);
 463   }
 464   n = get_irg_initial_mem(irg);
 465   if (!has_new_node(n)) {
 466     copy_node (n, INT_TO_PTR(copy_node_nr));
 467     copy_preds(n, NULL);
 468   }
 469   n = get_irg_args(irg);
 470   if (!has_new_node(n)) {
 471     copy_node (n, INT_TO_PTR(copy_node_nr));
 472     copy_preds(n, NULL);
 473   }
 474   n = get_irg_bad(irg);
 475   if (!has_new_node(n)) {
 476     copy_node(n, INT_TO_PTR(copy_node_nr));
 477     copy_preds(n, NULL);
 478   }
 479   n = get_irg_no_mem(irg);
 480   if (!has_new_node(n)) {
 481     copy_node(n, INT_TO_PTR(copy_node_nr));
 482     copy_preds(n, NULL);
 483   }
 484   set_irg_start      (irg, get_new_node(get_irg_start(irg)));
 485   set_irg_start_block(irg, get_new_node(get_irg_start_block(irg)));
 486   set_irg_frame      (irg, get_new_node(get_irg_frame(irg)));
 487   set_irg_globals    (irg, get_new_node(get_irg_globals(irg)));
 488   set_irg_initial_mem(irg, get_new_node(get_irg_initial_mem(irg)));
 489   set_irg_args       (irg, get_new_node(get_irg_args(irg)));
 490   set_irg_bad        (irg, get_new_node(get_irg_bad(irg)));
 491   set_irg_no_mem     (irg, get_new_node(get_irg_no_mem(irg)));
 492 }
 493
 494 /**
 495  * Copies all reachable nodes to a new obstack.  Removes bad inputs
 496  * from block nodes and the corresponding inputs from Phi nodes.
 497  * Merges single exit blocks with single entry blocks and removes
 498  * 1-input Phis.
 499  * Adds all new nodes to a new hash table for CSE.  Does not
 500  * perform CSE, so the hash table might contain common subexpressions.
 501  */
 502 void
 503 dead_node_elimination(ir_graph *irg) {
 504   ir_graph *rem;
 505   int rem_ipview = get_interprocedural_view();
 506   struct obstack *graveyard_obst = NULL;
 507   struct obstack *rebirth_obst   = NULL;
 508
 509   if (get_opt_optimize() && get_opt_dead_node_elimination()) {
 510     assert(! edges_activated(irg) && "dead node elimination requires disabled edges");
 511
 512     /* inform statistics that we started a dead-node elimination run */
 513     hook_dead_node_elim(irg, 1);
 514
 515     /* Remember external state of current_ir_graph. */
 516     rem = current_ir_graph;
 517     current_ir_graph = irg;
 518     set_interprocedural_view(0);
 519
 520     assert(get_irg_phase_state(current_ir_graph) != phase_building);
 521
 522     /* Handle graph state */
 523     free_callee_info(current_ir_graph);
 524     free_irg_outs(current_ir_graph);
 525     free_trouts();
 526
 527     /* @@@ so far we loose loops when copying */
 528     free_loop_information(current_ir_graph);
 529
 530     set_irg_doms_inconsistent(irg);
 531
 532     /* A quiet place, where the old obstack can rest in peace,
 533        until it will be cremated. */
 534     graveyard_obst = irg->obst;
 535
 536     /* A new obstack, where the reachable nodes will be copied to. */
 537     rebirth_obst = xmalloc (sizeof(*rebirth_obst));
 538     current_ir_graph->obst = rebirth_obst;
 539     obstack_init (current_ir_graph->obst);
 540
 541     /* We also need a new hash table for cse */
 542     del_identities (irg->value_table);
 543     irg->value_table = new_identities ();
 544
 545     /* Copy the graph from the old to the new obstack */
 546     copy_graph_env(1);
 547
 548     /* Free memory from old unoptimized obstack */
 549     obstack_free(graveyard_obst, 0);  /* First empty the obstack ... */
 550     xfree (graveyard_obst);           /* ... then free it.           */
 551
 552     /* inform statistics that the run is over */
 553     hook_dead_node_elim(irg, 0);
 554
 555     current_ir_graph = rem;
 556     set_interprocedural_view(rem_ipview);
 557   }
 558 }
 559
 560 /**
 561  * Relink bad predecessors of a block and store the old in array to the
 562  * link field. This function is called by relink_bad_predecessors().
 563  * The array of link field starts with the block operand at position 0.
 564  * If block has bad predecessors, create a new in array without bad preds.
 565  * Otherwise let in array untouched.
 566  */
 567 static void relink_bad_block_predecessors(ir_node *n, void *env) {
 568   ir_node **new_in, *irn;
 569   int i, new_irn_n, old_irn_arity, new_irn_arity = 0;
 570
 571   /* if link field of block is NULL, look for bad predecessors otherwise
 572      this is already done */
 573   if (get_irn_op(n) == op_Block &&
 574       get_irn_link(n) == NULL) {
 575
 576     /* save old predecessors in link field (position 0 is the block operand)*/
 577     set_irn_link(n, get_irn_in(n));
 578
 579     /* count predecessors without bad nodes */
 580     old_irn_arity = get_irn_arity(n);
 581     for (i = 0; i < old_irn_arity; i++)
 582       if (!is_Bad(get_irn_n(n, i))) new_irn_arity++;
 583
 584     /* arity changing: set new predecessors without bad nodes */
 585     if (new_irn_arity < old_irn_arity) {
 586       /* Get new predecessor array. We do not resize the array, as we must
 587          keep the old one to update Phis. */
 588       new_in = NEW_ARR_D (ir_node *, current_ir_graph->obst, (new_irn_arity+1));
 589
 590       /* set new predecessors in array */
 591       new_in[0] = NULL;
 592       new_irn_n = 1;
 593       for (i = 0; i < old_irn_arity; i++) {
 594         irn = get_irn_n(n, i);
 595         if (!is_Bad(irn)) {
 596           new_in[new_irn_n] = irn;
 597           is_backedge(n, i) ? set_backedge(n, new_irn_n-1) : set_not_backedge(n, new_irn_n-1);
 598           ++new_irn_n;
 599         }
 600       }
 601       //ARR_SETLEN(int, n->attr.block.backedge, new_irn_arity);
 602       ARR_SHRINKLEN(n->attr.block.backedge, new_irn_arity);
 603       n->in = new_in;
 604
 605     } /* ir node has bad predecessors */
 606
 607   } /* Block is not relinked */
 608 }
 609
 610 /**
 611  * Relinks Bad predecessors from Blocks and Phis called by walker
 612  * remove_bad_predecesors(). If n is a Block, call
 613  * relink_bad_block_redecessors(). If n is a Phi-node, call also the relinking
 614  * function of Phi's Block. If this block has bad predecessors, relink preds
 615  * of the Phi-node.
 616  */
 617 static void relink_bad_predecessors(ir_node *n, void *env) {
 618   ir_node *block, **old_in;
 619   int i, old_irn_arity, new_irn_arity;
 620
 621   /* relink bad predecessors of a block */
 622   if (get_irn_op(n) == op_Block)
 623     relink_bad_block_predecessors(n, env);
 624
 625   /* If Phi node relink its block and its predecessors */
 626   if (get_irn_op(n) == op_Phi) {
 627
 628     /* Relink predecessors of phi's block */
 629     block = get_nodes_block(n);
 630     if (get_irn_link(block) == NULL)
 631       relink_bad_block_predecessors(block, env);
 632
 633     old_in = (ir_node **)get_irn_link(block); /* Of Phi's Block */
 634     old_irn_arity = ARR_LEN(old_in);
 635
 636     /* Relink Phi predecessors if count of predecessors changed */
 637     if (old_irn_arity != ARR_LEN(get_irn_in(block))) {
 638       /* set new predecessors in array
 639          n->in[0] remains the same block */
 640       new_irn_arity = 1;
 641       for(i = 1; i < old_irn_arity; i++)
 642         if (!is_Bad((ir_node *)old_in[i])) {
 643           n->in[new_irn_arity] = n->in[i];
 644           is_backedge(n, i) ? set_backedge(n, new_irn_arity) : set_not_backedge(n, new_irn_arity);
 645           ++new_irn_arity;
 646         }
 647
 648       ARR_SETLEN(ir_node *, n->in, new_irn_arity);
 649       ARR_SETLEN(int, n->attr.phi_backedge, new_irn_arity);
 650     }
 651
 652   } /* n is a Phi node */
 653 }
 654
 655 /*
 656  * Removes Bad Bad predecessors from Blocks and the corresponding
 657  * inputs to Phi nodes as in dead_node_elimination but without
 658  * copying the graph.
 659  * On walking up set the link field to NULL, on walking down call
 660  * relink_bad_predecessors() (This function stores the old in array
 661  * to the link field and sets a new in array if arity of predecessors
 662  * changes).
 663  */
 664 void remove_bad_predecessors(ir_graph *irg) {
 665   irg_walk_graph(irg, init_link, relink_bad_predecessors, NULL);
 666 }
 667
 668
 669 /*
 670          __                      _  __ __
 671         (_     __    o     _    | \/  |_
 672         __)|_| | \_/ | \_/(/_   |_/\__|__
 673
 674   The following stuff implements a facility that automatically patches
 675   registered ir_node pointers to the new node when a dead node elimination occurs.
 676 */
 677
/**
 * A Survive DCE environment: the bookkeeping needed to patch registered
 * node pointers when dead node elimination replaces nodes by copies.
 */
struct _survive_dce_t {
        struct obstack obst;               /* memory for the list entries of registered places */
        pmap *places;                      /* maps a node to the list of places pointing to it */
        pmap *new_places;                  /* map under construction during a DCE run, NULL otherwise */
        hook_entry_t dead_node_elim;       /* hook entry for start/end of a DCE run */
        hook_entry_t dead_node_elim_subst; /* hook entry for "old node replaced by new node" */
};
 685
/**
 * Singly linked list of the registered locations that point to one node.
 */
typedef struct _survive_dce_list_t {
        struct _survive_dce_list_t *next;  /* next entry, NULL at the end of the list */
        ir_node **place;                   /* address of a node pointer to be patched */
} survive_dce_list_t;
 690
 691 static void dead_node_hook(void *context, ir_graph *irg, int start)
 692 {
 693         survive_dce_t *sd = context;
 694
 695         /* Create a new map before the dead node elimination is performed. */
 696         if(start) {
 697                 sd->new_places = pmap_create_ex(pmap_count(sd->places));
 698         }
 699
 700         /* Patch back all nodes if dead node elimination is over and something is to be done. */
 701         else {
 702                 pmap_destroy(sd->places);
 703                 sd->places     = sd->new_places;
 704                 sd->new_places = NULL;
 705         }
 706 }
 707
 708 static void dead_node_subst_hook(void *context, ir_graph *irg, ir_node *old, ir_node *nw)
 709 {
 710         survive_dce_t *sd = context;
 711         survive_dce_list_t *list = pmap_get(sd->places, old);
 712
 713         /* If the node is to be patched back, write the new address to all registered locations. */
 714         if(list) {
 715                 survive_dce_list_t *p;
 716
 717                 for(p = list; p; p = p->next)
 718                         *(p->place) = nw;
 719
 720                 pmap_insert(sd->new_places, nw, list);
 721         }
 722 }
 723
 724 /**
 725  * Make a new Survive DCE environment.
 726  */
 727 survive_dce_t *new_survive_dce(void)
 728 {
 729         survive_dce_t *res = xmalloc(sizeof(res[0]));
 730         obstack_init(&res->obst);
 731         res->places     = pmap_create();
 732         res->new_places = NULL;
 733
 734         res->dead_node_elim.hook._hook_dead_node_elim = dead_node_hook;
 735         res->dead_node_elim.context                   = res;
 736         res->dead_node_elim.next                      = NULL;
 737
 738         res->dead_node_elim_subst.hook._hook_dead_node_elim_subst = dead_node_subst_hook;
 739         res->dead_node_elim_subst.context = res;
 740         res->dead_node_elim_subst.next    = NULL;
 741
 742         register_hook(hook_dead_node_elim, &res->dead_node_elim);
 743         register_hook(hook_dead_node_elim_subst, &res->dead_node_elim_subst);
 744         return res;
 745 }
 746
 747 /**
 748  * Free a Survive DCE environment.
 749  */
 750 void free_survive_dce(survive_dce_t *sd)
 751 {
 752         obstack_free(&sd->obst, NULL);
 753         pmap_destroy(sd->places);
 754         unregister_hook(hook_dead_node_elim, &sd->dead_node_elim);
 755         unregister_hook(hook_dead_node_elim_subst, &sd->dead_node_elim_subst);
 756         free(sd);
 757 }
 758
 759 /**
 760  * Register a node pointer to be patched upon DCE.
 761  * When DCE occurs, the node pointer specified by @p place will be
 762  * patched to the new address of the node it is pointing to.
 763  *
 764  * @param sd    The Survive DCE environment.
 765  * @param place The address of the node pointer.
 766  */
 767 void survive_dce_register_irn(survive_dce_t *sd, ir_node **place)
 768 {
 769         if(*place != NULL) {
 770                 ir_node *irn      = *place;
 771                 survive_dce_list_t *curr = pmap_get(sd->places, irn);
 772                 survive_dce_list_t *nw   = obstack_alloc(&sd->obst, sizeof(nw));
 773
 774                 nw->next  = curr;
 775                 nw->place = place;
 776
 777                 pmap_insert(sd->places, irn, nw);
 778         }
 779 }
 780
 781 /*--------------------------------------------------------------------*/
 782 /*  Functionality for inlining                                         */
 783 /*--------------------------------------------------------------------*/
 784
 785 /**
 786  * Copy node for inlineing.  Updates attributes that change when
 787  * inlineing but not for dead node elimination.
 788  *
 789  * Copies the node by calling copy_node() and then updates the entity if
 790  * it's a local one.  env must be a pointer of the frame type of the
 791  * inlined procedure. The new entities must be in the link field of
 792  * the entities.
 793  */
 794 static INLINE void
 795 copy_node_inline (ir_node *n, void *env) {
 796   ir_node *nn;
 797   ir_type *frame_tp = (ir_type *)env;
 798
 799   copy_node(n, NULL);
 800   if (get_irn_op(n) == op_Sel) {
 801     nn = get_new_node (n);
 802     assert(is_Sel(nn));
 803     if (get_entity_owner(get_Sel_entity(n)) == frame_tp) {
 804       set_Sel_entity(nn, get_entity_link(get_Sel_entity(n)));
 805     }
 806   } else if (get_irn_op(n) == op_Block) {
 807     nn = get_new_node (n);
 808     nn->attr.block.irg = current_ir_graph;
 809   }
 810 }
 811
 812 static void find_addr(ir_node *node, void *env)
 813 {
 814   if (get_irn_opcode(node) == iro_Proj) {
 815     if (get_Proj_proj(node) == pn_Start_P_value_arg_base)
 816       *(int *)env = 0;
 817   }
 818 }
 819
 820 /*
 821  * currently, we cannot inline two cases:
 822  * - call with compound arguments
 823  * - graphs that take the address of a parameter
 824  *
 825  * check these conditions here
 826  */
 827 static int can_inline(ir_node *call, ir_graph *called_graph)
 828 {
 829   ir_type *call_type = get_Call_type(call);
 830   int params, ress, i, res;
 831   assert(is_Method_type(call_type));
 832
 833   params = get_method_n_params(call_type);
 834   ress   = get_method_n_ress(call_type);
 835
 836   /* check params */
 837   for (i = 0; i < params; ++i) {
 838     ir_type *p_type = get_method_param_type(call_type, i);
 839
 840     if (is_compound_type(p_type))
 841       return 0;
 842   }
 843
 844   /* check res */
 845   for (i = 0; i < ress; ++i) {
 846     ir_type *r_type = get_method_res_type(call_type, i);
 847
 848     if (is_compound_type(r_type))
 849       return 0;
 850   }
 851
 852   res = 1;
 853   irg_walk_graph(called_graph, find_addr, NULL, &res);
 854
 855   return res;
 856 }
 857
 858 int inline_method(ir_node *call, ir_graph *called_graph) {
       /* Inlines called_graph at the Call node `call` of current_ir_graph: the
          nodes of called_graph are copied into current_ir_graph and the Call is
          turned into a Tuple that delivers the results.
          Returns 1 if the call was inlined.  Returns 0 without inlining if
          inlining is disabled (options or inline property), the callee is
          variadic, can_inline() rejects the call, or called_graph is
          current_ir_graph itself.
          The Projs of the Call are read from the link list starting at the
          Call's link field (see the exc_handling computation below).
          NOTE(review): the callers in this file run collect_phiprojs() before
          calling this function -- presumably that builds these lists; confirm. */
 859   ir_node *pre_call;
 860   ir_node *post_call, *post_bl;
 861   ir_node *in[5];               /* inputs of the pre_call Tuple, indexed by pn_Start_* */
 862   ir_node *end, *end_bl;
 863   ir_node **res_pred;
 864   ir_node **cf_pred;
 865   ir_node *ret, *phi;
 866   int arity, n_ret, n_exc, n_res, i, j, rem_opt, irn_arity;
 867   int exc_handling;
 868   ir_type *called_frame;
 869   irg_inline_property prop = get_irg_inline_property(called_graph);
 870
       /* A forced inline property overrides the global switches.  Otherwise
          optimization and inlining must both be enabled and the graph must
          not forbid inlining. */
 871   if ( (prop != irg_inline_forced) &&
 872        (!get_opt_optimize() || !get_opt_inline() || (prop == irg_inline_forbidden))) return 0;
 873
 874   /* Do not inline variadic functions. */
 875   if (get_method_variadicity(get_entity_type(get_irg_entity(called_graph))) == variadicity_variadic)
 876     return 0;
 877
 878   assert(get_method_n_params(get_entity_type(get_irg_entity(called_graph))) ==
 879          get_method_n_params(get_Call_type(call)));
 880
 881   /*
 882    * currently, we cannot inline two cases:
 883    * - call with compound arguments
 884    * - graphs that take the address of a parameter
 885    */
 886   if (! can_inline(call, called_graph))
 887     return 0;
 888
 889   /* --  Turn off optimizations, this can cause problems when allocating new nodes. -- */
 890   rem_opt = get_opt_optimize();
 891   set_optimize(0);
 892
 893   /* Handle graph state */
 894   assert(get_irg_phase_state(current_ir_graph) != phase_building);
 895   assert(get_irg_pinned(current_ir_graph) == op_pin_state_pinned);
 896   assert(get_irg_pinned(called_graph) == op_pin_state_pinned);
 897   set_irg_outs_inconsistent(current_ir_graph);
 898   set_irg_extblk_inconsistent(current_ir_graph);
 899   set_irg_doms_inconsistent(current_ir_graph);
 900   set_irg_loopinfo_inconsistent(current_ir_graph);
 901   set_irg_callee_info_state(current_ir_graph, irg_callee_info_inconsistent);
 902
 903   /* -- Check preconditions -- */
 904   assert(is_Call(call));
 905   /* @@@ does not work for InterfaceIII.java after cgana
 906      assert(get_Call_type(call) == get_entity_type(get_irg_entity(called_graph)));
 907      assert(smaller_type(get_entity_type(get_irg_entity(called_graph)),
 908      get_Call_type(call)));
 909   */
 910   assert(get_type_tpop(get_Call_type(call)) == type_method);
       /* A graph is never inlined into itself.  The optimize flag saved above
          is restored before leaving; the analysis information of the graph
          has already been marked inconsistent at this point. */
 911   if (called_graph == current_ir_graph) {
 912     set_optimize(rem_opt);
 913     return 0;
 914   }
 915
 916   /* here we know we WILL inline, so inform the statistics */
 917   hook_inline(call, called_graph);
 918
 919   /* -- Decide how to handle exception control flow: Is there a handler
 920      for the Call node, or do we branch directly to End on an exception?
 921      exc_handling:
 922      0 There is a handler.
 923      1 Branches to End.
 924      2 Exception handling not represented in Firm. -- */
 925   {
 926     ir_node *proj, *Mproj = NULL, *Xproj = NULL;
         /* walk the list of Projs linked from the Call */
 927     for (proj = (ir_node *)get_irn_link(call); proj; proj = (ir_node *)get_irn_link(proj)) {
 928       assert(get_irn_op(proj) == op_Proj);
 929       if (get_Proj_proj(proj) == pn_Call_X_except) Xproj = proj;
 930       if (get_Proj_proj(proj) == pn_Call_M_except) Mproj = proj;
 931     }
 932     if      (Mproj) { assert(Xproj); exc_handling = 0; } /*  Mproj           */
 933     else if (Xproj) {                exc_handling = 1; } /* !Mproj &&  Xproj   */
 934     else            {                exc_handling = 2; } /* !Mproj && !Xproj   */
 935   }
 936
 937
 938   /* -- Pre_call is a new Tuple that collects the Start-like inputs of
 939      the procedure and later replaces the Start node of the called graph.
 940      Post_call is the old Call node and collects the results of the called
 941      graph. Both will end up being a tuple.  -- */
 942   post_bl = get_nodes_block(call);
 943   set_irg_current_block(current_ir_graph, post_bl);
 944   /* XxMxPxP of Start + parameter of Call */
 945   in[pn_Start_X_initial_exec] = new_Jmp();
 946   in[pn_Start_M]              = get_Call_mem(call);
 947   in[pn_Start_P_frame_base]   = get_irg_frame(current_ir_graph);
 948   in[pn_Start_P_globals]      = get_irg_globals(current_ir_graph);
 949   in[pn_Start_T_args]         = new_Tuple(get_Call_n_params(call), get_Call_param_arr(call));
 950   /* in[pn_Start_P_value_arg_base] = ??? */
 951   pre_call = new_Tuple(5, in);
 952   post_call = call;
 953
 954   /* --
 955      The new block gets the ins of the old block, pre_call and all its
 956      predecessors and all Phi nodes. -- */
 957   part_block(pre_call);
 958
 959   /* -- Prepare state for dead node elimination -- */
 960   /* Visited flags in calling irg must be >= flag in called irg.
 961      Else walker and arity computation will not work. */
 962   if (get_irg_visited(current_ir_graph) <= get_irg_visited(called_graph))
 963     set_irg_visited(current_ir_graph, get_irg_visited(called_graph)+1);
 964   if (get_irg_block_visited(current_ir_graph)< get_irg_block_visited(called_graph))
 965     set_irg_block_visited(current_ir_graph, get_irg_block_visited(called_graph));
 966   /* Set pre_call as new Start node in link field of the start node of
 967      called graph and pre_calls block as new block for the start block
 968      of called graph.  The Bad node of the called graph is mapped to the
 969      Bad node of the calling graph in the same way.
 970      Further mark these nodes so that they are not visited by the
         copying. */
 971   set_irn_link(get_irg_start(called_graph), pre_call);
 972   set_irn_visited(get_irg_start(called_graph), get_irg_visited(current_ir_graph));
 973   set_irn_link(get_irg_start_block(called_graph), get_nodes_block(pre_call));
 974   set_irn_visited(get_irg_start_block(called_graph), get_irg_visited(current_ir_graph));
 975   set_irn_link(get_irg_bad(called_graph), get_irg_bad(current_ir_graph));
 976   set_irn_visited(get_irg_bad(called_graph), get_irg_visited(current_ir_graph));
 977
 978   /* Initialize for compaction of in arrays */
 979   inc_irg_block_visited(current_ir_graph);
 980
 981   /* -- Replicate local entities of the called_graph -- */
 982   /* copy the entities. */
 983   called_frame = get_irg_frame_type(called_graph);
 984   for (i = 0; i < get_class_n_members(called_frame); i++) {
 985     entity *new_ent, *old_ent;
 986     old_ent = get_class_member(called_frame, i);
 987     new_ent = copy_entity_own(old_ent, get_cur_frame_type());
         /* remember the copy in the link field of the original entity */
 988     set_entity_link(old_ent, new_ent);
 989   }
 990
 991   /* visited is > than that of called graph.  With this trick visited will
 992      remain unchanged so that an outer walker, e.g., searching the call nodes
 993      to inline, calling this inline will not visit the inlined nodes. */
 994   set_irg_visited(current_ir_graph, get_irg_visited(current_ir_graph)-1);
 995
 996   /* -- Performing dead node elimination inlines the graph -- */
 997   /* Copies the nodes to the obstack of current_ir_graph. Updates links to new
 998      entities. */
 999   /* @@@ endless loops are not copied!! -- they should be, I think... */
1000   irg_walk(get_irg_end(called_graph), copy_node_inline, copy_preds,
1001            get_irg_frame_type(called_graph));
1002
1003   /* Repair called_graph */
1004   set_irg_visited(called_graph, get_irg_visited(current_ir_graph));
1005   set_irg_block_visited(called_graph, get_irg_block_visited(current_ir_graph));
1006   set_Block_block_visited(get_irg_start_block(called_graph), 0);
1007
1008   /* -- Merge the end of the inlined procedure with the call site -- */
1009   /* We will turn the old Call node into a Tuple with the following
1010      predecessors:
1011      -1:  Block of Tuple.
1012      0: Phi of all Memories of Return statements.
1013      1: Jmp from new Block that merges the control flow from all exception
1014      predecessors of the old end block.
1015      2: Tuple of all results.
1016      3: Phi of Exception memories.
1017      In case the old Call directly branches to End on an exception we don't
1018      need the block merging all exceptions nor the Phi of the exception
1019      memories.
1020   */
1021
1022   /* -- Precompute some values -- */
1023   end_bl = get_new_node(get_irg_end_block(called_graph));
1024   end = get_new_node(get_irg_end(called_graph));
1025   arity = get_irn_arity(end_bl);    /* arity = n_exc + n_ret  */
1026   n_res = get_method_n_ress(get_Call_type(call));
1027
1028   res_pred = xmalloc (n_res * sizeof(*res_pred));
1029   cf_pred  = xmalloc (arity * sizeof(*res_pred));  /* res_pred and cf_pred have the same element type */
1030
1031   set_irg_current_block(current_ir_graph, post_bl); /* just to make sure */
1032
1033   /* -- archive keepalives -- */
1034   irn_arity = get_irn_arity(end);
1035   for (i = 0; i < irn_arity; i++)
1036     add_End_keepalive(get_irg_end(current_ir_graph), get_irn_n(end, i));
1037
1038   /* The new end node will die.  We need not free as the in array is on the obstack:
1039      copy_node() only generated 'D' arrays. */
1040
1041   /* -- Replace Return nodes by Jump nodes. -- */
1042   n_ret = 0;
1043   for (i = 0; i < arity; i++) {
1044     ir_node *ret;
1045     ret = get_irn_n(end_bl, i);
1046     if (is_Return(ret)) {
1047       cf_pred[n_ret] = new_r_Jmp(current_ir_graph, get_nodes_block(ret));
1048       n_ret++;
1049     }
1050   }
       /* post_bl now has one control flow predecessor per Return of the
          inlined graph */
1051   set_irn_in(post_bl, n_ret, cf_pred);
1052
1053   /* -- Build a Tuple for all results of the method.
1054      Add Phi node if there was more than one Return.  -- */
1055   turn_into_tuple(post_call, 4);
1056   /* First the Memory-Phi */
1057   n_ret = 0;
1058   for (i = 0; i < arity; i++) {
1059     ret = get_irn_n(end_bl, i);
1060     if (is_Return(ret)) {
1061       cf_pred[n_ret] = get_Return_mem(ret);
1062       n_ret++;
1063     }
1064   }
1065   phi = new_Phi(n_ret, cf_pred, mode_M);
1066   set_Tuple_pred(call, pn_Call_M_regular, phi);
1067   /* Conserve Phi-list for further inlinings -- but might be optimized */
1068   if (get_nodes_block(phi) == post_bl) {
1069     set_irn_link(phi, get_irn_link(post_bl));
1070     set_irn_link(post_bl, phi);
1071   }
1072   /* Now the real results */
1073   if (n_res > 0) {
1074     for (j = 0; j < n_res; j++) {
           /* collect result j of every Return; cf_pred is reused as scratch array */
1075       n_ret = 0;
1076       for (i = 0; i < arity; i++) {
1077         ret = get_irn_n(end_bl, i);
1078         if (get_irn_op(ret) == op_Return) {
1079           cf_pred[n_ret] = get_Return_res(ret, j);
1080           n_ret++;
1081         }
1082       }
1083       if (n_ret > 0)
1084         phi = new_Phi(n_ret, cf_pred, get_irn_mode(cf_pred[0]));
1085       else
1086         phi = new_Bad();
1087       res_pred[j] = phi;
1088       /* Conserve Phi-list for further inlinings -- but might be optimized */
1089       if (get_nodes_block(phi) == post_bl) {
1090         set_irn_link(phi, get_irn_link(post_bl));
1091         set_irn_link(post_bl, phi);
1092       }
1093     }
1094     set_Tuple_pred(call, pn_Call_T_result, new_Tuple(n_res, res_pred));
1095   } else {
1096     set_Tuple_pred(call, pn_Call_T_result, new_Bad());
1097   }
1098   /* Finally the exception control flow.
1099      We have two (three) possible situations:
1100      First if the Call branches to an exception handler: We need to add a Phi node to
1101      collect the memory containing the exception objects.  Further we need
1102      to add another block to get a correct representation of this Phi.  To
1103      this block we add a Jmp that resolves into the X output of the Call
1104      when the Call is turned into a tuple.
1105      Second the Call branches to End, the exception is not handled.  Just
1106      add all inlined exception branches to the End node.
1107      Third: there is no Exception edge at all. Handle as case two. */
1108   if (exc_handling == 0) {
1109     n_exc = 0;
1110     for (i = 0; i < arity; i++) {
1111       ir_node *ret;
1112       ret = get_irn_n(end_bl, i);
1113       if (is_fragile_op(skip_Proj(ret)) || (get_irn_op(skip_Proj(ret)) == op_Raise)) {
1114         cf_pred[n_exc] = ret;
1115         n_exc++;
1116       }
1117     }
1118     if (n_exc > 0) {
1119       new_Block(n_exc, cf_pred);      /* watch it: current_block is changed! */
1120       set_Tuple_pred(call, pn_Call_X_except, new_Jmp());
1121       /* The Phi for the memories with the exception objects */
           /* NOTE(review): the Proj numbers 3, 0 and 1 below are literals;
              presumably they are the memory outputs of Call, of the other
              fragile ops and of Raise -- confirm against the pn_* enums. */
1122       n_exc = 0;
1123       for (i = 0; i < arity; i++) {
1124         ir_node *ret;
1125         ret = skip_Proj(get_irn_n(end_bl, i));
1126         if (is_Call(ret)) {
1127           cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_block(ret), ret, mode_M, 3);
1128           n_exc++;
1129         } else if (is_fragile_op(ret)) {
1130           /* We rely that all cfops have the memory output at the same position. */
1131           cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_block(ret), ret, mode_M, 0);
1132           n_exc++;
1133         } else if (get_irn_op(ret) == op_Raise) {
1134           cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_block(ret), ret, mode_M, 1);
1135           n_exc++;
1136         }
1137       }
1138       set_Tuple_pred(call, pn_Call_M_except, new_Phi(n_exc, cf_pred, mode_M));
1139     } else {
1140       set_Tuple_pred(call, pn_Call_X_except, new_Bad());
1141       set_Tuple_pred(call, pn_Call_M_except, new_Bad());
1142     }
1143   } else {
1144     ir_node *main_end_bl;
1145     int main_end_bl_arity;
1146     ir_node **end_preds;
1147
1148     /* assert(exc_handling == 1 || no exceptions. ) */
1149     n_exc = 0;
1150     for (i = 0; i < arity; i++) {
1151       ir_node *ret = get_irn_n(end_bl, i);
1152
1153       if (is_fragile_op(skip_Proj(ret)) || (get_irn_op(skip_Proj(ret)) == op_Raise)) {
1154         cf_pred[n_exc] = ret;
1155         n_exc++;
1156       }
1157     }
         /* append the inlined exception branches to the predecessors of the
            end block of the calling graph */
1158     main_end_bl = get_irg_end_block(current_ir_graph);
1159     main_end_bl_arity = get_irn_arity(main_end_bl);
1160     end_preds =  xmalloc ((n_exc + main_end_bl_arity) * sizeof(*end_preds));
1161
1162     for (i = 0; i < main_end_bl_arity; ++i)
1163       end_preds[i] = get_irn_n(main_end_bl, i);
1164     for (i = 0; i < n_exc; ++i)
1165       end_preds[main_end_bl_arity + i] = cf_pred[i];
1166     set_irn_in(main_end_bl, n_exc + main_end_bl_arity, end_preds);
1167     set_Tuple_pred(call, pn_Call_X_except, new_Bad());
1168     set_Tuple_pred(call, pn_Call_M_except, new_Bad());
1169     free(end_preds);
1170   }
1171   free(res_pred);
1172   free(cf_pred);
1173
1174 #if 0  /* old. now better, correcter, faster implementation. */
1175   if (n_exc > 0) {
1176     /* -- If the exception control flow from the inlined Call directly
1177        branched to the end block we now have the following control
1178        flow predecessor pattern: ProjX -> Tuple -> Jmp.  We must
1179        remove the Jmp along with it's empty block and add Jmp's
1180        predecessors as predecessors of this end block.  No problem if
1181        there is no exception, because then branches Bad to End which
1182        is fine. --
1183        @@@ can't we know this beforehand: by getting the Proj(1) from
1184        the Call link list and checking whether it goes to Proj. */
1185     /* find the problematic predecessor of the end block. */
1186     end_bl = get_irg_end_block(current_ir_graph);
1187     for (i = 0; i < get_Block_n_cfgpreds(end_bl); i++) {
1188       cf_op = get_Block_cfgpred(end_bl, i);
1189       if (get_irn_op(cf_op) == op_Proj) {
1190         cf_op = get_Proj_pred(cf_op);
1191         if ((get_irn_op(cf_op) == op_Tuple) && (cf_op == call)) {
1192           /*  There are unoptimized tuples from inlineing before when no exc */
1193           assert(get_Proj_proj(get_Block_cfgpred(end_bl, i)) == pn_Call_X_except);
1194           cf_op = get_Tuple_pred(cf_op, pn_Call_X_except);
1195           assert(get_irn_op(cf_op) == op_Jmp);
1196           break;
1197         }
1198       }
1199     }
1200     /* repair */
1201     if (i < get_Block_n_cfgpreds(end_bl)) {
1202       bl = get_nodes_block(cf_op);
1203       arity = get_Block_n_cfgpreds(end_bl) + get_Block_n_cfgpreds(bl) - 1;
1204       cf_pred = xmalloc (arity * sizeof(*cf_pred));
1205       for (j = 0; j < i; j++)
1206         cf_pred[j] = get_Block_cfgpred(end_bl, j);
1207       for (j = j; j < i + get_Block_n_cfgpreds(bl); j++)
1208         cf_pred[j] = get_Block_cfgpred(bl, j-i);
1209       for (j = j; j < arity; j++)
1210         cf_pred[j] = get_Block_cfgpred(end_bl, j-get_Block_n_cfgpreds(bl) +1);
1211       set_irn_in(end_bl, arity, cf_pred);
1212       free(cf_pred);
1213       /*  Remove the exception pred from post-call Tuple. */
1214       set_Tuple_pred(call, pn_Call_X_except, new_Bad());
1215     }
1216   }
1217 #endif
1218
1219   /* --  Restore the optimization flag saved in rem_opt. -- */
1220   set_optimize(rem_opt);
1221
1222   return 1;
1223 }
1224
1225 /********************************************************************/
1226 /* Apply inlining to small methods.                                 */
1227 /********************************************************************/
1228
1229 /* It makes no sense to inline too many calls in one procedure. Anyways,
1230    I didn't get a version with NEW_ARR_F to run.
        MAX_INLINE is the capacity of inline_env_t.calls: collect_calls() stops
        recording once pos reaches it, and inline_small_irgs() inlines nothing
        at all if the limit was reached. */
1231 #define MAX_INLINE 1024
1232
1233 /**
1234  * environment for inlining small irgs
1235  */
1236 typedef struct _inline_env_t {
1237   int pos;                      /**< number of entries used in calls[] */
1238   ir_node *calls[MAX_INLINE];   /**< the Call nodes collected by collect_calls() */
1239 } inline_env_t;
1240
1241 /**
1242  * Returns the irg called from a Call node. If the irg is not
1243  * known, NULL is returned.
1244  */
1245 static ir_graph *get_call_called_irg(ir_node *call) {
1246   ir_node *addr;
1247   ir_graph *called_irg = NULL;
1248
1249   assert(is_Call(call));
1250
1251   addr = get_Call_ptr(call);
1252   if ((get_irn_op(addr) == op_SymConst) && (get_SymConst_kind (addr) == symconst_addr_ent)) {
1253     called_irg = get_entity_irg(get_SymConst_entity(addr));
1254   }
1255
1256   return called_irg;
1257 }
1258
1259 static void collect_calls(ir_node *call, void *env) {
1260   ir_node *addr;
1261
1262   if (! is_Call(call)) return;
1263
1264   addr = get_Call_ptr(call);
1265
1266   if (get_irn_op(addr) == op_SymConst) {
1267     if (get_SymConst_kind(addr) == symconst_addr_ent) {
1268       ir_graph *called_irg = get_entity_irg(get_SymConst_entity(addr));
1269       inline_env_t *ienv = (inline_env_t *)env;
1270       if (called_irg && ienv->pos < MAX_INLINE) {
1271         /* The Call node calls a locally defined method.  Remember to inline. */
1272         ienv->calls[ienv->pos++] = call;
1273       }
1274     }
1275   }
1276 }
1277
1278 /**
1279  * Inlines all small methods at call sites where the called address comes
1280  * from a Const node that references the entity representing the called
1281  * method.
1282  * The size argument is a rough measure for the code size of the method:
1283  * Methods where the obstack containing the firm graph is smaller than
1284  * size are inlined.
1285  */
1286 void inline_small_irgs(ir_graph *irg, int size) {
1287   int i;
1288   ir_graph *rem = current_ir_graph;
1289   inline_env_t env /* = {0, NULL}*/;
1290
1291   if (!(get_opt_optimize() && get_opt_inline())) return;
1292
1293   current_ir_graph = irg;
1294   /* Handle graph state */
1295   assert(get_irg_phase_state(current_ir_graph) != phase_building);
1296   free_callee_info(current_ir_graph);
1297
1298   /* Find Call nodes to inline.
1299      (We can not inline during a walk of the graph, as inlineing the same
1300      method several times changes the visited flag of the walked graph:
1301      after the first inlineing visited of the callee equals visited of
1302      the caller.  With the next inlineing both are increased.) */
1303   env.pos = 0;
1304   irg_walk(get_irg_end(irg), NULL, collect_calls, &env);
1305
1306   if ((env.pos > 0) && (env.pos < MAX_INLINE)) {
1307     /* There are calls to inline */
1308     collect_phiprojs(irg);
1309     for (i = 0; i < env.pos; i++) {
1310       ir_graph *callee;
1311       callee = get_entity_irg(get_SymConst_entity(get_Call_ptr(env.calls[i])));
1312       if (((_obstack_memory_used(callee->obst) - (int)obstack_room(callee->obst)) < size) ||
1313         (get_irg_inline_property(callee) == irg_inline_forced)) {
1314         inline_method(env.calls[i], callee);
1315       }
1316     }
1317   }
1318
1319   current_ir_graph = rem;
1320 }
1321
1322 /**
1323  * Environment for inlining irgs.
      * inline_leave_functions() attaches one instance to the link field of
      * every graph; collect_calls2() fills in the counters.
1324  */
1325 typedef struct {
1326   int n_nodes;       /**< Nodes in graph; collect_calls2() skips Proj, Tuple and Sync, the initial -2 offsets Start and End */
1327   int n_nodes_orig;  /**< for statistics */
1328   eset *call_nodes;  /**< All call nodes in this graph */
1329   int n_call_nodes;  /**< Number of call nodes; decremented when a call is inlined */
1330   int n_call_nodes_orig; /**< for statistics */
1331   int n_callers;   /**< Number of known graphs that call this graphs. */
1332   int n_callers_orig; /**< for statistics */
1333 } inline_irg_env;
1334
1335 /**
1336  * Allocate a new environment for inlining.
1337  */
1338 static inline_irg_env *new_inline_irg_env(void) {
1339   inline_irg_env *env    = xmalloc(sizeof(*env));
1340   env->n_nodes           = -2; /* do not count count Start, End */
1341   env->n_nodes_orig      = -2; /* do not count Start, End */
1342   env->call_nodes        = eset_create();
1343   env->n_call_nodes      = 0;
1344   env->n_call_nodes_orig = 0;
1345   env->n_callers         = 0;
1346   env->n_callers_orig    = 0;
1347   return env;
1348 }
1349
1350 /**
1351  * destroy an environment for inlining.
1352  */
1353 static void free_inline_irg_env(inline_irg_env *env) {
1354   eset_destroy(env->call_nodes);
1355   free(env);
1356 }
1357
1358 /**
1359  * post-walker: collect all calls in the inline-environment
1360  * of a graph and sum some statistics.
1361  */
1362 static void collect_calls2(ir_node *call, void *env) {
1363   inline_irg_env *x = (inline_irg_env *)env;
1364   ir_op *op = get_irn_op(call);
1365   ir_graph *callee;
1366
1367   /* count meaningful nodes in irg */
1368   if (op != op_Proj && op != op_Tuple && op != op_Sync) {
1369     x->n_nodes++;
1370     x->n_nodes_orig++;
1371   }
1372
1373   if (op != op_Call) return;
1374
1375   /* collect all call nodes */
1376   eset_insert(x->call_nodes, call);
1377   x->n_call_nodes++;
1378   x->n_call_nodes_orig++;
1379
1380   /* count all static callers */
1381   callee = get_call_called_irg(call);
1382   if (callee) {
1383     inline_irg_env *callee_env = get_irg_link(callee);
1384     callee_env->n_callers++;
1385     callee_env->n_callers_orig++;
1386   }
1387 }
1388
1389 /**
1390  * Returns TRUE if the number of callers in 0 in the irg's environment,
1391  * hence this irg is a leave.
1392  */
1393 INLINE static int is_leave(ir_graph *irg) {
1394   return (((inline_irg_env *)get_irg_link(irg))->n_call_nodes == 0);
1395 }
1396
1397 /**
1398  * Returns TRUE if the number of callers is smaller size in the irg's environment.
1399  */
1400 INLINE static int is_smaller(ir_graph *callee, int size) {
1401   return (((inline_irg_env *)get_irg_link(callee))->n_nodes < size);
1402 }
1403
1404
1405 /*
1406  * Inlines small leave methods at call sites where the called address comes
1407  * from a Const node that references the entity representing the called
1408  * method.
1409  * The size argument is a rough measure for the code size of the method:
1410  * Methods where the obstack containing the firm graph is smaller than
1411  * size are inlined.
1412  */
1413 void inline_leave_functions(int maxsize, int leavesize, int size) {
1414   inline_irg_env *env;
1415   int i, n_irgs = get_irp_n_irgs();
1416   ir_graph *rem = current_ir_graph;
1417   int did_inline = 1;
1418
1419   if (!(get_opt_optimize() && get_opt_inline())) return;
1420
1421   /* extend all irgs by a temporary data structure for inlining. */
1422   for (i = 0; i < n_irgs; ++i)
1423     set_irg_link(get_irp_irg(i), new_inline_irg_env());
1424
1425   /* Precompute information in temporary data structure. */
1426   for (i = 0; i < n_irgs; ++i) {
1427     current_ir_graph = get_irp_irg(i);
1428     assert(get_irg_phase_state(current_ir_graph) != phase_building);
1429     free_callee_info(current_ir_graph);
1430
1431     irg_walk(get_irg_end(current_ir_graph), NULL, collect_calls2,
1432              get_irg_link(current_ir_graph));
1433   }
1434
1435   /* -- and now inline. -- */
1436
1437   /* Inline leaves recursively -- we might construct new leaves. */
1438   while (did_inline) {
1439     did_inline = 0;
1440
1441     for (i = 0; i < n_irgs; ++i) {
1442       ir_node *call;
1443       int phiproj_computed = 0;
1444
1445       current_ir_graph = get_irp_irg(i);
1446       env = (inline_irg_env *)get_irg_link(current_ir_graph);
1447
1448       for (call = eset_first(env->call_nodes); call; call = eset_next(env->call_nodes)) {
1449         ir_graph *callee;
1450
1451         if (get_irn_op(call) == op_Tuple) continue;   /* We already have inlined this call. */
1452         callee = get_call_called_irg(call);
1453
1454         if (env->n_nodes > maxsize) continue; // break;
1455
1456         if (callee && (is_leave(callee) && is_smaller(callee, leavesize))) {
1457           if (!phiproj_computed) {
1458             phiproj_computed = 1;
1459             collect_phiprojs(current_ir_graph);
1460           }
1461           did_inline = inline_method(call, callee);
1462
1463           if (did_inline) {
1464             /* Do some statistics */
1465             inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
1466             env->n_call_nodes --;
1467             env->n_nodes += callee_env->n_nodes;
1468             callee_env->n_callers--;
1469           }
1470         }
1471       }
1472     }
1473   }
1474
1475   /* inline other small functions. */
1476   for (i = 0; i < n_irgs; ++i) {
1477     ir_node *call;
1478     eset *walkset;
1479     int phiproj_computed = 0;
1480
1481     current_ir_graph = get_irp_irg(i);
1482     env = (inline_irg_env *)get_irg_link(current_ir_graph);
1483
1484     /* we can not walk and change a set, nor remove from it.
1485        So recompute.*/
1486     walkset = env->call_nodes;
1487     env->call_nodes = eset_create();
1488     for (call = eset_first(walkset); call; call = eset_next(walkset)) {
1489       ir_graph *callee;
1490
1491       if (get_irn_op(call) == op_Tuple) continue;   /* We already inlined. */
1492       callee = get_call_called_irg(call);
1493
1494       if (callee &&
1495           ((is_smaller(callee, size) && (env->n_nodes < maxsize)) ||    /* small function */
1496            (get_irg_inline_property(callee) == irg_inline_forced))) {
1497         if (!phiproj_computed) {
1498             phiproj_computed = 1;
1499             collect_phiprojs(current_ir_graph);
1500         }
1501         if (inline_method(call, callee)) {
1502           inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
1503           env->n_call_nodes--;
1504           eset_insert_all(env->call_nodes, callee_env->call_nodes);  /* @@@ ??? This are the wrong nodes !? Not the copied ones. */
1505           env->n_call_nodes += callee_env->n_call_nodes;
1506           env->n_nodes += callee_env->n_nodes;
1507           callee_env->n_callers--;
1508         }
1509       } else {
1510         eset_insert(env->call_nodes, call);
1511       }
1512     }
1513     eset_destroy(walkset);
1514   }
1515
1516   for (i = 0; i < n_irgs; ++i) {
1517     current_ir_graph = get_irp_irg(i);
1518 #if 0
1519     env = (inline_irg_env *)get_irg_link(current_ir_graph);
1520     if ((env->n_call_nodes_orig != env->n_call_nodes) ||
1521         (env->n_callers_orig != env->n_callers))
1522       printf("Nodes:%3d ->%3d, calls:%3d ->%3d, callers:%3d ->%3d, -- %s\n",
1523              env->n_nodes_orig, env->n_nodes, env->n_call_nodes_orig, env->n_call_nodes,
1524              env->n_callers_orig, env->n_callers,
1525              get_entity_name(get_irg_entity(current_ir_graph)));
1526 #endif
1527     free_inline_irg_env((inline_irg_env *)get_irg_link(current_ir_graph));
1528   }
1529
1530   current_ir_graph = rem;
1531 }
1532
1533 /*******************************************************************/
1534 /*  Code Placement.  Pins all floating nodes to a block where they */
1535 /*  will be executed only if needed.                               */
1536 /*******************************************************************/
1537
1538 /**
1539  * Returns non-zero, is a block is not reachable from Start.
1540  *
1541  * @param block  the block to test
1542  */
1543 static int
1544 is_Block_unreachable(ir_node *block) {
1545   return is_Block_dead(block) || get_Block_dom_depth(block) < 0;
1546 }
1547
1548 /**
1549  * Find the earliest correct block for N.  --- Place N into the
1550  * same Block as its dominance-deepest Input.
1551  *
1552  * We have to avoid calls to get_nodes_block() here
1553  * because the graph is floating.
1554  *
1555  * move_out_of_loops() expects that place_floats_early() have placed
1556  * all "living" nodes into a living block. That's why we must
1557  * move nodes in dead block with "live" successors into a valid
1558  * block.
1559  * We move them just into the same block as it's successor (or
1560  * in case of a Phi into the effective use block). For Phi successors,
1561  * this may still be a dead block, but then there is no real use, as
1562  * the control flow will be dead later.
      *
      * @param n         the node to place; it must not have been visited yet
      *                  and is marked visited here
      * @param worklist  queue that receives the not yet visited predecessors
      *                  which are not handled by the recursion
1563  */
1564 static void
1565 place_floats_early(ir_node *n, pdeq *worklist)
1566 {
1567   int i, irn_arity;
1568
1569   /* we must not run into an infinite loop */
1570   assert(irn_not_visited(n));
1571   mark_irn_visited(n);
1572
1573   /* Place floating nodes. */
1574   if (get_irn_pinned(n) == op_pin_state_floats) {
         /* input -1 is the block of n, read without get_nodes_block() */
1575     ir_node *curr_block = get_irn_n(n, -1);
1576     int in_dead_block   = is_Block_unreachable(curr_block);
1577     int depth           = 0;
1578     ir_node *b          = NULL;   /* The block to place this node in */
1579
1580     assert(get_irn_op(n) != op_Block);
1581
1582     if ((get_irn_op(n) == op_Const) ||
1583         (get_irn_op(n) == op_SymConst) ||
1584         (is_Bad(n)) ||
1585         (get_irn_op(n) == op_Unknown)) {
1586       /* These nodes will not be placed by the loop below. */
1587       b = get_irg_start_block(current_ir_graph);
1588       depth = 1;
1589     }
1590
1591     /* find the block for this node. */
1592     irn_arity = get_irn_arity(n);
1593     for (i = 0; i < irn_arity; i++) {
1594       ir_node *pred = get_irn_n(n, i);
1595       ir_node *pred_block;
1596
1597       if ((irn_not_visited(pred))
1598          && (get_irn_pinned(pred) == op_pin_state_floats)) {
1599
1600         /*
1601          * If the current node is NOT in a dead block, but one of its
1602          * predecessors is, we must move the predecessor to a live block.
1603          * Such thing can happen, if global CSE chose a node from a dead block.
1604          * We move it simple to our block.
1605          * Note that neither Phi nor End nodes are floating, so we don't
1606          * need to handle them here.
1607          */
1608         if (! in_dead_block) {
1609           if (get_irn_pinned(pred) == op_pin_state_floats &&
1610               is_Block_unreachable(get_irn_n(pred, -1)))
1611             set_nodes_block(pred, curr_block);
1612         }
             /* place the floating predecessor first, so that its block is
                final when it is inspected below */
1613         place_floats_early(pred, worklist);
1614       }
1615
1616       /*
1617        * A node in the Bad block must stay in the bad block,
1618        * so don't compute a new block for it.
1619        */
1620       if (in_dead_block)
1621         continue;
1622
1623       /* Because all loops contain at least one op_pin_state_pinned node, now all
1624          our inputs are either op_pin_state_pinned or place_early() has already
1625          been finished on them.  We do not have any unfinished inputs!  */
1626       pred_block = get_irn_n(pred, -1);
           /* keep the live predecessor block with the largest dominance depth */
1627       if ((!is_Block_dead(pred_block)) &&
1628           (get_Block_dom_depth(pred_block) > depth)) {
1629         b = pred_block;
1630         depth = get_Block_dom_depth(pred_block);
1631       }
1632       /* Avoid that the node is placed in the Start block */
1633       if ((depth == 1) && (get_Block_dom_depth(get_irn_n(n, -1)) > 1)) {
1634         b = get_Block_cfg_out(get_irg_start_block(current_ir_graph), 0);
1635         assert(b != get_irg_start_block(current_ir_graph));
1636         depth = 2;
1637       }
1638     }
         /* b is NULL if no candidate block was found; n keeps its block then */
1639     if (b)
1640       set_nodes_block(n, b);
1641   }
1642
1643   /*
1644    * Add predecessors of non floating nodes and non-floating predecessors
1645    * of floating nodes to worklist and fix their blocks if the are in dead block.
1646    */
1647   irn_arity = get_irn_arity(n);
1648
1649   if (get_irn_op(n) == op_End) {
1650     /*
1651      * Simplest case: End node. Predecessors are keep-alives,
1652      * no need to move out of dead block.
1653      */
         /* starts at -1, so the block input of End is queued as well */
1654     for (i = -1; i < irn_arity; ++i) {
1655       ir_node *pred = get_irn_n(n, i);
1656       if (irn_not_visited(pred))
1657         pdeq_putr(worklist, pred);
1658     }
1659   }
1660   else if (is_Block(n)) {
1661     /*
1662      * Blocks: Predecessors are control flow, no need to move
1663      * them out of dead block.
1664      */
1665     for (i = irn_arity - 1; i >= 0; --i) {
1666       ir_node *pred = get_irn_n(n, i);
1667       if (irn_not_visited(pred))
1668         pdeq_putr(worklist, pred);
1669     }
1670   }
1671   else if (is_Phi(n)) {
1672     ir_node *pred;
1673     ir_node *curr_block = get_irn_n(n, -1);
1674     int in_dead_block   = is_Block_unreachable(curr_block);
1675
1676     /*
1677      * Phi nodes: move nodes from dead blocks into the effective use
1678      * of the Phi-input if the Phi is not in a bad block.
1679      */
         /* first queue the block of the Phi itself */
1680     pred = get_irn_n(n, -1);
1681     if (irn_not_visited(pred))
1682       pdeq_putr(worklist, pred);
1683
1684     for (i = irn_arity - 1; i >= 0; --i) {
1685       ir_node *pred = get_irn_n(n, i);
1686
1687       if (irn_not_visited(pred)) {
1688         if (! in_dead_block &&
1689             get_irn_pinned(pred) == op_pin_state_floats &&
1690             is_Block_unreachable(get_irn_n(pred, -1))) {
               /* the effective use of input i is the i-th control flow
                  predecessor block of the Phi's block */
1691           set_nodes_block(pred, get_Block_cfgpred_block(curr_block, i));
1692         }
1693         pdeq_putr(worklist, pred);
1694       }
1695     }
1696   }
1697   else {
1698     ir_node *pred;
1699     ir_node *curr_block = get_irn_n(n, -1);
1700     int in_dead_block   = is_Block_unreachable(curr_block);
1701
1702     /*
1703      * All other nodes: move nodes from dead blocks into the same block.
1704      */
         /* first queue the block of n itself */
1705     pred = get_irn_n(n, -1);
1706     if (irn_not_visited(pred))
1707       pdeq_putr(worklist, pred);
1708
1709     for (i = irn_arity - 1; i >= 0; --i) {
1710       ir_node *pred = get_irn_n(n, i);
1711
1712       if (irn_not_visited(pred)) {
1713         if (! in_dead_block &&
1714             get_irn_pinned(pred) == op_pin_state_floats &&
1715             is_Block_unreachable(get_irn_n(pred, -1))) {
1716           set_nodes_block(pred, curr_block);
1717         }
1718         pdeq_putr(worklist, pred);
1719       }
1720     }
1721   }
1722 }
1723
1724 /**
1725  * Floating nodes form subgraphs that begin at nodes as Const, Load,
1726  * Start, Call and that end at op_pin_state_pinned nodes as Store, Call.  Place_early
1727  * places all floating nodes reachable from its argument through floating
1728  * nodes and adds all beginnings at op_pin_state_pinned nodes to the worklist.
1729  */
1730 static INLINE void place_early(pdeq *worklist) {
1731   assert(worklist);
1732   inc_irg_visited(current_ir_graph);
1733
1734   /* this inits the worklist */
1735   place_floats_early(get_irg_end(current_ir_graph), worklist);
1736
1737   /* Work the content of the worklist. */
1738   while (!pdeq_empty(worklist)) {
1739     ir_node *n = pdeq_getl(worklist);
1740     if (irn_not_visited(n))
1741       place_floats_early(n, worklist);
1742   }
1743
1744   set_irg_outs_inconsistent(current_ir_graph);
1745   set_irg_pinned(current_ir_graph, op_pin_state_pinned);
1746 }
1747
1748 /**
1749  * Compute the deepest common ancestor of block and dca.
1750  */
1751 static ir_node *calc_dca(ir_node *dca, ir_node *block)
1752 {
1753   assert(block);
1754
1755   /* we do not want to place nodes in dead blocks */
1756   if (is_Block_dead(block))
1757     return dca;
1758
1759   /* We found a first legal placement. */
1760   if (!dca) return block;
1761
1762   /* Find a placement that is dominates both, dca and block. */
1763   while (get_Block_dom_depth(block) > get_Block_dom_depth(dca))
1764     block = get_Block_idom(block);
1765
1766   while (get_Block_dom_depth(dca) > get_Block_dom_depth(block)) {
1767     dca = get_Block_idom(dca);
1768   }
1769
1770   while (block != dca)
1771     { block = get_Block_idom(block); dca = get_Block_idom(dca); }
1772
1773   return dca;
1774 }
1775
1776 /** Deepest common dominance ancestor of DCA and CONSUMER of PRODUCER.
1777  * I.e., DCA is the block where we might place PRODUCER.
1778  * A data flow edge points from producer to consumer.
1779  */
1780 static ir_node *
1781 consumer_dom_dca(ir_node *dca, ir_node *consumer, ir_node *producer)
1782 {
1783   ir_node *block = NULL;
1784
1785   /* Compute the latest block into which we can place a node so that it is
1786      before consumer. */
1787   if (get_irn_op(consumer) == op_Phi) {
1788     /* our consumer is a Phi-node, the effective use is in all those
1789        blocks through which the Phi-node reaches producer */
1790     int i, irn_arity;
1791     ir_node *phi_block = get_nodes_block(consumer);
1792     irn_arity = get_irn_arity(consumer);
1793
1794     for (i = 0;  i < irn_arity; i++) {
1795       if (get_irn_n(consumer, i) == producer) {
1796         ir_node *new_block = get_nodes_block(get_Block_cfgpred(phi_block, i));
1797
1798         if (! is_Block_unreachable(new_block))
1799           block = calc_dca(block, new_block);
1800       }
1801     }
1802
1803     if (! block)
1804       block = get_irn_n(producer, -1);
1805   }
1806   else {
1807     assert(is_no_Block(consumer));
1808     block = get_nodes_block(consumer);
1809   }
1810
1811   /* Compute the deepest common ancestor of block and dca. */
1812   return calc_dca(dca, block);
1813 }
1814
1815 /* FIXME: the name clashes here with the function from ana/field_temperature.c
1816  * please rename. */
1817 static INLINE int get_irn_loop_depth(ir_node *n) {
1818   return get_loop_depth(get_irn_loop(n));
1819 }
1820
1821 /**
1822  * Move n to a block with less loop depth than it's current block. The
1823  * new block must be dominated by early.
1824  *
1825  * @param n      the node that should be moved
1826  * @param early  the earliest block we can n move to
1827  */
1828 static void
1829 move_out_of_loops (ir_node *n, ir_node *early)
1830 {
1831   ir_node *best, *dca;
1832   assert(n && early);
1833
1834
1835   /* Find the region deepest in the dominator tree dominating
1836      dca with the least loop nesting depth, but still dominated
1837      by our early placement. */
1838   dca = get_nodes_block(n);
1839
1840   best = dca;
1841   while (dca != early) {
1842     dca = get_Block_idom(dca);
1843     if (!dca || is_Bad(dca)) break; /* may be Bad if not reachable from Start */
1844     if (get_irn_loop_depth(dca) < get_irn_loop_depth(best)) {
1845       best = dca;
1846     }
1847   }
1848   if (best != get_nodes_block(n)) {
1849     /* debug output
1850     printf("Moving out of loop: "); DDMN(n);
1851     printf(" Outermost block: "); DDMN(early);
1852     printf(" Best block: "); DDMN(best);
1853     printf(" Innermost block: "); DDMN(get_nodes_block(n));
1854     */
1855     set_nodes_block(n, best);
1856   }
1857 }
1858
1859 /**
1860  * Find the latest legal block for N and place N into the
1861  * `optimal' Block between the latest and earliest legal block.
1862  * The `optimal' block is the dominance-deepest block of those
1863  * with the least loop-nesting-depth.  This places N out of as many
1864  * loops as possible and then makes it as control dependent as
1865  * possible.
1866  */
1867 static void
1868 place_floats_late(ir_node *n, pdeq *worklist)
1869 {
1870   int i;
1871   ir_node *early_blk;
1872
1873   assert(irn_not_visited(n)); /* no multiple placement */
1874
1875   mark_irn_visited(n);
1876
1877   /* no need to place block nodes, control nodes are already placed. */
1878   if ((get_irn_op(n) != op_Block) &&
1879       (!is_cfop(n)) &&
1880       (get_irn_mode(n) != mode_X)) {
1881     /* Remember the early_blk placement of this block to move it
1882        out of loop no further than the early_blk placement. */
1883     early_blk = get_irn_n(n, -1);
1884
1885     /*
1886      * BEWARE: Here we also get code, that is live, but
1887      * was in a dead block.  If the node is life, but because
1888      * of CSE in a dead block, we still might need it.
1889      */
1890
1891     /* Assure that our users are all placed, except the Phi-nodes.
1892        --- Each data flow cycle contains at least one Phi-node.  We
1893        have to break the `user has to be placed before the
1894        producer' dependence cycle and the Phi-nodes are the
1895        place to do so, because we need to base our placement on the
1896        final region of our users, which is OK with Phi-nodes, as they
1897        are op_pin_state_pinned, and they never have to be placed after a
1898        producer of one of their inputs in the same block anyway. */
1899     for (i = get_irn_n_outs(n) - 1; i >= 0; --i) {
1900       ir_node *succ = get_irn_out(n, i);
1901       if (irn_not_visited(succ) && (get_irn_op(succ) != op_Phi))
1902         place_floats_late(succ, worklist);
1903     }
1904
1905     if (! is_Block_dead(early_blk)) {
1906       /* do only move things that where not dead */
1907
1908       /* We have to determine the final block of this node... except for
1909          constants. */
1910       if ((get_irn_pinned(n) == op_pin_state_floats) &&
1911           (get_irn_op(n) != op_Const) &&
1912           (get_irn_op(n) != op_SymConst)) {
1913         ir_node *dca = NULL;  /* deepest common ancestor in the
1914                      dominator tree of all nodes'
1915                      blocks depending on us; our final
1916                      placement has to dominate DCA. */
1917         for (i = get_irn_n_outs(n) - 1; i >= 0; --i) {
1918           ir_node *succ = get_irn_out(n, i);
1919           ir_node *succ_blk;
1920
1921           if (get_irn_op(succ) == op_End) {
1922             /*
1923              * This consumer is the End node, a keep alive edge.
1924              * This is not a real consumer, so we ignore it
1925              */
1926             continue;
1927           }
1928
1929           /* ignore if succ is in dead code */
1930           succ_blk = get_irn_n(succ, -1);
1931           if (is_Block_unreachable(succ_blk))
1932             continue;
1933           dca = consumer_dom_dca(dca, succ, n);
1934         }
1935         if (dca) {
1936           set_nodes_block(n, dca);
1937           move_out_of_loops(n, early_blk);
1938         }
1939       }
1940     }
1941   }
1942
1943   /* Add predecessors of all non-floating nodes on list. (Those of floating
1944      nodes are placed already and therefore are marked.)  */
1945   for (i = 0; i < get_irn_n_outs(n); i++) {
1946     ir_node *succ = get_irn_out(n, i);
1947     if (irn_not_visited(get_irn_out(n, i))) {
1948       pdeq_putr(worklist, succ);
1949     }
1950   }
1951 }
1952
1953 static INLINE void place_late(pdeq *worklist) {
1954   assert(worklist);
1955   inc_irg_visited(current_ir_graph);
1956
1957   /* This fills the worklist initially. */
1958   place_floats_late(get_irg_start_block(current_ir_graph), worklist);
1959
1960   /* And now empty the worklist again... */
1961   while (!pdeq_empty(worklist)) {
1962     ir_node *n = pdeq_getl(worklist);
1963     if (irn_not_visited(n))
1964       place_floats_late(n, worklist);
1965   }
1966 }
1967
1968 void place_code(ir_graph *irg) {
1969   pdeq *worklist;
1970   ir_graph *rem = current_ir_graph;
1971
1972   current_ir_graph = irg;
1973
1974   if (!(get_opt_optimize() && get_opt_global_cse())) return;
1975
1976   /* Handle graph state */
1977   assert(get_irg_phase_state(irg) != phase_building);
1978   if (get_irg_dom_state(irg) != dom_consistent)
1979     compute_doms(irg);
1980
1981   if (1 || get_irg_loopinfo_state(irg) != loopinfo_consistent) {
1982     free_loop_information(irg);
1983     construct_backedges(irg);
1984   }
1985
1986   /* Place all floating nodes as early as possible. This guarantees
1987      a legal code placement. */
1988   worklist = new_pdeq();
1989   place_early(worklist);
1990
1991   /* place_early() invalidates the outs, place_late needs them. */
1992   compute_irg_outs(irg);
1993
1994   /* Now move the nodes down in the dominator tree. This reduces the
1995      unnecessary executions of the node. */
1996   place_late(worklist);
1997
1998   set_irg_outs_inconsistent(current_ir_graph);
1999   set_irg_loopinfo_inconsistent(current_ir_graph);
2000   del_pdeq(worklist);
2001   current_ir_graph = rem;
2002 }
2003
2004 /**
2005  * Called by walker of remove_critical_cf_edges().
2006  *
2007  * Place an empty block to an edge between a blocks of multiple
2008  * predecessors and a block of multiple successors.
2009  *
2010  * @param n   IR node
2011  * @param env Environment of walker. The changed field.
2012  */
2013 static void walk_critical_cf_edges(ir_node *n, void *env) {
2014   int arity, i;
2015   ir_node *pre, *block, *jmp;
2016   int *changed = env;
2017
2018   /* Block has multiple predecessors */
2019   if (is_Block(n) && (get_irn_arity(n) > 1)) {
2020     if (n == get_irg_end_block(current_ir_graph))
2021       return;  /*  No use to add a block here.      */
2022
2023     arity = get_irn_arity(n);
2024     for (i=0; i<arity; i++) {
2025       pre = get_irn_n(n, i);
2026       /* Predecessor has multiple successors. Insert new control flow edge. */
2027       if (op_Raise != get_irn_op(skip_Proj(pre))) {
2028         /* set predecessor of new block */
2029         block = new_Block(1, &pre);
2030         /* insert new jmp node to new block */
2031         set_cur_block(block);
2032         jmp = new_Jmp();
2033         set_cur_block(n);
2034         /* set successor of new block */
2035         set_irn_n(n, i, jmp);
2036         *changed = 1;
2037       } /* predecessor has multiple successors */
2038     } /* for all predecessors */
2039   } /* n is a block */
2040 }
2041
2042 void remove_critical_cf_edges(ir_graph *irg) {
2043   int changed = 0;
2044   irg_walk_graph(irg, NULL, walk_critical_cf_edges, &changed);
2045
2046   if (changed) {
2047     /* control flow changed */
2048     set_irg_outs_inconsistent(irg);
2049     set_irg_extblk_inconsistent(irg);
2050     set_irg_doms_inconsistent(current_ir_graph);
2051     set_irg_loopinfo_inconsistent(current_ir_graph);
2052   }
2053
2054 }