nsz Git - libfirm/blob - ir/ir/irgopt.c

   1 /*
   2  * Project:     libFIRM
   3  * File name:   ir/ir/irgopt.c
   4  * Purpose:     Optimizations for a whole ir graph, i.e., a procedure.
   5  * Author:      Christian Schaefer, Goetz Lindenmaier
   6  * Modified by: Sebastian Felis
   7  * Created:
   8  * CVS-ID:      $Id$
   9  * Copyright:   (c) 1998-2003 Universität Karlsruhe
  10  * Licence:     This file protected by GPL -  GNU GENERAL PUBLIC LICENSE.
  11  */
  12
  13
  14 #ifdef HAVE_CONFIG_H
  15 # include <config.h>
  16 #endif
  17
  18 # include <assert.h>
  19 # include <stdbool.h>
  20
  21 # include "irprog.h"
  22 # include "irgopt.h"
  23 # include "irnode_t.h"
  24 # include "irgraph_t.h"
  25 # include "iropt_t.h"
  26 # include "irgwalk.h"
  27 # include "ircons.h"
  28 # include "irgmod.h"
  29 # include "array.h"
  30 # include "pset.h"
  31 # include "eset.h"
  32 # include "pdeq.h"       /* Fuer code placement */
  33 # include "irouts.h"
  34 # include "irloop.h"
  35 # include "irbackedge_t.h"
  36 # include "irflag_t.h"
  37 # include "firmstat.h"
  38
  39 /* Defined in iropt.c */
  40 pset *new_identities (void);
  41 void  del_identities (pset *value_table);
  42 void  add_identities   (pset *value_table, ir_node *node);
  43
  44 /*------------------------------------------------------------------*/
  45 /* apply optimizations of iropt to all nodes.                       */
  46 /*------------------------------------------------------------------*/
  47
  48 static void init_link (ir_node *n, void *env) {
  49   set_irn_link(n, NULL);
  50 }
  51
  52 #if 0   /* Old version. Avoids Ids.
  53        This is not necessary:  we do a postwalk, and get_irn_n
  54        removes ids anyways.  So it's much cheaper to call the
  55        optimization less often and use the exchange() algorithm. */
  56 static void
  57 optimize_in_place_wrapper (ir_node *n, void *env) {
  58   int i, irn_arity;
  59   ir_node *optimized, *old;
  60
  61   irn_arity = intern_get_irn_arity(n);
  62   for (i = 0; i < irn_arity; i++) {
  63     /* get_irn_n skips Id nodes, so comparison old != optimized does not
  64        show all optimizations. Therefore always set new predecessor. */
  65     old = intern_get_irn_intra_n(n, i);
  66     optimized = optimize_in_place_2(old);
  67     set_irn_n(n, i, optimized);
  68   }
  69
  70   if (intern_get_irn_op(n) == op_Block) {
  71     optimized = optimize_in_place_2(n);
  72     if (optimized != n) exchange (n, optimized);
  73   }
  74 }
  75 #else
  76 static void
  77 optimize_in_place_wrapper (ir_node *n, void *env) {
  78   ir_node *optimized = optimize_in_place_2(n);
  79   if (optimized != n) exchange (n, optimized);
  80 }
  81 #endif
  82
  83
  84
  85 void
  86 local_optimize_graph (ir_graph *irg) {
  87   ir_graph *rem = current_ir_graph;
  88   current_ir_graph = irg;
  89
  90   /* Handle graph state */
  91   assert(get_irg_phase_state(irg) != phase_building);
  92   if (get_opt_global_cse())
  93     set_irg_pinned(current_ir_graph, floats);
  94   if (get_irg_outs_state(current_ir_graph) == outs_consistent)
  95     set_irg_outs_inconsistent(current_ir_graph);
  96   if (get_irg_dom_state(current_ir_graph) == dom_consistent)
  97     set_irg_dom_inconsistent(current_ir_graph);
  98
  99   /* Clean the value_table in irg for the cse. */
 100   del_identities(irg->value_table);
 101   irg->value_table = new_identities();
 102
 103   /* walk over the graph */
 104   irg_walk(irg->end, init_link, optimize_in_place_wrapper, NULL);
 105
 106   current_ir_graph = rem;
 107 }
 108
 109 /*------------------------------------------------------------------*/
 110 /* Routines for dead node elimination / copying garbage collection  */
 111 /* of the obstack.                                                  */
 112 /*------------------------------------------------------------------*/
 113
 114 /**
 115  * Remember the new node in the old node by using a field all nodes have.
 116  */
 117 static INLINE void
 118 set_new_node (ir_node *old, ir_node *new)
 119 {
 120   old->link = new;
 121 }
 122
 123 /**
 124  * Get this new node, before the old node is forgotton.
 125  */
 126 static INLINE ir_node *
 127 get_new_node (ir_node * n)
 128 {
 129   return n->link;
 130 }
 131
 132 /**
 133  * We use the block_visited flag to mark that we have computed the
 134  * number of useful predecessors for this block.
 135  * Further we encode the new arity in this flag in the old blocks.
 136  * Remembering the arity is useful, as it saves a lot of pointer
 137  * accesses.  This function is called for all Phi and Block nodes
 138  * in a Block.
 139  */
 140 static INLINE int
 141 compute_new_arity(ir_node *b) {
 142   int i, res, irn_arity;
 143   int irg_v, block_v;
 144
 145   irg_v = get_irg_block_visited(current_ir_graph);
 146   block_v = get_Block_block_visited(b);
 147   if (block_v >= irg_v) {
 148     /* we computed the number of preds for this block and saved it in the
 149        block_v flag */
 150     return block_v - irg_v;
 151   } else {
 152     /* compute the number of good predecessors */
 153     res = irn_arity = intern_get_irn_arity(b);
 154     for (i = 0; i < irn_arity; i++)
 155       if (intern_get_irn_opcode(intern_get_irn_n(b, i)) == iro_Bad) res--;
 156     /* save it in the flag. */
 157     set_Block_block_visited(b, irg_v + res);
 158     return res;
 159   }
 160 }
 161
 162 /* TODO: add an ir_op operation */
 163 static INLINE void new_backedge_info(ir_node *n) {
 164   switch(intern_get_irn_opcode(n)) {
 165   case iro_Block:
 166     n->attr.block.cg_backedge = NULL;
 167     n->attr.block.backedge = new_backedge_arr(current_ir_graph->obst, intern_get_irn_arity(n));
 168     break;
 169   case iro_Phi:
 170     n->attr.phi_backedge = new_backedge_arr(current_ir_graph->obst, intern_get_irn_arity(n));
 171     break;
 172   case iro_Filter:
 173     n->attr.filter.backedge = new_backedge_arr(current_ir_graph->obst, intern_get_irn_arity(n));
 174     break;
 175   default: ;
 176   }
 177 }
 178
 179 /**
 180  * Copies the node to the new obstack. The Ins of the new node point to
 181  * the predecessors on the old obstack.  For block/phi nodes not all
 182  * predecessors might be copied.  n->link points to the new node.
 183  * For Phi and Block nodes the function allocates in-arrays with an arity
 184  * only for useful predecessors.  The arity is determined by counting
 185  * the non-bad predecessors of the block.
 186  */
 187 static void
 188 copy_node (ir_node *n, void *env) {
 189   ir_node *nn, *block;
 190   int new_arity;
 191
 192   /* The end node looses it's flexible in array.  This doesn't matter,
 193      as dead node elimination builds End by hand, inlineing doesn't use
 194      the End node. */
 195   /* assert(n->op == op_End ||  ((_ARR_DESCR(n->in))->cookie != ARR_F_MAGIC)); */
 196
 197   if (intern_get_irn_opcode(n) == iro_Block) {
 198     block = NULL;
 199     new_arity = compute_new_arity(n);
 200     n->attr.block.graph_arr = NULL;
 201   } else {
 202     block = get_nodes_Block(n);
 203     if (intern_get_irn_opcode(n) == iro_Phi) {
 204       new_arity = compute_new_arity(block);
 205     } else {
 206       new_arity = intern_get_irn_arity(n);
 207     }
 208   }
 209   nn = new_ir_node(get_irn_dbg_info(n),
 210            current_ir_graph,
 211            block,
 212            intern_get_irn_op(n),
 213            intern_get_irn_mode(n),
 214            new_arity,
 215            get_irn_in(n));
 216   /* Copy the attributes.  These might point to additional data.  If this
 217      was allocated on the old obstack the pointers now are dangling.  This
 218      frees e.g. the memory of the graph_arr allocated in new_immBlock. */
 219   copy_attrs(n, nn);
 220   new_backedge_info(nn);
 221   set_new_node(n, nn);
 222
 223   /*  printf("\n old node: "); DDMSG2(n);
 224       printf(" new node: "); DDMSG2(nn); */
 225
 226 }
 227
 228 /**
 229  * Copies new predecessors of old node to new node remembered in link.
 230  * Spare the Bad predecessors of Phi and Block nodes.
 231  */
 232 static void
 233 copy_preds (ir_node *n, void *env) {
 234   ir_node *nn, *block;
 235   int i, j, irn_arity;
 236
 237   nn = get_new_node(n);
 238
 239   /* printf("\n old node: "); DDMSG2(n);
 240      printf(" new node: "); DDMSG2(nn);
 241      printf(" arities: old: %d, new: %d\n", intern_get_irn_arity(n), intern_get_irn_arity(nn)); */
 242
 243   if (intern_get_irn_opcode(n) == iro_Block) {
 244     /* Don't copy Bad nodes. */
 245     j = 0;
 246     irn_arity = intern_get_irn_arity(n);
 247     for (i = 0; i < irn_arity; i++)
 248       if (intern_get_irn_opcode(intern_get_irn_n(n, i)) != iro_Bad) {
 249     set_irn_n (nn, j, get_new_node(intern_get_irn_n(n, i)));
 250     /*if (is_backedge(n, i)) set_backedge(nn, j);*/
 251     j++;
 252       }
 253     /* repair the block visited flag from above misuse. Repair it in both
 254        graphs so that the old one can still be used. */
 255     set_Block_block_visited(nn, 0);
 256     set_Block_block_visited(n, 0);
 257     /* Local optimization could not merge two subsequent blocks if
 258        in array contained Bads.  Now it's possible.
 259        We don't call optimize_in_place as it requires
 260        that the fields in ir_graph are set properly. */
 261     if ((get_opt_control_flow_straightening()) &&
 262     (get_Block_n_cfgpreds(nn) == 1) &&
 263     (intern_get_irn_op(get_Block_cfgpred(nn, 0)) == op_Jmp))
 264       exchange(nn, get_nodes_Block(get_Block_cfgpred(nn, 0)));
 265   } else if (intern_get_irn_opcode(n) == iro_Phi) {
 266     /* Don't copy node if corresponding predecessor in block is Bad.
 267        The Block itself should not be Bad. */
 268     block = get_nodes_Block(n);
 269     set_irn_n (nn, -1, get_new_node(block));
 270     j = 0;
 271     irn_arity = intern_get_irn_arity(n);
 272     for (i = 0; i < irn_arity; i++)
 273       if (intern_get_irn_opcode(intern_get_irn_n(block, i)) != iro_Bad) {
 274     set_irn_n (nn, j, get_new_node(intern_get_irn_n(n, i)));
 275     /*if (is_backedge(n, i)) set_backedge(nn, j);*/
 276     j++;
 277       }
 278     /* If the pre walker reached this Phi after the post walker visited the
 279        block block_visited is > 0. */
 280     set_Block_block_visited(get_nodes_Block(n), 0);
 281     /* Compacting the Phi's ins might generate Phis with only one
 282        predecessor. */
 283     if (intern_get_irn_arity(n) == 1)
 284       exchange(n, intern_get_irn_n(n, 0));
 285   } else {
 286     irn_arity = intern_get_irn_arity(n);
 287     for (i = -1; i < irn_arity; i++)
 288       set_irn_n (nn, i, get_new_node(intern_get_irn_n(n, i)));
 289   }
 290   /* Now the new node is complete.  We can add it to the hash table for cse.
 291      @@@ inlinening aborts if we identify End. Why? */
 292   if(intern_get_irn_op(nn) != op_End)
 293     add_identities (current_ir_graph->value_table, nn);
 294 }
 295
 296 /**
 297  * Copies the graph recursively, compacts the keepalive of the end node.
 298  */
 299 static void
 300 copy_graph (void) {
 301   ir_node *oe, *ne; /* old end, new end */
 302   ir_node *ka;      /* keep alive */
 303   int i, irn_arity;
 304
 305   oe = get_irg_end(current_ir_graph);
 306   /* copy the end node by hand, allocate dynamic in array! */
 307   ne = new_ir_node(get_irn_dbg_info(oe),
 308            current_ir_graph,
 309            NULL,
 310            op_End,
 311            mode_X,
 312            -1,
 313            NULL);
 314   /* Copy the attributes.  Well, there might be some in the future... */
 315   copy_attrs(oe, ne);
 316   set_new_node(oe, ne);
 317
 318   /* copy the live nodes */
 319   irg_walk(get_nodes_Block(oe), copy_node, copy_preds, NULL);
 320   /* copy_preds for the end node ... */
 321   set_nodes_Block(ne, get_new_node(get_nodes_Block(oe)));
 322
 323   /*- ... and now the keep alives. -*/
 324   /* First pick the not marked block nodes and walk them.  We must pick these
 325      first as else we will oversee blocks reachable from Phis. */
 326   irn_arity = intern_get_irn_arity(oe);
 327   for (i = 0; i < irn_arity; i++) {
 328     ka = intern_get_irn_intra_n(oe, i);
 329     if ((intern_get_irn_op(ka) == op_Block) &&
 330     (get_irn_visited(ka) < get_irg_visited(current_ir_graph))) {
 331       /* We must keep the block alive and copy everything reachable */
 332       set_irg_visited(current_ir_graph, get_irg_visited(current_ir_graph)-1);
 333       irg_walk(ka, copy_node, copy_preds, NULL);
 334       add_End_keepalive(ne, get_new_node(ka));
 335     }
 336   }
 337
 338   /* Now pick the Phis.  Here we will keep all! */
 339   irn_arity = intern_get_irn_arity(oe);
 340   for (i = 0; i < irn_arity; i++) {
 341     ka = intern_get_irn_intra_n(oe, i);
 342     if ((intern_get_irn_op(ka) == op_Phi)) {
 343       if (get_irn_visited(ka) < get_irg_visited(current_ir_graph)) {
 344     /* We didn't copy the Phi yet.  */
 345     set_irg_visited(current_ir_graph, get_irg_visited(current_ir_graph)-1);
 346     irg_walk(ka, copy_node, copy_preds, NULL);
 347       }
 348       add_End_keepalive(ne, get_new_node(ka));
 349     }
 350   }
 351 }
 352
 353 /**
 354  * Copies the graph reachable from current_ir_graph->end to the obstack
 355  * in current_ir_graph and fixes the environment.
 356  * Then fixes the fields in current_ir_graph containing nodes of the
 357  * graph.
 358  */
 359 static void
 360 copy_graph_env (void) {
 361   ir_node *old_end;
 362   /* Not all nodes remembered in current_ir_graph might be reachable
 363      from the end node.  Assure their link is set to NULL, so that
 364      we can test whether new nodes have been computed. */
 365   set_irn_link(get_irg_frame  (current_ir_graph), NULL);
 366   set_irn_link(get_irg_globals(current_ir_graph), NULL);
 367   set_irn_link(get_irg_args   (current_ir_graph), NULL);
 368
 369   /* we use the block walk flag for removing Bads from Blocks ins. */
 370   inc_irg_block_visited(current_ir_graph);
 371
 372   /* copy the graph */
 373   copy_graph();
 374
 375   /* fix the fields in current_ir_graph */
 376   old_end = get_irg_end(current_ir_graph);
 377   set_irg_end (current_ir_graph, get_new_node(old_end));
 378   set_irg_end_except (current_ir_graph, get_irg_end(current_ir_graph));
 379   set_irg_end_reg    (current_ir_graph, get_irg_end(current_ir_graph));
 380   free_End(old_end);
 381   set_irg_end_block  (current_ir_graph, get_new_node(get_irg_end_block(current_ir_graph)));
 382   if (get_irn_link(get_irg_frame(current_ir_graph)) == NULL) {
 383     copy_node (get_irg_frame(current_ir_graph), NULL);
 384     copy_preds(get_irg_frame(current_ir_graph), NULL);
 385   }
 386   if (get_irn_link(get_irg_globals(current_ir_graph)) == NULL) {
 387     copy_node (get_irg_globals(current_ir_graph), NULL);
 388     copy_preds(get_irg_globals(current_ir_graph), NULL);
 389   }
 390   if (get_irn_link(get_irg_args(current_ir_graph)) == NULL) {
 391     copy_node (get_irg_args(current_ir_graph), NULL);
 392     copy_preds(get_irg_args(current_ir_graph), NULL);
 393   }
 394   set_irg_start  (current_ir_graph, get_new_node(get_irg_start(current_ir_graph)));
 395
 396   set_irg_start_block(current_ir_graph,
 397               get_new_node(get_irg_start_block(current_ir_graph)));
 398   set_irg_frame  (current_ir_graph, get_new_node(get_irg_frame(current_ir_graph)));
 399   set_irg_globals(current_ir_graph, get_new_node(get_irg_globals(current_ir_graph)));
 400   set_irg_args   (current_ir_graph, get_new_node(get_irg_args(current_ir_graph)));
 401   if (get_irn_link(get_irg_bad(current_ir_graph)) == NULL) {
 402     copy_node(get_irg_bad(current_ir_graph), NULL);
 403     copy_preds(get_irg_bad(current_ir_graph), NULL);
 404   }
 405   set_irg_bad(current_ir_graph, get_new_node(get_irg_bad(current_ir_graph)));
 406   /* GL removed: we need unknown with mode for analyses.
 407   if (get_irn_link(get_irg_unknown(current_ir_graph)) == NULL) {
 408     copy_node(get_irg_unknown(current_ir_graph), NULL);
 409     copy_preds(get_irg_unknown(current_ir_graph), NULL);
 410   }
 411   set_irg_unknown(current_ir_graph, get_new_node(get_irg_unknown(current_ir_graph)));
 412   */
 413 }
 414
 415 /**
 416  * Copies all reachable nodes to a new obstack.  Removes bad inputs
 417  * from block nodes and the corresponding inputs from Phi nodes.
 418  * Merges single exit blocks with single entry blocks and removes
 419  * 1-input Phis.
 420  * Adds all new nodes to a new hash table for cse.  Does not
 421  * perform cse, so the hash table might contain common subexpressions.
 422  */
 423 /* Amroq call this emigrate() */
 424 void
 425 dead_node_elimination(ir_graph *irg) {
 426   ir_graph *rem;
 427   int rem_ipview = interprocedural_view;
 428   struct obstack *graveyard_obst = NULL;
 429   struct obstack *rebirth_obst   = NULL;
 430
 431   stat_dead_node_elim_start(irg);
 432
 433   /* Remember external state of current_ir_graph. */
 434   rem = current_ir_graph;
 435   current_ir_graph = irg;
 436   interprocedural_view = 0;
 437
 438   /* Handle graph state */
 439   assert(get_irg_phase_state(current_ir_graph) != phase_building);
 440   assert(get_irg_callee_info_state(current_ir_graph) == irg_callee_info_none);
 441   free_outs(current_ir_graph);
 442
 443   /* @@@ so far we loose loops when copying */
 444   free_loop_information(current_ir_graph);
 445
 446   if (get_opt_optimize() && get_opt_dead_node_elimination()) {
 447
 448     /* A quiet place, where the old obstack can rest in peace,
 449        until it will be cremated. */
 450     graveyard_obst = irg->obst;
 451
 452     /* A new obstack, where the reachable nodes will be copied to. */
 453     rebirth_obst = (struct obstack *) xmalloc (sizeof (struct obstack));
 454     current_ir_graph->obst = rebirth_obst;
 455     obstack_init (current_ir_graph->obst);
 456
 457     /* We also need a new hash table for cse */
 458     del_identities (irg->value_table);
 459     irg->value_table = new_identities ();
 460
 461     /* Copy the graph from the old to the new obstack */
 462     copy_graph_env();
 463
 464     /* Free memory from old unoptimized obstack */
 465     obstack_free(graveyard_obst, 0);  /* First empty the obstack ... */
 466     xfree (graveyard_obst);           /* ... then free it.           */
 467   }
 468
 469   stat_dead_node_elim_stop(irg);
 470
 471   current_ir_graph = rem;
 472   interprocedural_view = rem_ipview;
 473 }
 474
 475 /**
 476  * Relink bad predeseccors of a block and store the old in array to the
 477  * link field. This function is called by relink_bad_predecessors().
 478  * The array of link field starts with the block operand at position 0.
 479  * If block has bad predecessors, create a new in array without bad preds.
 480  * Otherwise let in array untouched.
 481  */
 482 static void relink_bad_block_predecessors(ir_node *n, void *env) {
 483   ir_node **new_in, *irn;
 484   int i, new_irn_n, old_irn_arity, new_irn_arity = 0;
 485
 486   /* if link field of block is NULL, look for bad predecessors otherwise
 487      this is allready done */
 488   if (intern_get_irn_op(n) == op_Block &&
 489       get_irn_link(n) == NULL) {
 490
 491     /* save old predecessors in link field (position 0 is the block operand)*/
 492     set_irn_link(n, (void *)get_irn_in(n));
 493
 494     /* count predecessors without bad nodes */
 495     old_irn_arity = intern_get_irn_arity(n);
 496     for (i = 0; i < old_irn_arity; i++)
 497       if (!is_Bad(intern_get_irn_n(n, i))) new_irn_arity++;
 498
 499     /* arity changing: set new predecessors without bad nodes */
 500     if (new_irn_arity < old_irn_arity) {
 501       /* get new predecessor array without Block predecessor */
 502       new_in = NEW_ARR_D (ir_node *, current_ir_graph->obst, (new_irn_arity+1));
 503
 504       /* set new predeseccors in array */
 505       new_in[0] = NULL;
 506       new_irn_n = 1;
 507       for (i = 1; i < old_irn_arity; i++) {
 508     irn = intern_get_irn_n(n, i);
 509     if (!is_Bad(irn)) new_in[new_irn_n++] = irn;
 510       }
 511       n->in = new_in;
 512     } /* ir node has bad predecessors */
 513
 514   } /* Block is not relinked */
 515 }
 516
 517 /**
 518  * Relinks Bad predecesors from Bocks and Phis called by walker
 519  * remove_bad_predecesors(). If n is a Block, call
 520  * relink_bad_block_redecessors(). If n is a Phinode, call also the relinking
 521  * function of Phi's Block. If this block has bad predecessors, relink preds
 522  * of the Phinode.
 523  */
 524 static void relink_bad_predecessors(ir_node *n, void *env) {
 525   ir_node *block, **old_in;
 526   int i, old_irn_arity, new_irn_arity;
 527
 528   /* relink bad predeseccors of a block */
 529   if (intern_get_irn_op(n) == op_Block)
 530     relink_bad_block_predecessors(n, env);
 531
 532   /* If Phi node relink its block and its predecessors */
 533   if (intern_get_irn_op(n) == op_Phi) {
 534
 535     /* Relink predeseccors of phi's block */
 536     block = get_nodes_Block(n);
 537     if (get_irn_link(block) == NULL)
 538       relink_bad_block_predecessors(block, env);
 539
 540     old_in = (ir_node **)get_irn_link(block); /* Of Phi's Block */
 541     old_irn_arity = ARR_LEN(old_in);
 542
 543     /* Relink Phi predeseccors if count of predeseccors changed */
 544     if (old_irn_arity != ARR_LEN(get_irn_in(block))) {
 545       /* set new predeseccors in array
 546      n->in[0] remains the same block */
 547       new_irn_arity = 1;
 548       for(i = 1; i < old_irn_arity; i++)
 549     if (!is_Bad((ir_node *)old_in[i])) n->in[new_irn_arity++] = n->in[i];
 550
 551       ARR_SETLEN(ir_node *, n->in, new_irn_arity);
 552     }
 553
 554   } /* n is a Phi node */
 555 }
 556
 557 /**
 558  * Removes Bad Bad predecesors from Blocks and the corresponding
 559  * inputs to Phi nodes as in dead_node_elimination but without
 560  * copying the graph.
 561  * On walking up set the link field to NULL, on walking down call
 562  * relink_bad_predecessors() (This function stores the old in array
 563  * to the link field and sets a new in array if arity of predecessors
 564  * changes).
 565  */
 566 void remove_bad_predecessors(ir_graph *irg) {
 567   irg_walk_graph(irg, init_link, relink_bad_predecessors, NULL);
 568 }
 569
 570
 571 /*--------------------------------------------------------------------*/
 572 /*  Funcionality for inlining                                         */
 573 /*--------------------------------------------------------------------*/
 574
 575 /**
 576  * Copy node for inlineing.  Updates attributes that change when
 577  * inlineing but not for dead node elimination.
 578  *
 579  * Copies the node by calling copy_node and then updates the entity if
 580  * it's a local one.  env must be a pointer of the frame type of the
 581  * inlined procedure. The new entities must be in the link field of
 582  * the entities.
 583  */
 584 static INLINE void
 585 copy_node_inline (ir_node *n, void *env) {
 586   ir_node *new;
 587   type *frame_tp = (type *)env;
 588
 589   copy_node(n, NULL);
 590   if (intern_get_irn_op(n) == op_Sel) {
 591     new = get_new_node (n);
 592     assert(intern_get_irn_op(new) == op_Sel);
 593     if (get_entity_owner(get_Sel_entity(n)) == frame_tp) {
 594       set_Sel_entity(new, get_entity_link(get_Sel_entity(n)));
 595     }
 596   } else if (intern_get_irn_op(n) == op_Block) {
 597     new = get_new_node (n);
 598     new->attr.block.irg = current_ir_graph;
 599   }
 600 }
 601
 602 static void find_addr(ir_node *node, void *env)
 603 {
 604   if (get_irn_opcode(node) == iro_Proj) {
 605     if (get_Proj_proj(node) == pn_Start_P_value_arg_base)
 606       *(int *)env = 0;
 607   }
 608 }
 609
 610 /*
 611  * currently, we cannot inline two cases:
 612  * - call with compound arguments
 613  * - graphs that take the address of a parameter
 614  *
 615  * check these condition here
 616  */
 617 static int can_inline(ir_node *call, ir_graph *called_graph)
 618 {
 619   type *call_type = get_Call_type(call);
 620   int params, ress, i, res;
 621
 622   assert(is_method_type(call_type));
 623
 624   params = get_method_n_params(call_type);
 625   ress   = get_method_n_ress(call_type);
 626
 627   /* check params */
 628   for (i = 0; i < params; ++i) {
 629     type *p_type = get_method_param_type(call_type, i);
 630
 631     if (is_compound_type(p_type))
 632       return 0;
 633   }
 634
 635   /* check res */
 636   for (i = 0; i < ress; ++i) {
 637     type *r_type = get_method_res_type(call_type, i);
 638
 639     if (is_compound_type(r_type))
 640       return 0;
 641   }
 642
 643   res = 1;
 644   irg_walk_graph(called_graph, find_addr, NULL, &res);
 645
 646   return res;
 647 }
 648
 649 void inline_method(ir_node *call, ir_graph *called_graph) {
 650   ir_node *pre_call;
 651   ir_node *post_call, *post_bl;
 652   ir_node *in[5];
 653   ir_node *end, *end_bl;
 654   ir_node **res_pred;
 655   ir_node **cf_pred;
 656   ir_node *ret, *phi;
 657   int arity, n_ret, n_exc, n_res, i, j, rem_opt, irn_arity;
 658   int exc_handling;
 659   type *called_frame;
 660   irg_inline_property prop = get_irg_inline_property(called_graph);
 661
 662   if ( (prop != irg_inline_forced) && (!get_opt_optimize() || !get_opt_inline() ||
 663       (prop == irg_inline_forbidden))) return;
 664
 665
 666   /*
 667    * currently, we cannot inline two cases:
 668    * - call with compound arguments
 669    * - graphs that take the address of a parameter
 670    */
 671   if (! can_inline(call, called_graph))
 672     return;
 673
 674   /* --  Turn off optimizations, this can cause problems when allocating new nodes. -- */
 675   rem_opt = get_opt_optimize();
 676   set_optimize(0);
 677
 678   /* Handle graph state */
 679   assert(get_irg_phase_state(current_ir_graph) != phase_building);
 680   assert(get_irg_pinned(current_ir_graph) == pinned);
 681   assert(get_irg_pinned(called_graph) == pinned);
 682   if (get_irg_outs_state(current_ir_graph) == outs_consistent)
 683     set_irg_outs_inconsistent(current_ir_graph);
 684
 685   /* -- Check preconditions -- */
 686   assert(get_irn_op(call) == op_Call);
 687   /* @@@ does not work for InterfaceIII.java after cgana
 688      assert(get_Call_type(call) == get_entity_type(get_irg_ent(called_graph)));
 689      assert(smaller_type(get_entity_type(get_irg_ent(called_graph)),
 690      get_Call_type(call)));
 691   */
 692   assert(get_type_tpop(get_Call_type(call)) == type_method);
 693   if (called_graph == current_ir_graph) {
 694     set_optimize(rem_opt);
 695     return;
 696   }
 697
 698   /* here we know we WILL inline, so inform the statistics */
 699   stat_inline(call, called_graph);
 700
 701   /* -- Decide how to handle exception control flow: Is there a handler
 702      for the Call node, or do we branch directly to End on an exception?
 703      exc_handling: 0 There is a handler.
 704                    1 Branches to End.
 705            2 Exception handling not represented in Firm. -- */
 706   {
 707     ir_node *proj, *Mproj = NULL, *Xproj = NULL;
 708     for (proj = (ir_node *)get_irn_link(call); proj; proj = (ir_node *)get_irn_link(proj)) {
 709       assert(get_irn_op(proj) == op_Proj);
 710       if (get_Proj_proj(proj) == pn_Call_X_except) Xproj = proj;
 711       if (get_Proj_proj(proj) == pn_Call_M_except) Mproj = proj;
 712     }
 713     if      (Mproj) { assert(Xproj); exc_handling = 0; } /*  Mproj           */
 714     else if (Xproj) {                exc_handling = 1; } /* !Mproj &&  Xproj   */
 715     else            {                exc_handling = 2; } /* !Mproj && !Xproj   */
 716   }
 717
 718
 719   /* --
 720       the procedure and later replaces the Start node of the called graph.
 721       Post_call is the old Call node and collects the results of the called
 722       graph. Both will end up being a tuple.  -- */
 723   post_bl = get_nodes_Block(call);
 724   set_irg_current_block(current_ir_graph, post_bl);
 725   /* XxMxPxP of Start + parameter of Call */
 726   in[pn_Start_X_initial_exec] = new_Jmp();
 727   in[pn_Start_M]              = get_Call_mem(call);
 728   in[pn_Start_P_frame_base]   = get_irg_frame(current_ir_graph);
 729   in[pn_Start_P_globals]      = get_irg_globals(current_ir_graph);
 730   in[pn_Start_T_args]         = new_Tuple(get_Call_n_params(call), get_Call_param_arr(call));
 731   /* in[pn_Start_P_value_arg_base] = ??? */
 732   pre_call = new_Tuple(5, in);
 733   post_call = call;
 734
 735   /* --
 736       The new block gets the ins of the old block, pre_call and all its
 737       predecessors and all Phi nodes. -- */
 738   part_block(pre_call);
 739
 740   /* -- Prepare state for dead node elimination -- */
 741   /* Visited flags in calling irg must be >= flag in called irg.
 742      Else walker and arity computation will not work. */
 743   if (get_irg_visited(current_ir_graph) <= get_irg_visited(called_graph))
 744     set_irg_visited(current_ir_graph, get_irg_visited(called_graph)+1);
 745   if (get_irg_block_visited(current_ir_graph)< get_irg_block_visited(called_graph))
 746     set_irg_block_visited(current_ir_graph, get_irg_block_visited(called_graph));
 747   /* Set pre_call as new Start node in link field of the start node of
 748      calling graph and pre_calls block as new block for the start block
 749      of calling graph.
 750      Further mark these nodes so that they are not visited by the
 751      copying. */
 752   set_irn_link(get_irg_start(called_graph), pre_call);
 753   set_irn_visited(get_irg_start(called_graph),
 754           get_irg_visited(current_ir_graph));
 755   set_irn_link(get_irg_start_block(called_graph),
 756            get_nodes_Block(pre_call));
 757   set_irn_visited(get_irg_start_block(called_graph),
 758           get_irg_visited(current_ir_graph));
 759
 760   /* Initialize for compaction of in arrays */
 761   inc_irg_block_visited(current_ir_graph);
 762
 763   /* -- Replicate local entities of the called_graph -- */
 764   /* copy the entities. */
 765   called_frame = get_irg_frame_type(called_graph);
 766   for (i = 0; i < get_class_n_members(called_frame); i++) {
 767     entity *new_ent, *old_ent;
 768     old_ent = get_class_member(called_frame, i);
 769     new_ent = copy_entity_own(old_ent, get_cur_frame_type());
 770     set_entity_link(old_ent, new_ent);
 771   }
 772
 773   /* visited is > than that of called graph.  With this trick visited will
 774      remain unchanged so that an outer walker, e.g., searching the call nodes
 775      to inline, calling this inline will not visit the inlined nodes. */
 776   set_irg_visited(current_ir_graph, get_irg_visited(current_ir_graph)-1);
 777
 778   /* -- Performing dead node elimination inlines the graph -- */
 779   /* Copies the nodes to the obstack of current_ir_graph. Updates links to new
 780      entities. */
 781   /* @@@ endless loops are not copied!! -- they should be, I think... */
 782   irg_walk(get_irg_end(called_graph), copy_node_inline, copy_preds,
 783        get_irg_frame_type(called_graph));
 784
 785   /* Repair called_graph */
 786   set_irg_visited(called_graph, get_irg_visited(current_ir_graph));
 787   set_irg_block_visited(called_graph, get_irg_block_visited(current_ir_graph));
 788   set_Block_block_visited(get_irg_start_block(called_graph), 0);
 789
 790   /* -- Merge the end of the inlined procedure with the call site -- */
 791   /* We will turn the old Call node into a Tuple with the following
 792      predecessors:
 793        -1:  Block of Tuple.
 794        0: Phi of all Memories of Return statements.
 795        1: Jmp from new Block that merges the control flow from all exception
 796       predecessors of the old end block.
 797        2: Tuple of all arguments.
 798        3: Phi of Exception memories.
 799      In case the old Call directly branches to End on an exception we don't
 800      need the block merging all exceptions nor the Phi of the exception
 801      memories.
 802   */
 803
 804   /* -- Precompute some values -- */
 805   end_bl = get_new_node(get_irg_end_block(called_graph));
 806   end = get_new_node(get_irg_end(called_graph));
 807   arity = intern_get_irn_arity(end_bl);    /* arity = n_exc + n_ret  */
 808   n_res = get_method_n_ress(get_Call_type(call));
 809
 810   res_pred = (ir_node **) malloc (n_res * sizeof (ir_node *));
 811   cf_pred =  (ir_node **) malloc (arity * sizeof (ir_node *));
 812
 813   set_irg_current_block(current_ir_graph, post_bl); /* just to make sure */
 814
 815   /* -- archive keepalives -- */
 816   irn_arity = intern_get_irn_arity(end);
 817   for (i = 0; i < irn_arity; i++)
 818     add_End_keepalive(get_irg_end(current_ir_graph), intern_get_irn_n(end, i));
 819
 820   /* The new end node will die.  We need not free as the in array is on the obstack:
 821      copy_node only generated 'D' arrays. */
 822
 823   /* -- Replace Return nodes by Jump nodes. -- */
 824   n_ret = 0;
 825   for (i = 0; i < arity; i++) {
 826     ir_node *ret;
 827     ret = intern_get_irn_n(end_bl, i);
 828     if (intern_get_irn_op(ret) == op_Return) {
 829       cf_pred[n_ret] = new_r_Jmp(current_ir_graph, get_nodes_Block(ret));
 830       n_ret++;
 831     }
 832   }
 833   set_irn_in(post_bl, n_ret, cf_pred);
 834
 835   /* -- Build a Tuple for all results of the method.
 836      Add Phi node if there was more than one Return.  -- */
 837   turn_into_tuple(post_call, 4);
 838   /* First the Memory-Phi */
 839   n_ret = 0;
 840   for (i = 0; i < arity; i++) {
 841     ret = intern_get_irn_n(end_bl, i);
 842     if (intern_get_irn_op(ret) == op_Return) {
 843       cf_pred[n_ret] = get_Return_mem(ret);
 844       n_ret++;
 845     }
 846   }
 847   phi = new_Phi(n_ret, cf_pred, mode_M);
 848   set_Tuple_pred(call, pn_Call_M_regular, phi);
 849   /* Conserve Phi-list for further inlinings -- but might be optimized */
 850   if (get_nodes_Block(phi) == post_bl) {
 851     set_irn_link(phi, get_irn_link(post_bl));
 852     set_irn_link(post_bl, phi);
 853   }
 854   /* Now the real results */
 855   if (n_res > 0) {
 856     for (j = 0; j < n_res; j++) {
 857       n_ret = 0;
 858       for (i = 0; i < arity; i++) {
 859         ret = intern_get_irn_n(end_bl, i);
 860         if (intern_get_irn_op(ret) == op_Return) {
 861           cf_pred[n_ret] = get_Return_res(ret, j);
 862           n_ret++;
 863         }
 864       }
 865       phi = new_Phi(n_ret, cf_pred, intern_get_irn_mode(cf_pred[0]));
 866       res_pred[j] = phi;
 867       /* Conserve Phi-list for further inlinings -- but might be optimized */
 868       if (get_nodes_Block(phi) == post_bl) {
 869         set_irn_link(phi, get_irn_link(post_bl));
 870         set_irn_link(post_bl, phi);
 871       }
 872     }
 873     set_Tuple_pred(call, pn_Call_T_result, new_Tuple(n_res, res_pred));
 874   } else {
 875     set_Tuple_pred(call, pn_Call_T_result, new_Bad());
 876   }
 877   /* Finally the exception control flow.
 878      We have two (three) possible situations:
 879      First if the Call branches to an exception handler: We need to add a Phi node to
 880      collect the memory containing the exception objects.  Further we need
 881      to add another block to get a correct representation of this Phi.  To
 882      this block we add a Jmp that resolves into the X output of the Call
 883      when the Call is turned into a tuple.
 884      Second the Call branches to End, the exception is not handled.  Just
 885      add all inlined exception branches to the End node.
 886      Third: there is no Exception edge at all. Handle as case two. */
 887   if (exc_handling == 0) {
 888     n_exc = 0;
 889     for (i = 0; i < arity; i++) {
 890       ir_node *ret;
 891       ret = intern_get_irn_n(end_bl, i);
 892       if (is_fragile_op(skip_Proj(ret)) || (intern_get_irn_op(skip_Proj(ret)) == op_Raise)) {
 893     cf_pred[n_exc] = ret;
 894     n_exc++;
 895       }
 896     }
 897     if (n_exc > 0) {
 898       new_Block(n_exc, cf_pred);      /* watch it: current_block is changed! */
 899       set_Tuple_pred(call, pn_Call_X_except, new_Jmp());
 900       /* The Phi for the memories with the exception objects */
 901       n_exc = 0;
 902       for (i = 0; i < arity; i++) {
 903     ir_node *ret;
 904     ret = skip_Proj(intern_get_irn_n(end_bl, i));
 905     if (intern_get_irn_op(ret) == op_Call) {
 906       cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_Block(ret), ret, mode_M, 3);
 907       n_exc++;
 908     } else if (is_fragile_op(ret)) {
 909     /* We rely that all cfops have the memory output at the same position. */
 910       cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_Block(ret), ret, mode_M, 0);
 911       n_exc++;
 912     } else if (intern_get_irn_op(ret) == op_Raise) {
 913       cf_pred[n_exc] = new_r_Proj(current_ir_graph, get_nodes_Block(ret), ret, mode_M, 1);
 914       n_exc++;
 915     }
 916       }
 917       set_Tuple_pred(call, pn_Call_M_except, new_Phi(n_exc, cf_pred, mode_M));
 918     } else {
 919       set_Tuple_pred(call, pn_Call_X_except, new_Bad());
 920       set_Tuple_pred(call, pn_Call_M_except, new_Bad());
 921     }
 922   } else {
 923     ir_node *main_end_bl;
 924     int main_end_bl_arity;
 925     ir_node **end_preds;
 926
 927     /* assert(exc_handling == 1 || no exceptions. ) */
 928     n_exc = 0;
 929     for (i = 0; i < arity; i++) {
 930       ir_node *ret = intern_get_irn_n(end_bl, i);
 931
 932       if (is_fragile_op(skip_Proj(ret)) || (intern_get_irn_op(skip_Proj(ret)) == op_Raise)) {
 933         cf_pred[n_exc] = ret;
 934         n_exc++;
 935       }
 936     }
 937     main_end_bl = get_irg_end_block(current_ir_graph);
 938     main_end_bl_arity = intern_get_irn_arity(main_end_bl);
 939     end_preds =  (ir_node **) malloc ((n_exc + main_end_bl_arity) * sizeof (ir_node *));
 940
 941     for (i = 0; i < main_end_bl_arity; ++i)
 942       end_preds[i] = intern_get_irn_n(main_end_bl, i);
 943     for (i = 0; i < n_exc; ++i)
 944       end_preds[main_end_bl_arity + i] = cf_pred[i];
 945     set_irn_in(main_end_bl, n_exc + main_end_bl_arity, end_preds);
 946     set_Tuple_pred(call, pn_Call_X_except, new_Bad());
 947     set_Tuple_pred(call, pn_Call_M_except, new_Bad());
 948     free(end_preds);
 949   }
 950   free(res_pred);
 951   free(cf_pred);
 952
 953 #if 0  /* old. now better, correcter, faster implementation. */
 954   if (n_exc > 0) {
 955     /* -- If the exception control flow from the inlined Call directly
 956        branched to the end block we now have the following control
 957        flow predecessor pattern: ProjX -> Tuple -> Jmp.  We must
 958        remove the Jmp along with it's empty block and add Jmp's
 959        predecessors as predecessors of this end block.  No problem if
 960        there is no exception, because then branches Bad to End which
 961        is fine. --
 962        @@@ can't we know this beforehand: by getting the Proj(1) from
 963        the Call link list and checking whether it goes to Proj. */
 964     /* find the problematic predecessor of the end block. */
 965     end_bl = get_irg_end_block(current_ir_graph);
 966     for (i = 0; i < get_Block_n_cfgpreds(end_bl); i++) {
 967       cf_op = get_Block_cfgpred(end_bl, i);
 968       if (intern_get_irn_op(cf_op) == op_Proj) {
 969     cf_op = get_Proj_pred(cf_op);
 970     if ((intern_get_irn_op(cf_op) == op_Tuple) && (cf_op == call)) {
 971       /*  There are unoptimized tuples from inlineing before when no exc */
 972       assert(get_Proj_proj(get_Block_cfgpred(end_bl, i)) == pn_Call_X_except);
 973       cf_op = get_Tuple_pred(cf_op, pn_Call_X_except);
 974       assert(intern_get_irn_op(cf_op) == op_Jmp);
 975       break;
 976     }
 977       }
 978     }
 979     /* repair */
 980     if (i < get_Block_n_cfgpreds(end_bl)) {
 981       bl = get_nodes_Block(cf_op);
 982       arity = get_Block_n_cfgpreds(end_bl) + get_Block_n_cfgpreds(bl) - 1;
 983       cf_pred = (ir_node **) malloc (arity * sizeof (ir_node *));
 984       for (j = 0; j < i; j++)
 985     cf_pred[j] = get_Block_cfgpred(end_bl, j);
 986       for (j = j; j < i + get_Block_n_cfgpreds(bl); j++)
 987     cf_pred[j] = get_Block_cfgpred(bl, j-i);
 988       for (j = j; j < arity; j++)
 989     cf_pred[j] = get_Block_cfgpred(end_bl, j-get_Block_n_cfgpreds(bl) +1);
 990       set_irn_in(end_bl, arity, cf_pred);
 991       free(cf_pred);
 992       /*  Remove the exception pred from post-call Tuple. */
 993       set_Tuple_pred(call, pn_Call_X_except, new_Bad());
 994     }
 995   }
 996 #endif
 997
 998   /* --  Turn cse back on. -- */
 999   set_optimize(rem_opt);
1000 }
1001
1002 /********************************************************************/
1003 /* Apply inlineing to small methods.                                */
1004 /********************************************************************/
1005
1006 /* It makes no sense to inline too many calls in one procedure. Anyways,
1007    I didn't get a version with NEW_ARR_F to run. */
1008 #define MAX_INLINE 1024
1009
1010 /**
1011  * environment for inlining small irgs
1012  */
1013 typedef struct _inline_env_t {
1014   int pos;
1015   ir_node *calls[MAX_INLINE];
1016 } inline_env_t;
1017
1018 /**
1019  * Returns the irg called from a Call node. If the irg is not
1020  * known, NULL is returned.
1021  */
1022 static ir_graph *get_call_called_irg(ir_node *call) {
1023   ir_node *addr;
1024   tarval *tv;
1025   ir_graph *called_irg = NULL;
1026
1027   assert(get_irn_op(call) == op_Call);
1028
1029   addr = get_Call_ptr(call);
1030   if (intern_get_irn_op(addr) == op_Const) {
1031     /* Check whether the constant is the pointer to a compiled entity. */
1032     tv = get_Const_tarval(addr);
1033     if (tarval_to_entity(tv))
1034       called_irg = get_entity_irg(tarval_to_entity(tv));
1035   }
1036   return called_irg;
1037 }
1038
1039 static void collect_calls(ir_node *call, void *env) {
1040   inline_env_t *ienv = env;
1041   ir_node *addr;
1042   tarval *tv;
1043   ir_graph *called_irg;
1044
1045   if (intern_get_irn_op(call) != op_Call) return;
1046
1047   addr = get_Call_ptr(call);
1048   if (intern_get_irn_op(addr) == op_Const) {
1049     /* Check whether the constant is the pointer to a compiled entity. */
1050     tv = get_Const_tarval(addr);
1051     if (tarval_to_entity(tv)) {
1052       called_irg = get_entity_irg(tarval_to_entity(tv));
1053       if (called_irg && ienv->pos < MAX_INLINE) {
1054         /* The Call node calls a locally defined method.  Remember to inline. */
1055         ienv->calls[ienv->pos++] = call;
1056       }
1057     }
1058   }
1059 }
1060
1061 /**
1062  * Inlines all small methods at call sites where the called address comes
1063  * from a Const node that references the entity representing the called
1064  * method.
1065  * The size argument is a rough measure for the code size of the method:
1066  * Methods where the obstack containing the firm graph is smaller than
1067  * size are inlined.
1068  */
1069 void inline_small_irgs(ir_graph *irg, int size) {
1070   int i;
1071   ir_graph *rem = current_ir_graph;
1072   inline_env_t env;
1073
1074   if (!(get_opt_optimize() && get_opt_inline())) return;
1075
1076   current_ir_graph = irg;
1077   /* Handle graph state */
1078   assert(get_irg_phase_state(current_ir_graph) != phase_building);
1079   assert(get_irg_callee_info_state(current_ir_graph) == irg_callee_info_none);
1080
1081   /* Find Call nodes to inline.
1082      (We can not inline during a walk of the graph, as inlineing the same
1083      method several times changes the visited flag of the walked graph:
1084      after the first inlineing visited of the callee equals visited of
1085      the caller.  With the next inlineing both are increased.) */
1086   env.pos = 0;
1087   irg_walk(get_irg_end(irg), NULL, collect_calls, &env);
1088
1089   if ((env.pos > 0) && (env.pos < MAX_INLINE)) {
1090     /* There are calls to inline */
1091     collect_phiprojs(irg);
1092     for (i = 0; i < env.pos; i++) {
1093       tarval *tv;
1094       ir_graph *callee;
1095       tv = get_Const_tarval(get_Call_ptr(env.calls[i]));
1096       callee = get_entity_irg(tarval_to_entity(tv));
1097       if (((_obstack_memory_used(callee->obst) - obstack_room(callee->obst)) < size) ||
1098       (get_irg_inline_property(callee) == irg_inline_forced)) {
1099         inline_method(env.calls[i], callee);
1100       }
1101     }
1102   }
1103
1104   current_ir_graph = rem;
1105 }
1106
1107 /**
1108  * Environment for inlining irgs.
1109  */
1110 typedef struct {
1111   int n_nodes;       /**< Nodes in graph except Id, Tuple, Proj, Start, End */
1112   int n_nodes_orig;  /**< for statistics */
1113   eset *call_nodes;  /**< All call nodes in this graph */
1114   int n_call_nodes;
1115   int n_call_nodes_orig; /**< for statistics */
1116   int n_callers;   /**< Number of known graphs that call this graphs. */
1117   int n_callers_orig; /**< for statistics */
1118 } inline_irg_env;
1119
1120 static inline_irg_env *new_inline_irg_env(void) {
1121   inline_irg_env *env = malloc(sizeof(inline_irg_env));
1122   env->n_nodes = -2; /* uncount Start, End */
1123   env->n_nodes_orig = -2; /* uncount Start, End */
1124   env->call_nodes = eset_create();
1125   env->n_call_nodes = 0;
1126   env->n_call_nodes_orig = 0;
1127   env->n_callers = 0;
1128   env->n_callers_orig = 0;
1129   return env;
1130 }
1131
1132 static void free_inline_irg_env(inline_irg_env *env) {
1133   eset_destroy(env->call_nodes);
1134   free(env);
1135 }
1136
1137 static void collect_calls2(ir_node *call, void *env) {
1138   inline_irg_env *x = (inline_irg_env *)env;
1139   ir_op *op = intern_get_irn_op(call);
1140   ir_graph *callee;
1141
1142   /* count nodes in irg */
1143   if (op != op_Proj && op != op_Tuple && op != op_Sync) {
1144     x->n_nodes++;
1145     x->n_nodes_orig++;
1146   }
1147
1148   if (op != op_Call) return;
1149
1150   /* collect all call nodes */
1151   eset_insert(x->call_nodes, (void *)call);
1152   x->n_call_nodes++;
1153   x->n_call_nodes_orig++;
1154
1155   /* count all static callers */
1156   callee = get_call_called_irg(call);
1157   if (callee) {
1158     ((inline_irg_env *)get_irg_link(callee))->n_callers++;
1159     ((inline_irg_env *)get_irg_link(callee))->n_callers_orig++;
1160   }
1161 }
1162
1163 INLINE static int is_leave(ir_graph *irg) {
1164   return (((inline_irg_env *)get_irg_link(irg))->n_call_nodes == 0);
1165 }
1166
1167 INLINE static int is_smaller(ir_graph *callee, int size) {
1168   return (((inline_irg_env *)get_irg_link(callee))->n_nodes < size);
1169 }
1170
1171
1172 /**
1173  * Inlines small leave methods at call sites where the called address comes
1174  * from a Const node that references the entity representing the called
1175  * method.
1176  * The size argument is a rough measure for the code size of the method:
1177  * Methods where the obstack containing the firm graph is smaller than
1178  * size are inlined.
1179  */
1180 void inline_leave_functions(int maxsize, int leavesize, int size) {
1181   inline_irg_env *env;
1182   int i, n_irgs = get_irp_n_irgs();
1183   ir_graph *rem = current_ir_graph;
1184   int did_inline = 1;
1185
1186   if (!(get_opt_optimize() && get_opt_inline())) return;
1187
1188   /* extend all irgs by a temporary data structure for inlineing. */
1189   for (i = 0; i < n_irgs; ++i)
1190     set_irg_link(get_irp_irg(i), new_inline_irg_env());
1191
1192   /* Precompute information in temporary data structure. */
1193   for (i = 0; i < n_irgs; ++i) {
1194     current_ir_graph = get_irp_irg(i);
1195     assert(get_irg_phase_state(current_ir_graph) != phase_building);
1196     assert(get_irg_callee_info_state(current_ir_graph) == irg_callee_info_none);
1197
1198     irg_walk(get_irg_end(current_ir_graph), NULL, collect_calls2,
1199          get_irg_link(current_ir_graph));
1200   }
1201
1202   /* and now inline.
1203      Inline leaves recursively -- we might construct new leaves. */
1204   /* int itercnt = 1; */
1205   while (did_inline) {
1206     /* printf("iteration %d\n", itercnt++); */
1207     did_inline = 0;
1208     for (i = 0; i < n_irgs; ++i) {
1209       ir_node *call;
1210       eset *walkset;
1211       int phiproj_computed = 0;
1212
1213       current_ir_graph = get_irp_irg(i);
1214       env = (inline_irg_env *)get_irg_link(current_ir_graph);
1215
1216       /* we can not walk and change a set, nor remove from it.
1217       So recompute.*/
1218       walkset = env->call_nodes;
1219       env->call_nodes = eset_create();
1220       for (call = eset_first(walkset); call; call = eset_next(walkset)) {
1221         inline_irg_env *callee_env;
1222         ir_graph *callee = get_call_called_irg(call);
1223
1224         if (env->n_nodes > maxsize) break;
1225         if (callee &&
1226         ((is_leave(callee) && is_smaller(callee, leavesize)) ||
1227          (get_irg_inline_property(callee) == irg_inline_forced))) {
1228           if (!phiproj_computed) {
1229             phiproj_computed = 1;
1230             collect_phiprojs(current_ir_graph);
1231           }
1232           callee_env = (inline_irg_env *)get_irg_link(callee);
1233 /*         printf(" %s: Inlineing %s.\n", get_entity_name(get_irg_entity(current_ir_graph)), */
1234 /*         get_entity_name(get_irg_entity(callee))); */
1235           inline_method(call, callee);
1236           did_inline = 1;
1237           env->n_call_nodes--;
1238           eset_insert_all(env->call_nodes, callee_env->call_nodes);
1239           env->n_call_nodes += callee_env->n_call_nodes;
1240           env->n_nodes += callee_env->n_nodes;
1241           callee_env->n_callers--;
1242         } else {
1243           eset_insert(env->call_nodes, call);
1244         }
1245       }
1246       eset_destroy(walkset);
1247     }
1248   }
1249
1250   /* printf("Non leaves\n"); */
1251   /* inline other small functions. */
1252   for (i = 0; i < n_irgs; ++i) {
1253     ir_node *call;
1254     eset *walkset;
1255     int phiproj_computed = 0;
1256
1257     current_ir_graph = get_irp_irg(i);
1258     env = (inline_irg_env *)get_irg_link(current_ir_graph);
1259
1260     /* we can not walk and change a set, nor remove from it.
1261        So recompute.*/
1262     walkset = env->call_nodes;
1263     env->call_nodes = eset_create();
1264     for (call = eset_first(walkset); call; call = eset_next(walkset)) {
1265       inline_irg_env *callee_env;
1266       ir_graph *callee = get_call_called_irg(call);
1267
1268       if (env->n_nodes > maxsize) break;
1269       if (callee && is_smaller(callee, size)) {
1270         if (!phiproj_computed) {
1271             phiproj_computed = 1;
1272             collect_phiprojs(current_ir_graph);
1273         }
1274         callee_env = (inline_irg_env *)get_irg_link(callee);
1275 /*       printf(" %s: Inlineing %s.\n", get_entity_name(get_irg_entity(current_ir_graph)), */
1276 /*       get_entity_name(get_irg_entity(callee))); */
1277         inline_method(call, callee);
1278         did_inline = 1;
1279         env->n_call_nodes--;
1280         eset_insert_all(env->call_nodes, callee_env->call_nodes);
1281         env->n_call_nodes += callee_env->n_call_nodes;
1282         env->n_nodes += callee_env->n_nodes;
1283         callee_env->n_callers--;
1284       } else {
1285         eset_insert(env->call_nodes, call);
1286       }
1287     }
1288     eset_destroy(walkset);
1289   }
1290
1291   for (i = 0; i < n_irgs; ++i) {
1292     current_ir_graph = get_irp_irg(i);
1293 #if 0
1294     env = (inline_irg_env *)get_irg_link(current_ir_graph);
1295     if ((env->n_call_nodes_orig != env->n_call_nodes) ||
1296     (env->n_callers_orig != env->n_callers))
1297       printf("Nodes:%3d ->%3d, calls:%3d ->%3d, callers:%3d ->%3d, -- %s\n",
1298          env->n_nodes_orig, env->n_nodes, env->n_call_nodes_orig, env->n_call_nodes,
1299          env->n_callers_orig, env->n_callers,
1300          get_entity_name(get_irg_entity(current_ir_graph)));
1301 #endif
1302     free_inline_irg_env((inline_irg_env *)get_irg_link(current_ir_graph));
1303   }
1304
1305   current_ir_graph = rem;
1306 }
1307
1308 /*******************************************************************/
1309 /*  Code Placement.  Pins all floating nodes to a block where they */
1310 /*  will be executed only if needed.                               */
1311 /*******************************************************************/
1312
1313 /**
1314  * Find the earliest correct block for N.  --- Place N into the
1315  * same Block as its dominance-deepest Input.
1316  */
1317 static void
1318 place_floats_early(ir_node *n, pdeq *worklist)
1319 {
1320   int i, start, irn_arity;
1321
1322   /* we must not run into an infinite loop */
1323   assert (irn_not_visited(n));
1324   mark_irn_visited(n);
1325
1326   /* Place floating nodes. */
1327   if (get_op_pinned(intern_get_irn_op(n)) == floats) {
1328     int depth = 0;
1329     ir_node *b = new_Bad();   /* The block to place this node in */
1330
1331     assert(intern_get_irn_op(n) != op_Block);
1332
1333     if ((intern_get_irn_op(n) == op_Const) ||
1334     (intern_get_irn_op(n) == op_SymConst) ||
1335     (is_Bad(n)) ||
1336     (intern_get_irn_op(n) == op_Unknown)) {
1337       /* These nodes will not be placed by the loop below. */
1338       b = get_irg_start_block(current_ir_graph);
1339       depth = 1;
1340     }
1341
1342     /* find the block for this node. */
1343     irn_arity = intern_get_irn_arity(n);
1344     for (i = 0; i < irn_arity; i++) {
1345       ir_node *dep = intern_get_irn_n(n, i);
1346       ir_node *dep_block;
1347       if ((irn_not_visited(dep)) &&
1348       (get_op_pinned(intern_get_irn_op(dep)) == floats)) {
1349         place_floats_early(dep, worklist);
1350       }
1351       /* Because all loops contain at least one pinned node, now all
1352          our inputs are either pinned or place_early has already
1353          been finished on them.  We do not have any unfinished inputs!  */
1354       dep_block = get_nodes_Block(dep);
1355       if ((!is_Bad(dep_block)) &&
1356           (get_Block_dom_depth(dep_block) > depth)) {
1357         b = dep_block;
1358         depth = get_Block_dom_depth(dep_block);
1359       }
1360       /* Avoid that the node is placed in the Start block */
1361       if ((depth == 1) && (get_Block_dom_depth(get_nodes_Block(n)) > 1)) {
1362         b = get_Block_cfg_out(get_irg_start_block(current_ir_graph), 0);
1363         assert(b != get_irg_start_block(current_ir_graph));
1364         depth = 2;
1365       }
1366     }
1367     set_nodes_Block(n, b);
1368   }
1369
1370   /* Add predecessors of non floating nodes on worklist. */
1371   start = (intern_get_irn_op(n) == op_Block) ? 0 : -1;
1372   irn_arity = intern_get_irn_arity(n);
1373   for (i = start; i < irn_arity; i++) {
1374     ir_node *pred = intern_get_irn_n(n, i);
1375     if (irn_not_visited(pred)) {
1376       pdeq_putr (worklist, pred);
1377     }
1378   }
1379 }
1380
1381 /**
1382  * Floating nodes form subgraphs that begin at nodes as Const, Load,
1383  * Start, Call and end at pinned nodes as Store, Call.  Place_early
1384  * places all floating nodes reachable from its argument through floating
1385  * nodes and adds all beginnings at pinned nodes to the worklist.
1386  */
1387 static INLINE void place_early(pdeq* worklist) {
1388   assert(worklist);
1389   inc_irg_visited(current_ir_graph);
1390
1391   /* this inits the worklist */
1392   place_floats_early(get_irg_end(current_ir_graph), worklist);
1393
1394   /* Work the content of the worklist. */
1395   while (!pdeq_empty (worklist)) {
1396     ir_node *n = pdeq_getl (worklist);
1397     if (irn_not_visited(n)) place_floats_early(n, worklist);
1398   }
1399
1400   set_irg_outs_inconsistent(current_ir_graph);
1401   current_ir_graph->pinned = pinned;
1402 }
1403
1404
1405 /** deepest common dominance ancestor of DCA and CONSUMER of PRODUCER. */
1406 static ir_node *
1407 consumer_dom_dca (ir_node *dca, ir_node *consumer, ir_node *producer)
1408 {
1409   ir_node *block = NULL;
1410
1411   /* Compute the latest block into which we can place a node so that it is
1412      before consumer. */
1413   if (intern_get_irn_op(consumer) == op_Phi) {
1414     /* our consumer is a Phi-node, the effective use is in all those
1415        blocks through which the Phi-node reaches producer */
1416     int i, irn_arity;
1417     ir_node *phi_block = get_nodes_Block(consumer);
1418     irn_arity = intern_get_irn_arity(consumer);
1419     for (i = 0;  i < irn_arity; i++) {
1420       if (intern_get_irn_n(consumer, i) == producer) {
1421     block = get_nodes_Block(get_Block_cfgpred(phi_block, i));
1422       }
1423     }
1424   } else {
1425     assert(is_no_Block(consumer));
1426     block = get_nodes_Block(consumer);
1427   }
1428
1429   /* Compute the deepest common ancestor of block and dca. */
1430   assert(block);
1431   if (!dca) return block;
1432   while (get_Block_dom_depth(block) > get_Block_dom_depth(dca))
1433     block = get_Block_idom(block);
1434   while (get_Block_dom_depth(dca) > get_Block_dom_depth(block))
1435     dca = get_Block_idom(dca);
1436   while (block != dca)
1437     { block = get_Block_idom(block); dca = get_Block_idom(dca); }
1438
1439   return dca;
1440 }
1441
1442 static INLINE int get_irn_loop_depth(ir_node *n) {
1443   return get_loop_depth(get_irn_loop(n));
1444 }
1445
1446 /**
1447  * Move n to a block with less loop depth than it's current block. The
1448  * new block must be dominated by early.
1449  */
1450 static void
1451 move_out_of_loops (ir_node *n, ir_node *early)
1452 {
1453   ir_node *best, *dca;
1454   assert(n && early);
1455
1456
1457   /* Find the region deepest in the dominator tree dominating
1458      dca with the least loop nesting depth, but still dominated
1459      by our early placement. */
1460   dca = get_nodes_Block(n);
1461   best = dca;
1462   while (dca != early) {
1463     dca = get_Block_idom(dca);
1464     if (!dca) break; /* should we put assert(dca)? */
1465     if (get_irn_loop_depth(dca) < get_irn_loop_depth(best)) {
1466       best = dca;
1467     }
1468   }
1469   if (best != get_nodes_Block(n)) {
1470     /* debug output
1471     printf("Moving out of loop: "); DDMN(n);
1472     printf(" Outermost block: "); DDMN(early);
1473     printf(" Best block: "); DDMN(best);
1474     printf(" Innermost block: "); DDMN(get_nodes_Block(n));
1475     */
1476     set_nodes_Block(n, best);
1477   }
1478 }
1479
1480 /**
1481  * Find the latest legal block for N and place N into the
1482  * `optimal' Block between the latest and earliest legal block.
1483  * The `optimal' block is the dominance-deepest block of those
1484  * with the least loop-nesting-depth.  This places N out of as many
1485  * loops as possible and then makes it as control dependant as
1486  * possible.
1487  */
1488 static void
1489 place_floats_late(ir_node *n, pdeq *worklist)
1490 {
1491   int i;
1492   ir_node *early;
1493
1494   assert (irn_not_visited(n)); /* no multiple placement */
1495
1496   /* no need to place block nodes, control nodes are already placed. */
1497   if ((intern_get_irn_op(n) != op_Block) &&
1498       (!is_cfop(n)) &&
1499       (intern_get_irn_mode(n) != mode_X)) {
1500     /* Remember the early placement of this block to move it
1501        out of loop no further than the early placement. */
1502     early = get_nodes_Block(n);
1503     /* Assure that our users are all placed, except the Phi-nodes.
1504        --- Each data flow cycle contains at least one Phi-node.  We
1505        have to break the `user has to be placed before the
1506        producer' dependence cycle and the Phi-nodes are the
1507        place to do so, because we need to base our placement on the
1508        final region of our users, which is OK with Phi-nodes, as they
1509        are pinned, and they never have to be placed after a
1510        producer of one of their inputs in the same block anyway. */
1511     for (i = 0; i < get_irn_n_outs(n); i++) {
1512       ir_node *succ = get_irn_out(n, i);
1513       if (irn_not_visited(succ) && (intern_get_irn_op(succ) != op_Phi))
1514     place_floats_late(succ, worklist);
1515     }
1516
1517     /* We have to determine the final block of this node... except for
1518        constants. */
1519     if ((get_op_pinned(intern_get_irn_op(n)) == floats) &&
1520     (intern_get_irn_op(n) != op_Const) &&
1521     (intern_get_irn_op(n) != op_SymConst)) {
1522       ir_node *dca = NULL;  /* deepest common ancestor in the
1523                    dominator tree of all nodes'
1524                    blocks depending on us; our final
1525                    placement has to dominate DCA. */
1526       for (i = 0; i < get_irn_n_outs(n); i++) {
1527     dca = consumer_dom_dca (dca, get_irn_out(n, i), n);
1528       }
1529       set_nodes_Block(n, dca);
1530
1531       move_out_of_loops (n, early);
1532     }
1533   }
1534
1535   mark_irn_visited(n);
1536
1537   /* Add predecessors of all non-floating nodes on list. (Those of floating
1538      nodes are placeded already and therefore are marked.)  */
1539   for (i = 0; i < get_irn_n_outs(n); i++) {
1540     if (irn_not_visited(get_irn_out(n, i))) {
1541       pdeq_putr (worklist, get_irn_out(n, i));
1542     }
1543   }
1544 }
1545
1546 static INLINE void place_late(pdeq* worklist) {
1547   assert(worklist);
1548   inc_irg_visited(current_ir_graph);
1549
1550   /* This fills the worklist initially. */
1551   place_floats_late(get_irg_start_block(current_ir_graph), worklist);
1552   /* And now empty the worklist again... */
1553   while (!pdeq_empty (worklist)) {
1554     ir_node *n = pdeq_getl (worklist);
1555     if (irn_not_visited(n)) place_floats_late(n, worklist);
1556   }
1557 }
1558
1559 void place_code(ir_graph *irg) {
1560   pdeq* worklist;
1561   ir_graph *rem = current_ir_graph;
1562
1563   current_ir_graph = irg;
1564
1565   if (!(get_opt_optimize() && get_opt_global_cse())) return;
1566
1567   /* Handle graph state */
1568   assert(get_irg_phase_state(irg) != phase_building);
1569   if (get_irg_dom_state(irg) != dom_consistent)
1570     compute_doms(irg);
1571
1572   if (get_irg_loopinfo_state(irg) != loopinfo_consistent) {
1573     free_loop_information(irg);
1574     construct_backedges(irg);
1575   }
1576
1577   /* Place all floating nodes as early as possible. This guarantees
1578      a legal code placement. */
1579   worklist = new_pdeq();
1580   place_early(worklist);
1581
1582   /* place_early invalidates the outs, place_late needs them. */
1583   compute_outs(irg);
1584   /* Now move the nodes down in the dominator tree. This reduces the
1585      unnecessary executions of the node. */
1586   place_late(worklist);
1587
1588   set_irg_outs_inconsistent(current_ir_graph);
1589   set_irg_loopinfo_inconsistent(current_ir_graph);
1590   del_pdeq(worklist);
1591   current_ir_graph = rem;
1592 }
1593
1594
1595
1596 /********************************************************************/
1597 /* Control flow optimization.                                       */
1598 /* Removes Bad control flow predecessors and empty blocks.  A block */
1599 /* is empty if it contains only a Jmp node.                         */
1600 /* Blocks can only be removed if they are not needed for the        */
1601 /* semantics of Phi nodes.                                          */
1602 /********************************************************************/
1603
1604 /**
1605  * Removes Tuples from Block control flow predecessors.
1606  * Optimizes blocks with equivalent_node().
1607  * Replaces n by Bad if n is unreachable control flow.
1608  */
1609 static void merge_blocks(ir_node *n, void *env) {
1610   int i;
1611   set_irn_link(n, NULL);
1612
1613   if (intern_get_irn_op(n) == op_Block) {
1614     /* Remove Tuples */
1615     for (i = 0; i < get_Block_n_cfgpreds(n); i++)
1616       /* GL @@@ : is this possible? if (get_opt_normalize()) -- added, all tests go through.
1617        A different order of optimizations might cause problems. */
1618       if (get_opt_normalize())
1619         set_Block_cfgpred(n, i, skip_Tuple(get_Block_cfgpred(n, i)));
1620   } else if (get_opt_optimize() && (intern_get_irn_mode(n) == mode_X)) {
1621     /* We will soon visit a block.  Optimize it before visiting! */
1622     ir_node *b = get_nodes_Block(n);
1623     ir_node *new_node = equivalent_node(b);
1624     while (irn_not_visited(b) && (!is_Bad(new_node)) && (new_node != b)) {
1625       /* We would have to run gigo if new is bad, so we
1626      promote it directly below. */
1627       assert(((b == new_node) ||
1628           get_opt_control_flow_straightening() ||
1629           get_opt_control_flow_weak_simplification()) &&
1630          ("strange flag setting"));
1631       exchange (b, new_node);
1632       b = new_node;
1633       new_node = equivalent_node(b);
1634     }
1635     /* GL @@@ get_opt_normalize hinzugefuegt, 5.5.2003 */
1636     if (is_Bad(new_node) && get_opt_normalize()) exchange(n, new_Bad());
1637   }
1638 }
1639
1640 /**
1641  * Collects all Phi nodes in link list of Block.
1642  * Marks all blocks "block_visited" if they contain a node other
1643  * than Jmp.
1644  */
1645 static void collect_nodes(ir_node *n, void *env) {
1646   if (is_no_Block(n)) {
1647     ir_node *b = get_nodes_Block(n);
1648
1649     if ((intern_get_irn_op(n) == op_Phi)) {
1650       /* Collect Phi nodes to compact ins along with block's ins. */
1651       set_irn_link(n, get_irn_link(b));
1652       set_irn_link(b, n);
1653     } else if (intern_get_irn_op(n) != op_Jmp) {  /* Check for non empty block. */
1654       mark_Block_block_visited(b);
1655     }
1656   }
1657 }
1658
1659 /** Returns true if pred is predecessor of block. */
1660 static int is_pred_of(ir_node *pred, ir_node *b) {
1661   int i;
1662   for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
1663     ir_node *b_pred = get_nodes_Block(get_Block_cfgpred(b, i));
1664     if (b_pred == pred) return 1;
1665   }
1666   return 0;
1667 }
1668
1669 static int test_whether_dispensable(ir_node *b, int pos) {
1670   int i, j, n_preds = 1;
1671   int dispensable = 1;
1672   ir_node *cfop = get_Block_cfgpred(b, pos);
1673   ir_node *pred = get_nodes_Block(cfop);
1674
1675   if (get_Block_block_visited(pred) + 1
1676       < get_irg_block_visited(current_ir_graph)) {
1677     if (!get_opt_optimize() || !get_opt_control_flow_strong_simplification()) {
1678       /* Mark block so that is will not be removed. */
1679       set_Block_block_visited(pred, get_irg_block_visited(current_ir_graph)-1);
1680       return 1;
1681     }
1682     /* Seems to be empty. */
1683     if (!get_irn_link(b)) {
1684       /* There are no Phi nodes ==> dispensable. */
1685       n_preds = get_Block_n_cfgpreds(pred);
1686     } else {
1687       /* b's pred blocks and pred's pred blocks must be pairwise disjunct.
1688      Work preds < pos as if they were already removed. */
1689       for (i = 0; i < pos; i++) {
1690         ir_node *b_pred = get_nodes_Block(get_Block_cfgpred(b, i));
1691         if (get_Block_block_visited(b_pred) + 1
1692             < get_irg_block_visited(current_ir_graph)) {
1693           for (j = 0; j < get_Block_n_cfgpreds(b_pred); j++) {
1694             ir_node *b_pred_pred = get_nodes_Block(get_Block_cfgpred(b_pred, j));
1695             if (is_pred_of(b_pred_pred, pred)) dispensable = 0;
1696           }
1697         } else {
1698           if (is_pred_of(b_pred, pred)) dispensable = 0;
1699         }
1700       }
1701       for (i = pos +1; i < get_Block_n_cfgpreds(b); i++) {
1702         ir_node *b_pred = get_nodes_Block(get_Block_cfgpred(b, i));
1703         if (is_pred_of(b_pred, pred)) dispensable = 0;
1704       }
1705       if (!dispensable) {
1706         set_Block_block_visited(pred, get_irg_block_visited(current_ir_graph)-1);
1707         n_preds = 1;
1708       } else {
1709         n_preds = get_Block_n_cfgpreds(pred);
1710       }
1711     }
1712   }
1713
1714   return n_preds;
1715 }
1716
1717 static void optimize_blocks(ir_node *b, void *env) {
1718   int i, j, k, max_preds, n_preds;
1719   ir_node *pred, *phi;
1720   ir_node **in;
1721
1722   /* Count the number of predecessor if this block is merged with pred blocks
1723      that are empty. */
1724   max_preds = 0;
1725   for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
1726     max_preds += test_whether_dispensable(b, i);
1727   }
1728   in = (ir_node **) malloc(max_preds * sizeof(ir_node *));
1729
1730 /*-
1731   printf(" working on "); DDMN(b);
1732   for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
1733     pred = get_nodes_Block(get_Block_cfgpred(b, i));
1734     if (is_Bad(get_Block_cfgpred(b, i))) {
1735       printf("  removing Bad %i\n ", i);
1736     } else if (get_Block_block_visited(pred) +1
1737            < get_irg_block_visited(current_ir_graph)) {
1738       printf("  removing pred %i ", i); DDMN(pred);
1739     } else { printf("  Nothing to do for "); DDMN(pred); }
1740   }
1741   * end Debug output -*/
1742
1743   /*- Fix the Phi nodes -*/
1744   phi = get_irn_link(b);
1745   while (phi) {
1746     assert(intern_get_irn_op(phi) == op_Phi);
1747     /* Find the new predecessors for the Phi */
1748     n_preds = 0;
1749     for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
1750       pred = get_nodes_Block(get_Block_cfgpred(b, i));
1751       if (is_Bad(get_Block_cfgpred(b, i))) {
1752         /* Do nothing */
1753       } else if (get_Block_block_visited(pred) +1
1754          < get_irg_block_visited(current_ir_graph)) {
1755         /* It's an empty block and not yet visited. */
1756         ir_node *phi_pred = get_Phi_pred(phi, i);
1757         for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
1758           if (get_nodes_Block(phi_pred) == pred) {
1759             assert(intern_get_irn_op(phi_pred) == op_Phi);  /* Block is empty!! */
1760             in[n_preds] = get_Phi_pred(phi_pred, j);
1761           } else {
1762             in[n_preds] = phi_pred;
1763           }
1764           n_preds++;
1765         }
1766         /* The Phi_pred node is replaced now if it is a Phi.
1767            In Schleifen kann offenbar der entfernte Phi Knoten legal verwendet werden.
1768            Daher muss der Phiknoten durch den neuen ersetzt werden.
1769            Weiter muss der alte Phiknoten entfernt werden (durch ersetzen oder
1770            durch einen Bad) damit er aus den keep_alive verschwinden kann.
1771            Man sollte also, falls keine Schleife vorliegt, exchange mit new_Bad
1772            aufrufen.  */
1773         if (get_nodes_Block(phi_pred) == pred) {
1774           /* remove the Phi as it might be kept alive. Further there
1775              might be other users. */
1776           exchange(phi_pred, phi);  /* geht, ist aber doch semantisch falsch! Warum?? */
1777         }
1778       } else {
1779         in[n_preds] = get_Phi_pred(phi, i);
1780         n_preds ++;
1781       }
1782     }
1783     /* Fix the node */
1784     set_irn_in(phi, n_preds, in);
1785
1786     phi = get_irn_link(phi);
1787   }
1788
1789 /*-
1790       This happens only if merge between loop backedge and single loop entry. -*/
1791   for (k = 0; k < get_Block_n_cfgpreds(b); k++) {
1792     pred = get_nodes_Block(get_Block_cfgpred(b, k));
1793     if (get_Block_block_visited(pred)+1 < get_irg_block_visited(current_ir_graph)) {
1794       phi = get_irn_link(pred);
1795       while (phi) {
1796         if (intern_get_irn_op(phi) == op_Phi) {
1797           set_nodes_Block(phi, b);
1798
1799           n_preds = 0;
1800           for (i = 0; i < k; i++) {
1801             pred = get_nodes_Block(get_Block_cfgpred(b, i));
1802             if (is_Bad(get_Block_cfgpred(b, i))) {
1803               /* Do nothing */
1804             } else if (get_Block_block_visited(pred) +1
1805                    < get_irg_block_visited(current_ir_graph)) {
1806               /* It's an empty block and not yet visited. */
1807               for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
1808             /* @@@ Hier brauche ich Schleifeninformation!!! Kontrollflusskante
1809                muss Rueckwaertskante sein! (An allen vier in[n_preds] = phi
1810                Anweisungen.) Trotzdem tuts bisher!! */
1811             in[n_preds] = phi;
1812             n_preds++;
1813               }
1814             } else {
1815               in[n_preds] = phi;
1816               n_preds++;
1817             }
1818           }
1819           for (i = 0; i < get_Phi_n_preds(phi); i++) {
1820             in[n_preds] = get_Phi_pred(phi, i);
1821             n_preds++;
1822           }
1823           for (i = k+1; i < get_Block_n_cfgpreds(b); i++) {
1824             pred = get_nodes_Block(get_Block_cfgpred(b, i));
1825             if (is_Bad(get_Block_cfgpred(b, i))) {
1826               /* Do nothing */
1827             } else if (get_Block_block_visited(pred) +1
1828                    < get_irg_block_visited(current_ir_graph)) {
1829               /* It's an empty block and not yet visited. */
1830               for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
1831                 in[n_preds] = phi;
1832                 n_preds++;
1833               }
1834             } else {
1835               in[n_preds] = phi;
1836               n_preds++;
1837             }
1838           }
1839           set_irn_in(phi, n_preds, in);
1840         }
1841         phi = get_irn_link(phi);
1842       }
1843     }
1844   }
1845
1846   /*- Fix the block -*/
1847   n_preds = 0;
1848   for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
1849     pred = get_nodes_Block(get_Block_cfgpred(b, i));
1850     if (is_Bad(get_Block_cfgpred(b, i))) {
1851       /* Do nothing */
1852     } else if (get_Block_block_visited(pred) +1
1853            < get_irg_block_visited(current_ir_graph)) {
1854       /* It's an empty block and not yet visited. */
1855       assert(get_Block_n_cfgpreds(b) > 1);
1856                         /* Else it should be optimized by equivalent_node. */
1857       for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
1858         in[n_preds] = get_Block_cfgpred(pred, j);
1859         n_preds++;
1860       }
1861       /* Remove block as it might be kept alive. */
1862       exchange(pred, b/*new_Bad()*/);
1863     } else {
1864       in[n_preds] = get_Block_cfgpred(b, i);
1865       n_preds ++;
1866     }
1867   }
1868   set_irn_in(b, n_preds, in);
1869   free(in);
1870 }
1871
1872 void optimize_cf(ir_graph *irg) {
1873   int i;
1874   ir_node **in;
1875   ir_node *end = get_irg_end(irg);
1876   ir_graph *rem = current_ir_graph;
1877   current_ir_graph = irg;
1878
1879   /* Handle graph state */
1880   assert(get_irg_phase_state(irg) != phase_building);
1881   if (get_irg_outs_state(current_ir_graph) == outs_consistent)
1882     set_irg_outs_inconsistent(current_ir_graph);
1883   if (get_irg_dom_state(current_ir_graph) == dom_consistent)
1884     set_irg_dom_inconsistent(current_ir_graph);
1885
1886   /* Use block visited flag to mark non-empty blocks. */
1887   inc_irg_block_visited(irg);
1888   irg_walk(end, merge_blocks, collect_nodes, NULL);
1889
1890   /* Optimize the standard code. */
1891   irg_block_walk(get_irg_end_block(irg), optimize_blocks, NULL, NULL);
1892
1893   /* Walk all keep alives, optimize them if block, add to new in-array
1894      for end if useful. */
1895   in = NEW_ARR_F (ir_node *, 1);
1896   in[0] = get_nodes_Block(end);
1897   inc_irg_visited(current_ir_graph);
1898   for(i = 0; i < get_End_n_keepalives(end); i++) {
1899     ir_node *ka = get_End_keepalive(end, i);
1900     if (irn_not_visited(ka)) {
1901       if ((intern_get_irn_op(ka) == op_Block) && Block_not_block_visited(ka)) {
1902         set_irg_block_visited(current_ir_graph,  /* Don't walk all the way to Start. */
1903                       get_irg_block_visited(current_ir_graph)-1);
1904         irg_block_walk(ka, optimize_blocks, NULL, NULL);
1905         mark_irn_visited(ka);
1906         ARR_APP1 (ir_node *, in, ka);
1907       } else if (intern_get_irn_op(ka) == op_Phi) {
1908         mark_irn_visited(ka);
1909         ARR_APP1 (ir_node *, in, ka);
1910       }
1911     }
1912   }
1913   /* DEL_ARR_F(end->in);   GL @@@ tut nicht ! */
1914   end->in = in;
1915
1916   current_ir_graph = rem;
1917 }
1918
1919
1920 /**
1921  * Called by walker of remove_critical_cf_edges().
1922  *
1923  * Place an empty block to an edge between a blocks of multiple
1924  * predecessors and a block of multiple successors.
1925  *
1926  * @param n IR node
1927  * @param env Environment of walker. This field is unused and has
1928  *            the value NULL.
1929  */
1930 static void walk_critical_cf_edges(ir_node *n, void *env) {
1931   int arity, i;
1932   ir_node *pre, *block, **in, *jmp;
1933
1934   /* Block has multiple predecessors */
1935   if ((op_Block == intern_get_irn_op(n)) &&
1936       (intern_get_irn_arity(n) > 1)) {
1937     arity = intern_get_irn_arity(n);
1938
1939     if (n == get_irg_end_block(current_ir_graph))
1940       return;  /*  No use to add a block here.      */
1941
1942     for (i=0; i<arity; i++) {
1943       pre = intern_get_irn_n(n, i);
1944       /* Predecessor has multiple successors. Insert new flow edge */
1945       if ((NULL != pre) &&
1946         (op_Proj == intern_get_irn_op(pre)) &&
1947         op_Raise != intern_get_irn_op(skip_Proj(pre))) {
1948
1949         /* set predecessor array for new block */
1950         in = NEW_ARR_D (ir_node *, current_ir_graph->obst, 1);
1951         /* set predecessor of new block */
1952         in[0] = pre;
1953         block = new_Block(1, in);
1954         /* insert new jmp node to new block */
1955         switch_block(block);
1956         jmp = new_Jmp();
1957         switch_block(n);
1958         /* set successor of new block */
1959         set_irn_n(n, i, jmp);
1960
1961       } /* predecessor has multiple successors */
1962     } /* for all predecessors */
1963   } /* n is a block */
1964 }
1965
1966 void remove_critical_cf_edges(ir_graph *irg) {
1967   if (get_opt_critical_edges())
1968     irg_walk_graph(irg, NULL, walk_critical_cf_edges, NULL);
1969 }