nsz Git - libfirm/blob - ir/opt/opt_inline.c

   1 /*
   2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
   3  *
   4  * This file is part of libFirm.
   5  *
   6  * This file may be distributed and/or modified under the terms of the
   7  * GNU General Public License version 2 as published by the Free Software
   8  * Foundation and appearing in the file LICENSE.GPL included in the
   9  * packaging of this file.
  10  *
  11  * Licensees holding valid libFirm Professional Edition licenses may use
  12  * this file in accordance with the libFirm Commercial License.
  13  * Agreement provided with the Software.
  14  *
  15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  17  * PURPOSE.
  18  */
  19
  20 /**
  21  * @file
  22  * @brief    Dead node elimination and Procedure Inlining.
  23  * @author   Michael Beck, Goetz Lindenmaier
  24  * @version  $Id$
  25  */
  26 #ifdef HAVE_CONFIG_H
  27 # include "config.h"
  28 #endif
  29
  30 #include <limits.h>
  31 #include <assert.h>
  32
  33 #include "irnode_t.h"
  34 #include "irgraph_t.h"
  35 #include "irprog_t.h"
  36
  37 #include "iroptimize.h"
  38 #include "ircons_t.h"
  39 #include "iropt_t.h"
  40 #include "irgopt.h"
  41 #include "irgmod.h"
  42 #include "irgwalk.h"
  43
  44 #include "adt/array.h"
  45 #include "adt/pset.h"
  46 #include "adt/pmap.h"
  47 #include "adt/pdeq.h"
  48 #include "adt/xmalloc.h"
  49
  50 #include "irouts.h"
  51 #include "irloop_t.h"
  52 #include "irbackedge_t.h"
  53 #include "opt_inline_t.h"
  54 #include "cgana.h"
  55 #include "trouts.h"
  56 #include "error.h"
  57
  58 #include "analyze_irg_args.h"
  59 #include "iredges_t.h"
  60 #include "irflag_t.h"
  61 #include "irhooks.h"
  62 #include "irtools.h"
  63
  64 DEBUG_ONLY(static firm_dbg_module_t *dbg;)
  65
  66 /*------------------------------------------------------------------*/
  67 /* Routines for dead node elimination / copying garbage collection  */
  68 /* of the obstack.                                                  */
  69 /*------------------------------------------------------------------*/
  70
  71 /**
  72  * Remember the new node in the old node by using a field all nodes have.
  73  */
  74 #define set_new_node(oldn, newn)  set_irn_link(oldn, newn)
  75
  76 /**
  77  * Get this new node, before the old node is forgotten.
  78  */
  79 #define get_new_node(oldn) get_irn_link(oldn)
  80
  81 /**
  82  * Check if a new node was set.
  83  */
  84 #define has_new_node(n) (get_new_node(n) != NULL)
  85
  86 /**
  87  * We use the block_visited flag to mark that we have computed the
  88  * number of useful predecessors for this block.
  89  * Further we encode the new arity in this flag in the old blocks.
  90  * Remembering the arity is useful, as it saves a lot of pointer
  91  * accesses.  This function is called for all Phi and Block nodes
  92  * in a Block.
  93  */
  94 static INLINE int
  95 compute_new_arity(ir_node *b) {
  96         int i, res, irn_arity;
  97         int irg_v, block_v;
  98
  99         irg_v = get_irg_block_visited(current_ir_graph);
 100         block_v = get_Block_block_visited(b);
 101         if (block_v >= irg_v) {
 102                 /* we computed the number of preds for this block and saved it in the
 103                    block_v flag */
 104                 return block_v - irg_v;
 105         } else {
 106                 /* compute the number of good predecessors */
 107                 res = irn_arity = get_irn_arity(b);
 108                 for (i = 0; i < irn_arity; i++)
 109                         if (is_Bad(get_irn_n(b, i))) res--;
 110                         /* save it in the flag. */
 111                         set_Block_block_visited(b, irg_v + res);
 112                         return res;
 113         }
 114 }
 115
 116 /**
 117  * Copies the node to the new obstack. The Ins of the new node point to
 118  * the predecessors on the old obstack.  For block/phi nodes not all
 119  * predecessors might be copied.  n->link points to the new node.
 120  * For Phi and Block nodes the function allocates in-arrays with an arity
 121  * only for useful predecessors.  The arity is determined by counting
 122  * the non-bad predecessors of the block.
 123  *
 124  * @param n    The node to be copied
 125  * @param env  if non-NULL, the node number attribute will be copied to the new node
 126  *
 127  * Note: Also used for loop unrolling.
 128  */
 129 static void copy_node(ir_node *n, void *env) {
 130         ir_node *nn, *block;
 131         int new_arity;
 132         ir_op *op = get_irn_op(n);
 133         (void) env;
 134
 135         if (op == op_Bad) {
 136                 /* node copied already */
 137                 return;
 138         } else if (op == op_Block) {
 139                 block = NULL;
 140                 new_arity = compute_new_arity(n);
 141                 n->attr.block.graph_arr = NULL;
 142         } else {
 143                 block = get_nodes_block(n);
 144                 if (op == op_Phi) {
 145                         new_arity = compute_new_arity(block);
 146                 } else {
 147                         new_arity = get_irn_arity(n);
 148                 }
 149         }
 150         nn = new_ir_node(get_irn_dbg_info(n),
 151                 current_ir_graph,
 152                 block,
 153                 op,
 154                 get_irn_mode(n),
 155                 new_arity,
 156                 get_irn_in(n) + 1);
 157         /* Copy the attributes.  These might point to additional data.  If this
 158            was allocated on the old obstack the pointers now are dangling.  This
 159            frees e.g. the memory of the graph_arr allocated in new_immBlock. */
 160         if (op == op_Block) {
 161                 /* we cannot allow blocks WITHOUT macroblock input */
 162                 set_Block_MacroBlock(nn, get_Block_MacroBlock(n));
 163         }
 164         copy_node_attr(n, nn);
 165
 166 #ifdef DEBUG_libfirm
 167         {
 168                 int copy_node_nr = env != NULL;
 169                 if (copy_node_nr) {
 170                         /* for easier debugging, we want to copy the node numbers too */
 171                         nn->node_nr = n->node_nr;
 172                 }
 173         }
 174 #endif
 175
 176         set_new_node(n, nn);
 177         hook_dead_node_elim_subst(current_ir_graph, n, nn);
 178 }
 179
 180 /**
 181  * Copies new predecessors of old node to new node remembered in link.
 182  * Spare the Bad predecessors of Phi and Block nodes.
 183  */
 184 static void copy_preds(ir_node *n, void *env) {
 185         ir_node *nn, *block;
 186         int i, j, irn_arity;
 187         (void) env;
 188
 189         nn = get_new_node(n);
 190
 191         if (is_Block(n)) {
 192                 /* copy the macro block header */
 193                 ir_node *mbh = get_Block_MacroBlock(n);
 194
 195                 if (mbh == n) {
 196                         /* this block is a macroblock header */
 197                         set_Block_MacroBlock(nn, nn);
 198                 } else {
 199                         /* get the macro block header */
 200                         ir_node *nmbh = get_new_node(mbh);
 201                         assert(nmbh != NULL);
 202                         set_Block_MacroBlock(nn, nmbh);
 203                 }
 204
 205                 /* Don't copy Bad nodes. */
 206                 j = 0;
 207                 irn_arity = get_irn_arity(n);
 208                 for (i = 0; i < irn_arity; i++) {
 209                         if (! is_Bad(get_irn_n(n, i))) {
 210                                 ir_node *pred = get_irn_n(n, i);
 211                                 set_irn_n(nn, j, get_new_node(pred));
 212                                 j++;
 213                         }
 214                 }
 215                 /* repair the block visited flag from above misuse. Repair it in both
 216                    graphs so that the old one can still be used. */
 217                 set_Block_block_visited(nn, 0);
 218                 set_Block_block_visited(n, 0);
 219                 /* Local optimization could not merge two subsequent blocks if
 220                    in array contained Bads.  Now it's possible.
 221                    We don't call optimize_in_place as it requires
 222                    that the fields in ir_graph are set properly. */
 223                 if ((get_opt_control_flow_straightening()) &&
 224                         (get_Block_n_cfgpreds(nn) == 1) &&
 225                         is_Jmp(get_Block_cfgpred(nn, 0))) {
 226                         ir_node *old = get_nodes_block(get_Block_cfgpred(nn, 0));
 227                         if (nn == old) {
 228                                 /* Jmp jumps into the block it is in -- deal self cycle. */
 229                                 assert(is_Bad(get_new_node(get_irg_bad(current_ir_graph))));
 230                                 exchange(nn, get_new_node(get_irg_bad(current_ir_graph)));
 231                         } else {
 232                                 exchange(nn, old);
 233                         }
 234                 }
 235         } else if (is_Phi(n) && get_irn_arity(n) > 0) {
 236                 /* Don't copy node if corresponding predecessor in block is Bad.
 237                    The Block itself should not be Bad. */
 238                 block = get_nodes_block(n);
 239                 set_nodes_block(nn, get_new_node(block));
 240                 j = 0;
 241                 irn_arity = get_irn_arity(n);
 242                 for (i = 0; i < irn_arity; i++) {
 243                         if (! is_Bad(get_irn_n(block, i))) {
 244                                 ir_node *pred = get_irn_n(n, i);
 245                                 set_irn_n(nn, j, get_new_node(pred));
 246                                 /*if (is_backedge(n, i)) set_backedge(nn, j);*/
 247                                 j++;
 248                         }
 249                 }
 250                 /* If the pre walker reached this Phi after the post walker visited the
 251                    block block_visited is > 0. */
 252                 set_Block_block_visited(get_nodes_block(n), 0);
 253                 /* Compacting the Phi's ins might generate Phis with only one
 254                    predecessor. */
 255                 if (get_irn_arity(nn) == 1)
 256                         exchange(nn, get_irn_n(nn, 0));
 257         } else {
 258                 irn_arity = get_irn_arity(n);
 259                 for (i = -1; i < irn_arity; i++)
 260                         set_irn_n(nn, i, get_new_node(get_irn_n(n, i)));
 261         }
 262         /* Now the new node is complete.  We can add it to the hash table for CSE.
 263            @@@ inlining aborts if we identify End. Why? */
 264         if (!is_End(nn))
 265                 add_identities(current_ir_graph->value_table, nn);
 266 }
 267
 268 /**
 269  * Copies the graph recursively, compacts the keep-alives of the end node.
 270  *
 271  * @param irg           the graph to be copied
 272  * @param copy_node_nr  If non-zero, the node number will be copied
 273  */
 274 static void copy_graph(ir_graph *irg, int copy_node_nr) {
 275         ir_node *oe, *ne, *ob, *nb, *om, *nm; /* old end, new end, old bad, new bad, old NoMem, new NoMem */
 276         ir_node *ka;      /* keep alive */
 277         int i, irn_arity;
 278         unsigned long vfl;
 279
 280         /* Some nodes must be copied by hand, sigh */
 281         vfl = get_irg_visited(irg);
 282         set_irg_visited(irg, vfl + 1);
 283
 284         oe = get_irg_end(irg);
 285         mark_irn_visited(oe);
 286         /* copy the end node by hand, allocate dynamic in array! */
 287         ne = new_ir_node(get_irn_dbg_info(oe),
 288                 irg,
 289                 NULL,
 290                 op_End,
 291                 mode_X,
 292                 -1,
 293                 NULL);
 294         /* Copy the attributes.  Well, there might be some in the future... */
 295         copy_node_attr(oe, ne);
 296         set_new_node(oe, ne);
 297
 298         /* copy the Bad node */
 299         ob = get_irg_bad(irg);
 300         mark_irn_visited(ob);
 301         nb = new_ir_node(get_irn_dbg_info(ob),
 302                 irg,
 303                 NULL,
 304                 op_Bad,
 305                 mode_T,
 306                 0,
 307                 NULL);
 308         copy_node_attr(ob, nb);
 309         set_new_node(ob, nb);
 310
 311         /* copy the NoMem node */
 312         om = get_irg_no_mem(irg);
 313         mark_irn_visited(om);
 314         nm = new_ir_node(get_irn_dbg_info(om),
 315                 irg,
 316                 NULL,
 317                 op_NoMem,
 318                 mode_M,
 319                 0,
 320                 NULL);
 321         copy_node_attr(om, nm);
 322         set_new_node(om, nm);
 323
 324         /* copy the live nodes */
 325         set_irg_visited(irg, vfl);
 326         irg_walk(get_nodes_block(oe), copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
 327
 328         /* Note: from yet, the visited flag of the graph is equal to vfl + 1 */
 329
 330         /* visit the anchors as well */
 331         for (i = get_irg_n_anchors(irg) - 1; i >= 0; --i) {
 332                 ir_node *n = get_irg_anchor(irg, i);
 333
 334                 if (n && (get_irn_visited(n) <= vfl)) {
 335                         set_irg_visited(irg, vfl);
 336                         irg_walk(n, copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
 337                 }
 338         }
 339
 340         /* copy_preds for the end node ... */
 341         set_nodes_block(ne, get_new_node(get_nodes_block(oe)));
 342
 343         /*- ... and now the keep alives. -*/
 344         /* First pick the not marked block nodes and walk them.  We must pick these
 345            first as else we will oversee blocks reachable from Phis. */
 346         irn_arity = get_End_n_keepalives(oe);
 347         for (i = 0; i < irn_arity; i++) {
 348                 ka = get_End_keepalive(oe, i);
 349                 if (is_Block(ka)) {
 350                         if (get_irn_visited(ka) <= vfl) {
 351                                 /* We must keep the block alive and copy everything reachable */
 352                                 set_irg_visited(irg, vfl);
 353                                 irg_walk(ka, copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
 354                         }
 355                         add_End_keepalive(ne, get_new_node(ka));
 356                 }
 357         }
 358
 359         /* Now pick other nodes.  Here we will keep all! */
 360         irn_arity = get_End_n_keepalives(oe);
 361         for (i = 0; i < irn_arity; i++) {
 362                 ka = get_End_keepalive(oe, i);
 363                 if (!is_Block(ka)) {
 364                         if (get_irn_visited(ka) <= vfl) {
 365                                 /* We didn't copy the node yet.  */
 366                                 set_irg_visited(irg, vfl);
 367                                 irg_walk(ka, copy_node, copy_preds, INT_TO_PTR(copy_node_nr));
 368                         }
 369                         add_End_keepalive(ne, get_new_node(ka));
 370                 }
 371         }
 372
 373         /* start block sometimes only reached after keep alives */
 374         set_nodes_block(nb, get_new_node(get_nodes_block(ob)));
 375         set_nodes_block(nm, get_new_node(get_nodes_block(om)));
 376 }
 377
 378 /**
 379  * Copies the graph reachable from current_ir_graph->end to the obstack
 380  * in current_ir_graph and fixes the environment.
 381  * Then fixes the fields in current_ir_graph containing nodes of the
 382  * graph.
 383  *
 384  * @param copy_node_nr  If non-zero, the node number will be copied
 385  */
 386 static void
 387 copy_graph_env(int copy_node_nr) {
 388         ir_graph *irg = current_ir_graph;
 389         ir_node *old_end, *new_anchor;
 390         int i;
 391
 392         /* remove end_except and end_reg nodes */
 393         old_end = get_irg_end(irg);
 394         set_irg_end_except (irg, old_end);
 395         set_irg_end_reg    (irg, old_end);
 396
 397         /* Not all nodes remembered in irg might be reachable
 398            from the end node.  Assure their link is set to NULL, so that
 399            we can test whether new nodes have been computed. */
 400         for (i = get_irg_n_anchors(irg) - 1; i >= 0; --i) {
 401                 ir_node *n = get_irg_anchor(irg, i);
 402                 if (n != NULL)
 403                         set_new_node(n, NULL);
 404         }
 405         /* we use the block walk flag for removing Bads from Blocks ins. */
 406         inc_irg_block_visited(irg);
 407
 408         /* copy the graph */
 409         copy_graph(irg, copy_node_nr);
 410
 411         /* fix the anchor */
 412         old_end    = get_irg_end(irg);
 413         new_anchor = new_Anchor(irg);
 414
 415         for (i = get_irg_n_anchors(irg) - 1; i >= 0; --i) {
 416                 ir_node *n = get_irg_anchor(irg, i);
 417                 if (n)
 418                         set_irn_n(new_anchor, i, get_new_node(n));
 419         }
 420         free_End(old_end);
 421         irg->anchor = new_anchor;
 422
 423         /* ensure the new anchor is placed in the endblock */
 424         set_nodes_block(new_anchor, get_irg_end_block(irg));
 425 }
 426
 427 /**
 428  * Copies all reachable nodes to a new obstack.  Removes bad inputs
 429  * from block nodes and the corresponding inputs from Phi nodes.
 430  * Merges single exit blocks with single entry blocks and removes
 431  * 1-input Phis.
 432  * Adds all new nodes to a new hash table for CSE.  Does not
 433  * perform CSE, so the hash table might contain common subexpressions.
 434  */
 435 void dead_node_elimination(ir_graph *irg) {
 436         ir_graph *rem;
 437 #ifdef INTERPROCEDURAL_VIEW
 438         int rem_ipview = get_interprocedural_view();
 439 #endif
 440         struct obstack *graveyard_obst = NULL;
 441         struct obstack *rebirth_obst   = NULL;
 442         assert(! edges_activated(irg) && "dead node elimination requires disabled edges");
 443
 444         /* inform statistics that we started a dead-node elimination run */
 445         hook_dead_node_elim(irg, 1);
 446
 447         /* Remember external state of current_ir_graph. */
 448         rem = current_ir_graph;
 449         current_ir_graph = irg;
 450 #ifdef INTERPROCEDURAL_VIEW
 451         set_interprocedural_view(0);
 452 #endif
 453
 454         assert(get_irg_phase_state(irg) != phase_building);
 455
 456         /* Handle graph state */
 457         free_callee_info(irg);
 458         free_irg_outs(irg);
 459         free_trouts();
 460
 461         /* @@@ so far we loose loops when copying */
 462         free_loop_information(irg);
 463
 464         set_irg_doms_inconsistent(irg);
 465
 466         /* A quiet place, where the old obstack can rest in peace,
 467            until it will be cremated. */
 468         graveyard_obst = irg->obst;
 469
 470         /* A new obstack, where the reachable nodes will be copied to. */
 471         rebirth_obst = xmalloc(sizeof(*rebirth_obst));
 472         irg->obst = rebirth_obst;
 473         obstack_init(irg->obst);
 474         irg->last_node_idx = 0;
 475
 476         /* We also need a new value table for CSE */
 477         del_identities(irg->value_table);
 478         irg->value_table = new_identities();
 479
 480         /* Copy the graph from the old to the new obstack */
 481         copy_graph_env(/*copy_node_nr=*/1);
 482
 483         /* Free memory from old unoptimized obstack */
 484         obstack_free(graveyard_obst, 0);  /* First empty the obstack ... */
 485         xfree(graveyard_obst);            /* ... then free it.           */
 486
 487         /* inform statistics that the run is over */
 488         hook_dead_node_elim(irg, 0);
 489
 490         current_ir_graph = rem;
 491 #ifdef INTERPROCEDURAL_VIEW
 492         set_interprocedural_view(rem_ipview);
 493 #endif
 494 }
 495
 496 /**
 497  * Relink bad predecessors of a block and store the old in array to the
 498  * link field. This function is called by relink_bad_predecessors().
 499  * The array of link field starts with the block operand at position 0.
 500  * If block has bad predecessors, create a new in array without bad preds.
 501  * Otherwise let in array untouched.
 502  */
 503 static void relink_bad_block_predecessors(ir_node *n, void *env) {
 504         ir_node **new_in, *irn;
 505         int i, new_irn_n, old_irn_arity, new_irn_arity = 0;
 506         (void) env;
 507
 508         /* if link field of block is NULL, look for bad predecessors otherwise
 509            this is already done */
 510         if (is_Block(n) && get_irn_link(n) == NULL) {
 511                 /* save old predecessors in link field (position 0 is the block operand)*/
 512                 set_irn_link(n, get_irn_in(n));
 513
 514                 /* count predecessors without bad nodes */
 515                 old_irn_arity = get_irn_arity(n);
 516                 for (i = 0; i < old_irn_arity; i++)
 517                         if (!is_Bad(get_irn_n(n, i)))
 518                                 ++new_irn_arity;
 519
 520                 /* arity changing: set new predecessors without bad nodes */
 521                 if (new_irn_arity < old_irn_arity) {
 522                         /* Get new predecessor array. We do not resize the array, as we must
 523                            keep the old one to update Phis. */
 524                         new_in = NEW_ARR_D(ir_node *, current_ir_graph->obst, (new_irn_arity+1));
 525
 526                         /* set new predecessors in array */
 527                         new_in[0] = NULL;
 528                         new_irn_n = 1;
 529                         for (i = 0; i < old_irn_arity; i++) {
 530                                 irn = get_irn_n(n, i);
 531                                 if (!is_Bad(irn)) {
 532                                         new_in[new_irn_n] = irn;
 533                                         is_backedge(n, i) ? set_backedge(n, new_irn_n-1) : set_not_backedge(n, new_irn_n-1);
 534                                         ++new_irn_n;
 535                                 }
 536                         }
 537                         /* ARR_SETLEN(int, n->attr.block.backedge, new_irn_arity); */
 538                         ARR_SHRINKLEN(n->attr.block.backedge, new_irn_arity);
 539                         n->in = new_in;
 540                 } /* ir node has bad predecessors */
 541         } /* Block is not relinked */
 542 }
 543
 544 /**
 545  * Relinks Bad predecessors from Blocks and Phis called by walker
 546  * remove_bad_predecesors(). If n is a Block, call
 547  * relink_bad_block_redecessors(). If n is a Phi-node, call also the relinking
 548  * function of Phi's Block. If this block has bad predecessors, relink preds
 549  * of the Phi-node.
 550  */
 551 static void relink_bad_predecessors(ir_node *n, void *env) {
 552         ir_node *block, **old_in;
 553         int i, old_irn_arity, new_irn_arity;
 554
 555         /* relink bad predecessors of a block */
 556         if (is_Block(n))
 557                 relink_bad_block_predecessors(n, env);
 558
 559         /* If Phi node relink its block and its predecessors */
 560         if (is_Phi(n)) {
 561                 /* Relink predecessors of phi's block */
 562                 block = get_nodes_block(n);
 563                 if (get_irn_link(block) == NULL)
 564                         relink_bad_block_predecessors(block, env);
 565
 566                 old_in = (ir_node **)get_irn_link(block); /* Of Phi's Block */
 567                 old_irn_arity = ARR_LEN(old_in);
 568
 569                 /* Relink Phi predecessors if count of predecessors changed */
 570                 if (old_irn_arity != ARR_LEN(get_irn_in(block))) {
 571                         /* set new predecessors in array
 572                            n->in[0] remains the same block */
 573                         new_irn_arity = 1;
 574                         for(i = 1; i < old_irn_arity; i++)
 575                                 if (!is_Bad(old_in[i])) {
 576                                         n->in[new_irn_arity] = n->in[i];
 577                                         is_backedge(n, i) ? set_backedge(n, new_irn_arity) : set_not_backedge(n, new_irn_arity);
 578                                         ++new_irn_arity;
 579                                 }
 580
 581                                 ARR_SETLEN(ir_node *, n->in, new_irn_arity);
 582                                 ARR_SETLEN(int, n->attr.phi.u.backedge, new_irn_arity);
 583                 }
 584         } /* n is a Phi node */
 585 }
 586
/*
 * Removes Bad predecessors from Blocks and the corresponding inputs of
 * Phi nodes, as dead_node_elimination() does, but without copying the
 * graph.
 * The graph walk uses firm_clear_link as pre-walker and
 * relink_bad_predecessors() as post-walker (the latter stores the old in
 * array in the link field and sets a new in array if the number of
 * predecessors changes).
 *
 * NOTE: the function calls panic() before the walk; presumably panic()
 * does not return, in which case the walk is never started and the
 * function is effectively disabled until the backedge handling is fixed.
 */
void remove_bad_predecessors(ir_graph *irg) {
	panic("Fix backedge handling first");
	irg_walk_graph(irg, firm_clear_link, relink_bad_predecessors, NULL);
}
 600
 601
 602 /*
 603    __                      _  __ __
 604   (_     __    o     _    | \/  |_
 605   __)|_| | \_/ | \_/(/_   |_/\__|__
 606
 607   The following stuff implements a facility that automatically patches
 608   registered ir_node pointers to the new node when a dead node elimination occurs.
 609 */
 610
/**
 * Environment of the "survive DCE" facility: keeps track of registered
 * ir_node pointers and of the hooks that patch them.
 */
struct _survive_dce_t {
	struct obstack obst;                /* the survive_dce_list_t entries are allocated here */
	pmap *places;                       /* maps a node to the list of places registered for it */
	pmap *new_places;                   /* replacement map, created when a dead node elimination starts; NULL otherwise */
	hook_entry_t dead_node_elim;        /* hook entry calling dead_node_hook() */
	hook_entry_t dead_node_elim_subst;  /* hook entry calling dead_node_subst_hook() */
};
 618
/**
 * Singly linked list of the places registered for one node.
 */
typedef struct _survive_dce_list_t {
	struct _survive_dce_list_t *next;   /* next entry for the same node, NULL at the end */
	ir_node **place;                    /* address of the node pointer that gets patched */
} survive_dce_list_t;
 623
 624 static void dead_node_hook(void *context, ir_graph *irg, int start) {
 625         survive_dce_t *sd = context;
 626         (void) irg;
 627
 628         /* Create a new map before the dead node elimination is performed. */
 629         if (start) {
 630                 sd->new_places = pmap_create_ex(pmap_count(sd->places));
 631         } else {
 632                 /* Patch back all nodes if dead node elimination is over and something is to be done. */
 633                 pmap_destroy(sd->places);
 634                 sd->places     = sd->new_places;
 635                 sd->new_places = NULL;
 636         }
 637 }
 638
 639 /**
 640  * Hook called when dead node elimination replaces old by nw.
 641  */
 642 static void dead_node_subst_hook(void *context, ir_graph *irg, ir_node *old, ir_node *nw) {
 643         survive_dce_t *sd = context;
 644         survive_dce_list_t *list = pmap_get(sd->places, old);
 645         (void) irg;
 646
 647         /* If the node is to be patched back, write the new address to all registered locations. */
 648         if (list) {
 649                 survive_dce_list_t *p;
 650
 651                 for (p = list; p; p = p->next)
 652                         *(p->place) = nw;
 653
 654                 pmap_insert(sd->new_places, nw, list);
 655         }
 656 }
 657
 658 /**
 659  * Make a new Survive DCE environment.
 660  */
 661 survive_dce_t *new_survive_dce(void) {
 662         survive_dce_t *res = xmalloc(sizeof(res[0]));
 663         obstack_init(&res->obst);
 664         res->places     = pmap_create();
 665         res->new_places = NULL;
 666
 667         res->dead_node_elim.hook._hook_dead_node_elim = dead_node_hook;
 668         res->dead_node_elim.context                   = res;
 669         res->dead_node_elim.next                      = NULL;
 670
 671         res->dead_node_elim_subst.hook._hook_dead_node_elim_subst = dead_node_subst_hook;
 672         res->dead_node_elim_subst.context = res;
 673         res->dead_node_elim_subst.next    = NULL;
 674
 675 #ifndef FIRM_ENABLE_HOOKS
 676         assert(0 && "need hooks enabled");
 677 #endif
 678
 679         register_hook(hook_dead_node_elim, &res->dead_node_elim);
 680         register_hook(hook_dead_node_elim_subst, &res->dead_node_elim_subst);
 681         return res;
 682 }
 683
 684 /**
 685  * Free a Survive DCE environment.
 686  */
 687 void free_survive_dce(survive_dce_t *sd) {
 688         obstack_free(&sd->obst, NULL);
 689         pmap_destroy(sd->places);
 690         unregister_hook(hook_dead_node_elim, &sd->dead_node_elim);
 691         unregister_hook(hook_dead_node_elim_subst, &sd->dead_node_elim_subst);
 692         xfree(sd);
 693 }
 694
 695 /**
 696  * Register a node pointer to be patched upon DCE.
 697  * When DCE occurs, the node pointer specified by @p place will be
 698  * patched to the new address of the node it is pointing to.
 699  *
 700  * @param sd    The Survive DCE environment.
 701  * @param place The address of the node pointer.
 702  */
 703 void survive_dce_register_irn(survive_dce_t *sd, ir_node **place) {
 704         if (*place != NULL) {
 705                 ir_node *irn      = *place;
 706                 survive_dce_list_t *curr = pmap_get(sd->places, irn);
 707                 survive_dce_list_t *nw   = obstack_alloc(&sd->obst, sizeof(nw[0]));
 708
 709                 nw->next  = curr;
 710                 nw->place = place;
 711
 712                 pmap_insert(sd->places, irn, nw);
 713         }
 714 }
 715
 716 /*--------------------------------------------------------------------*/
 717 /*  Functionality for inlining                                         */
 718 /*--------------------------------------------------------------------*/
 719
 720 /**
 721  * Copy node for inlineing.  Updates attributes that change when
 722  * inlineing but not for dead node elimination.
 723  *
 724  * Copies the node by calling copy_node() and then updates the entity if
 725  * it's a local one.  env must be a pointer of the frame type of the
 726  * inlined procedure. The new entities must be in the link field of
 727  * the entities.
 728  */
 729 static INLINE void
 730 copy_node_inline(ir_node *n, void *env) {
 731         ir_node *nn;
 732         ir_type *frame_tp = (ir_type *)env;
 733
 734         copy_node(n, NULL);
 735         if (is_Sel(n)) {
 736                 nn = get_new_node (n);
 737                 assert(is_Sel(nn));
 738                 if (get_entity_owner(get_Sel_entity(n)) == frame_tp) {
 739                         set_Sel_entity(nn, get_entity_link(get_Sel_entity(n)));
 740                 }
 741         } else if (is_Block(n)) {
 742                 nn = get_new_node (n);
 743                 nn->attr.block.irg = current_ir_graph;
 744         }
 745 }
 746
 747 /**
 748  * Walker: checks if P_value_arg_base is used.
 749  */
 750 static void find_addr(ir_node *node, void *env) {
 751         int *allow_inline = env;
 752         if (is_Proj(node) &&
 753                         is_Start(get_Proj_pred(node)) &&
 754                         get_Proj_proj(node) == pn_Start_P_value_arg_base) {
 755                 *allow_inline = 0;
 756         } else if (is_Alloc(node) && get_Alloc_where(node) == stack_alloc) {
 757                 /* From GCC:
 758                  * Refuse to inline alloca call unless user explicitly forced so as this
 759                  * may change program's memory overhead drastically when the function
 760                  * using alloca is called in loop.  In GCC present in SPEC2000 inlining
 761                  * into schedule_block cause it to require 2GB of ram instead of 256MB.
 762                  *
 763                  * Sorryly this is true with our implementation also.
 764                  * Moreover, we cannot differentiate between alloca() and VLA yet, so this
 765                  * disables inlining of functions using VLA (with are completely save).
 766                  *
 767                  * 2 Solutions:
 768                  * - add a flag to the Alloc node for "real" alloca() calls
 769                  * - add a new Stack-Restore node at the end of a function using alloca()
 770                  */
 771                 *allow_inline = 0;
 772         }
 773 }
 774
 775 /**
 776  * Check if we can inline a given call.
 777  * Currently, we cannot inline two cases:
 778  * - call with compound arguments
 779  * - graphs that take the address of a parameter
 780  *
 781  * check these conditions here
 782  */
 783 static int can_inline(ir_node *call, ir_graph *called_graph) {
 784         ir_type *call_type = get_Call_type(call);
 785         int params, ress, i, res;
 786         assert(is_Method_type(call_type));
 787
 788         params = get_method_n_params(call_type);
 789         ress   = get_method_n_ress(call_type);
 790
 791         /* check parameters for compound arguments */
 792         for (i = 0; i < params; ++i) {
 793                 ir_type *p_type = get_method_param_type(call_type, i);
 794
 795                 if (is_compound_type(p_type))
 796                         return 0;
 797         }
 798
 799         /* check results for compound arguments */
 800         for (i = 0; i < ress; ++i) {
 801                 ir_type *r_type = get_method_res_type(call_type, i);
 802
 803                 if (is_compound_type(r_type))
 804                         return 0;
 805         }
 806
 807         res = 1;
 808         irg_walk_graph(called_graph, find_addr, NULL, &res);
 809
 810         return res;
 811 }
 812
/**
 * How the exception control flow of a Call node is represented.
 * inline_method() derives the value from the Proj nodes it finds linked
 * to the Call (pn_Call_M_except / pn_Call_X_except).
 */
enum exc_mode {
        exc_handler    = 0, /**< There is a handler. */
        exc_to_end     = 1, /**< Branches to End. */
        exc_no_handler = 2  /**< Exception handling not represented. */
};
 818
/**
 * Inlines a method at the given call site.
 *
 * The body of called_graph is copied into the graph containing the Call
 * (by walking it with copy_node_inline()/copy_preds), the Call node is
 * turned into a Tuple collecting memory, results and control flow of the
 * inlined body, and the keep-alives of the copied End node are added to
 * the End node of the calling graph.
 *
 * Nothing is inlined (and 0 is returned) if
 *  - the callee's inline property is irg_inline_forbidden,
 *  - the callee is variadic and the number or the types of the parameters
 *    differ between the callee's type and the call type,
 *  - the callee expects more parameters than the call passes,
 *  - the call is recursive (called_graph is the graph of the call),
 *  - can_inline() rejects the call.
 *
 * The function walks the link list starting at the Call node and treats
 * every element as a Proj, so the caller has to provide that list
 * (inline_small_irgs() runs collect_phiprojs() beforehand).
 *
 * @param call          the Call node to replace
 * @param called_graph  the graph of the called method
 *
 * @return 1 if the call was inlined, 0 otherwise
 */
int inline_method(ir_node *call, ir_graph *called_graph) {
        ir_node             *pre_call;
        ir_node             *post_call, *post_bl;
        ir_node             *in[pn_Start_max];
        ir_node             *end, *end_bl;
        ir_node             **res_pred;
        ir_node             **cf_pred;
        ir_node             *ret, *phi;
        int                 arity, n_ret, n_exc, n_res, i, n, j, rem_opt, irn_arity;
        enum exc_mode       exc_handling;
        ir_type             *called_frame, *curr_frame;
        ir_entity           *ent;
        ir_graph            *rem, *irg;
        irg_inline_property prop = get_irg_inline_property(called_graph);

        if (prop == irg_inline_forbidden)
                return 0;

        ent = get_irg_entity(called_graph);

        /* Do not inline variadic functions. */
        if (get_method_variadicity(get_entity_type(ent)) == variadicity_variadic) {
                /* K&R functions are marked as variadic too, so check further. */
                ir_type *mtp     = get_entity_type(ent);
                ir_type *ctp     = get_Call_type(call);
                int     n_params = get_method_n_params(mtp);
                int     i;

                /* This is too strong, but probably ok. Function calls with a wrong number of
                   parameters should not be inlined. */
                if (n_params != get_method_n_params(ctp))
                        return 0;

                /* Check types: for K&R calls, this was not done by the compiler. Again, this is
                   too strong, but ok for now. */
                for (i = n_params - 1; i >= 0; --i) {
                        ir_type *param_tp = get_method_param_type(mtp, i);
                        ir_type *arg_tp   = get_method_param_type(ctp, i);

                        if (param_tp != arg_tp)
                                return 0;
                }
                DB((dbg, LEVEL_1, "Inlining allowed for variadic function %+F\n", called_graph));
                /* Types match, fine: if the frame is accessed, the inliner stops at can_inline(). */
        }

        if (get_method_n_params(get_entity_type(ent)) > get_method_n_params(get_Call_type(call))) {
                /* This is a bad feature of C: without a prototype, we can call a function with fewer
                   parameters than needed. Currently we don't support this, although it would be
                   possible to use Unknown then. */
                return 0;
        }

        irg = get_irn_irg(call);

        /*
         * We cannot inline a recursive call. The graph must be copied before
         * the call to inline_method() using create_irg_copy().
         */
        if (called_graph == irg)
                return 0;

        /*
         * Currently, we cannot inline two cases:
         * - call with compound arguments
         * - graphs that take the address of a parameter
         */
        if (! can_inline(call, called_graph))
                return 0;

        /* From here on new nodes are constructed in the graph of the call. */
        rem = current_ir_graph;
        current_ir_graph = irg;

        DB((dbg, LEVEL_1, "Inlining %+F(%+F) into %+F\n", call, called_graph, irg));

        /* --  Turn off optimizations, this can cause problems when allocating new nodes. -- */
        rem_opt = get_opt_optimize();
        set_optimize(0);

        /* Handle graph state: the analysis information of irg is invalidated. */
        assert(get_irg_phase_state(irg) != phase_building);
        assert(get_irg_pinned(irg) == op_pin_state_pinned);
        assert(get_irg_pinned(called_graph) == op_pin_state_pinned);
        set_irg_outs_inconsistent(irg);
        set_irg_extblk_inconsistent(irg);
        set_irg_doms_inconsistent(irg);
        set_irg_loopinfo_inconsistent(irg);
        set_irg_callee_info_state(irg, irg_callee_info_inconsistent);

        /* -- Check preconditions -- */
        assert(is_Call(call));

        /* Here we know we WILL inline, so inform the statistics. */
        hook_inline(call, called_graph);

        /* -- Decide how to handle exception control flow: Is there a handler
           for the Call node, or do we branch directly to End on an exception?
           exc_handling:
           exc_handler    There is a handler.
           exc_to_end     Branches to End.
           exc_no_handler Exception handling not represented in Firm. -- */
        {
                ir_node *proj, *Mproj = NULL, *Xproj = NULL;
                /* Scan the link list of the Call for its exception Projs. */
                for (proj = get_irn_link(call); proj; proj = get_irn_link(proj)) {
                        long proj_nr = get_Proj_proj(proj);
                        if (proj_nr == pn_Call_X_except) Xproj = proj;
                        if (proj_nr == pn_Call_M_except) Mproj = proj;
                }
                if      (Mproj) { assert(Xproj); exc_handling = exc_handler; } /*  Mproj (implies Xproj) */
                else if (Xproj) {                exc_handling = exc_to_end; } /* !Mproj &&  Xproj */
                else            {                exc_handling = exc_no_handler; } /* !Mproj && !Xproj */
        }

        /* --
           Create pre_call and post_call: pre_call is a Tuple built from the
           inputs of the Call; it replaces the Start node of the called graph
           (it is stored in the link field of that Start node below).
           Post_call is the old Call node and collects the results of the called
           graph. Both will end up being a tuple.  -- */
        post_bl = get_nodes_block(call);
        set_irg_current_block(irg, post_bl);
        /* XxMxPxPxPxT of Start + parameter of Call */
        in[pn_Start_X_initial_exec]   = new_Jmp();
        in[pn_Start_M]                = get_Call_mem(call);
        in[pn_Start_P_frame_base]     = get_irg_frame(irg);
        in[pn_Start_P_tls]            = get_irg_tls(irg);
        in[pn_Start_T_args]           = new_Tuple(get_Call_n_params(call), get_Call_param_arr(call));
        /* in[pn_Start_P_value_arg_base] = ??? */
        /* The Tuple below omits the last Start output; the assert makes sure
           that this omitted output is pn_Start_P_value_arg_base. */
        assert(pn_Start_P_value_arg_base == pn_Start_max - 1 && "pn_Start_P_value_arg_base not supported, fix");
        pre_call = new_Tuple(pn_Start_max - 1, in);
        post_call = call;

        /* --
           The new block gets the ins of the old block, pre_call and all its
           predecessors and all Phi nodes. -- */
        part_block(pre_call);

        /* -- Prepare state for dead node elimination -- */
        /* Visited flags in calling irg must be >= flag in called irg.
           Else walker and arity computation will not work. */
        if (get_irg_visited(irg) <= get_irg_visited(called_graph))
                set_irg_visited(irg, get_irg_visited(called_graph)+1);
        if (get_irg_block_visited(irg) < get_irg_block_visited(called_graph))
                set_irg_block_visited(irg, get_irg_block_visited(called_graph));
        /* Set pre_call as new Start node in link field of the start node of
           the called graph and pre_call's block as new block for the start block
           of the called graph. The Bad node of the called graph is mapped to
           the Bad node of the calling graph.
           Further mark these nodes so that they are not visited by the
           copying. */
        set_irn_link(get_irg_start(called_graph), pre_call);
        set_irn_visited(get_irg_start(called_graph), get_irg_visited(irg));
        set_irn_link(get_irg_start_block(called_graph), get_nodes_block(pre_call));
        set_irn_visited(get_irg_start_block(called_graph), get_irg_visited(irg));
        set_irn_link(get_irg_bad(called_graph), get_irg_bad(irg));
        set_irn_visited(get_irg_bad(called_graph), get_irg_visited(irg));

        /* Initialize for compaction of in arrays */
        inc_irg_block_visited(irg);

        /* -- Replicate local entities of the called_graph -- */
        /* Copy the entities; every old entity gets its copy in the link field,
           where copy_node_inline() looks it up. */
        called_frame = get_irg_frame_type(called_graph);
        curr_frame   = get_irg_frame_type(irg);
        for (i = 0, n = get_class_n_members(called_frame); i < n; ++i) {
                ir_entity *new_ent, *old_ent;
                old_ent = get_class_member(called_frame, i);
                new_ent = copy_entity_own(old_ent, curr_frame);
                set_entity_link(old_ent, new_ent);
        }

        /* visited is > than that of called graph.  With this trick visited will
           remain unchanged so that an outer walker, e.g., searching the call nodes
            to inline, calling this inline will not visit the inlined nodes. */
        set_irg_visited(irg, get_irg_visited(irg)-1);

        /* -- Performing dead node elimination inlines the graph -- */
        /* Copies the nodes to the obstack of current_ir_graph. Updates links to new
           entities. */
        irg_walk(get_irg_end(called_graph), copy_node_inline, copy_preds,
                 get_irg_frame_type(called_graph));

        /* Repair called_graph */
        set_irg_visited(called_graph, get_irg_visited(irg));
        set_irg_block_visited(called_graph, get_irg_block_visited(irg));
        set_Block_block_visited(get_irg_start_block(called_graph), 0);

        /* -- Merge the end of the inlined procedure with the call site -- */
        /* We will turn the old Call node into a Tuple with the following
           predecessors:
           -1:  Block of Tuple.
           0: Phi of all Memories of Return statements.
           1: Jmp from new Block that merges the control flow from all exception
           predecessors of the old end block.
           2: Tuple of all arguments.
           3: Phi of Exception memories.
           In case the old Call directly branches to End on an exception we don't
           need the block merging all exceptions nor the Phi of the exception
           memories.
           (The code below addresses the Tuple inputs through the pn_Call_*
           constants.)
        */

        /* -- Precompute some values -- */
        end_bl = get_new_node(get_irg_end_block(called_graph));
        end = get_new_node(get_irg_end(called_graph));
        arity = get_irn_arity(end_bl);    /* arity = n_exc + n_ret  */
        n_res = get_method_n_ress(get_Call_type(call));

        /* Scratch arrays: res_pred holds one node per result, cf_pred is reused
           for every predecessor list built below (at most arity entries).
           NOTE(review): the cf_pred size is computed with sizeof(*res_pred);
           both element types are ir_node *, so the size is the same. */
        res_pred = xmalloc(n_res * sizeof(*res_pred));
        cf_pred  = xmalloc(arity * sizeof(*res_pred));

        set_irg_current_block(irg, post_bl); /* just to make sure */

        /* -- archive keepalives -- */
        /* Move all non-Bad keep-alives of the copied End node to the End node
           of the calling graph. */
        irn_arity = get_irn_arity(end);
        for (i = 0; i < irn_arity; i++) {
                ir_node *ka = get_End_keepalive(end, i);
                if (! is_Bad(ka))
                        add_End_keepalive(get_irg_end(irg), ka);
        }

        /* The new end node will die.  We need not free as the in array is on the obstack:
           copy_node() only generated 'D' arrays. */

        /* -- Replace Return nodes by Jump nodes. -- */
        n_ret = 0;
        for (i = 0; i < arity; i++) {
                ir_node *ret;
                ret = get_irn_n(end_bl, i);
                if (is_Return(ret)) {
                        cf_pred[n_ret] = new_r_Jmp(irg, get_nodes_block(ret));
                        n_ret++;
                }
        }
        /* The Jmps become the control flow predecessors of the block of the Call. */
        set_irn_in(post_bl, n_ret, cf_pred);

        /* -- Build a Tuple for all results of the method.
           Add Phi node if there was more than one Return.  -- */
        turn_into_tuple(post_call, pn_Call_max);
        /* First the Memory-Phi */
        n_ret = 0;
        for (i = 0; i < arity; i++) {
                ret = get_irn_n(end_bl, i);
                if (is_Return(ret)) {
                        cf_pred[n_ret] = get_Return_mem(ret);
                        n_ret++;
                }
        }
        phi = new_Phi(n_ret, cf_pred, mode_M);
        set_Tuple_pred(call, pn_Call_M_regular, phi);
        /* Conserve Phi-list for further inlinings -- but might be optimized.
           NOTE(review): this Phi is chained through the link fields, whereas the
           result Phis below use set_Phi_next()/set_Block_phis() -- confirm that
           this difference is intended. */
        if (get_nodes_block(phi) == post_bl) {
                set_irn_link(phi, get_irn_link(post_bl));
                set_irn_link(post_bl, phi);
        }
        /* Now the real results */
        if (n_res > 0) {
                for (j = 0; j < n_res; j++) {
                        /* collect result j of every Return */
                        n_ret = 0;
                        for (i = 0; i < arity; i++) {
                                ret = get_irn_n(end_bl, i);
                                if (is_Return(ret)) {
                                        cf_pred[n_ret] = get_Return_res(ret, j);
                                        n_ret++;
                                }
                        }
                        /* without any Return there is no value: use Bad */
                        if (n_ret > 0)
                                phi = new_Phi(n_ret, cf_pred, get_irn_mode(cf_pred[0]));
                        else
                                phi = new_Bad();
                        res_pred[j] = phi;
                        /* Conserve Phi-list for further inlinings -- but might be optimized */
                        if (get_nodes_block(phi) == post_bl) {
                                set_Phi_next(phi, get_Block_phis(post_bl));
                                set_Block_phis(post_bl, phi);
                        }
                }
                set_Tuple_pred(call, pn_Call_T_result, new_Tuple(n_res, res_pred));
        } else {
                set_Tuple_pred(call, pn_Call_T_result, new_Bad());
        }
        /* handle the regular call */
        set_Tuple_pred(call, pn_Call_X_regular, new_Jmp());

        /* For now, we cannot inline calls with value_base */
        set_Tuple_pred(call, pn_Call_P_value_res_base, new_Bad());

        /* Finally the exception control flow.
           We have two (three) possible situations:
           First if the Call branches to an exception handler: We need to add a Phi node to
           collect the memory containing the exception objects.  Further we need
           to add another block to get a correct representation of this Phi.  To
           this block we add a Jmp that resolves into the X output of the Call
           when the Call is turned into a tuple.
           Second the Call branches to End, the exception is not handled.  Just
           add all inlined exception branches to the End node.
           Third: there is no Exception edge at all. Handle as case two. */
        if (exc_handling == exc_handler) {
                /* collect the exceptional control flow predecessors of the copied end block */
                n_exc = 0;
                for (i = 0; i < arity; i++) {
                        ir_node *ret, *irn;
                        ret = get_irn_n(end_bl, i);
                        irn = skip_Proj(ret);
                        if (is_fragile_op(irn) || is_Raise(irn)) {
                                cf_pred[n_exc] = ret;
                                ++n_exc;
                        }
                }
                if (n_exc > 0) {
                        new_Block(n_exc, cf_pred);      /* watch it: current_block is changed! */
                        set_Tuple_pred(call, pn_Call_X_except, new_Jmp());
                        /* The Phi for the memories with the exception objects */
                        /* NOTE(review): the Proj numbers 3, 0 and 1 below are hard-coded;
                           presumably they are the memory outputs of Call, of the other
                           fragile ops and of Raise -- confirm against the pn_* enums. */
                        n_exc = 0;
                        for (i = 0; i < arity; i++) {
                                ir_node *ret;
                                ret = skip_Proj(get_irn_n(end_bl, i));
                                if (is_Call(ret)) {
                                        cf_pred[n_exc] = new_r_Proj(irg, get_nodes_block(ret), ret, mode_M, 3);
                                        n_exc++;
                                } else if (is_fragile_op(ret)) {
                                        /* We rely that all cfops have the memory output at the same position. */
                                        cf_pred[n_exc] = new_r_Proj(irg, get_nodes_block(ret), ret, mode_M, 0);
                                        n_exc++;
                                } else if (is_Raise(ret)) {
                                        cf_pred[n_exc] = new_r_Proj(irg, get_nodes_block(ret), ret, mode_M, 1);
                                        n_exc++;
                                }
                        }
                        set_Tuple_pred(call, pn_Call_M_except, new_Phi(n_exc, cf_pred, mode_M));
                } else {
                        /* the inlined body has no exceptional exits */
                        set_Tuple_pred(call, pn_Call_X_except, new_Bad());
                        set_Tuple_pred(call, pn_Call_M_except, new_Bad());
                }
        } else {
                ir_node *main_end_bl;
                int main_end_bl_arity;
                ir_node **end_preds;

                /* assert(exc_handling == 1 || no exceptions. ) */
                n_exc = 0;
                for (i = 0; i < arity; i++) {
                        ir_node *ret = get_irn_n(end_bl, i);
                        ir_node *irn = skip_Proj(ret);

                        if (is_fragile_op(irn) || is_Raise(irn)) {
                                cf_pred[n_exc] = ret;
                                n_exc++;
                        }
                }
                /* Append the exceptional exits of the inlined body to the
                   predecessors of the end block of the calling graph. */
                main_end_bl = get_irg_end_block(irg);
                main_end_bl_arity = get_irn_arity(main_end_bl);
                end_preds =  xmalloc((n_exc + main_end_bl_arity) * sizeof(*end_preds));

                for (i = 0; i < main_end_bl_arity; ++i)
                        end_preds[i] = get_irn_n(main_end_bl, i);
                for (i = 0; i < n_exc; ++i)
                        end_preds[main_end_bl_arity + i] = cf_pred[i];
                set_irn_in(main_end_bl, n_exc + main_end_bl_arity, end_preds);
                set_Tuple_pred(call, pn_Call_X_except,  new_Bad());
                set_Tuple_pred(call, pn_Call_M_except,  new_Bad());
                free(end_preds);
        }
        free(res_pred);
        free(cf_pred);

        /* --  Restore the optimization flag and the current graph. -- */
        set_optimize(rem_opt);
        current_ir_graph = rem;

        return 1;
}
1187
1188 /********************************************************************/
/* Apply inlining to small methods.                                 */
1190 /********************************************************************/
1191
/** Obstack on which the inline environments (inline_irg_env) and the
 *  call entries collected by collect_calls2()/append_call_list() are
 *  allocated. */
static struct obstack  temp_obst;
1193
/**
 * Represents a possibly inlinable call in a graph.
 * Entries are chained into singly linked lists through the next field.
 */
typedef struct _call_entry call_entry;
struct _call_entry {
        ir_node    *call;      /**< the Call node */
        ir_graph   *callee;    /**< the callee IR-graph called here */
        call_entry *next;      /**< for linking the next one, NULL at the end of the list */
        int        loop_depth; /**< the loop depth of this call */
};
1202
/**
 * Environment for inlining small irgs: the list of calls gathered by the
 * walker collect_calls() together with the obstack that holds its entries.
 */
typedef struct _inline_env_t {
        struct obstack obst;  /**< an obstack where call_entries are allocated on. */
        call_entry *head;     /**< the head of the call entry list, NULL if the list is empty */
        call_entry *tail;     /**< the tail of the call entry list, NULL if the list is empty */
} inline_env_t;
1211
1212 /**
1213  * Returns the irg called from a Call node. If the irg is not
1214  * known, NULL is returned.
1215  *
1216  * @param call  the call node
1217  */
1218 static ir_graph *get_call_called_irg(ir_node *call) {
1219         ir_node *addr;
1220
1221         addr = get_Call_ptr(call);
1222         if (is_Global(addr)) {
1223                 ir_entity *ent = get_Global_entity(addr);
1224                 return get_entity_irg(ent);
1225         }
1226
1227         return NULL;
1228 }
1229
1230 /**
1231  * Walker: Collect all calls to known graphs inside a graph.
1232  */
1233 static void collect_calls(ir_node *call, void *env) {
1234         if (is_Call(call)) {
1235                 ir_graph *called_irg = get_call_called_irg(call);
1236
1237                 if (called_irg != NULL) {
1238                         /* The Call node calls a locally defined method.  Remember to inline. */
1239                         inline_env_t *ienv  = env;
1240                         call_entry   *entry = obstack_alloc(&ienv->obst, sizeof(*entry));
1241                         entry->call       = call;
1242                         entry->callee     = called_irg;
1243                         entry->next       = NULL;
1244                         entry->loop_depth = 0;
1245
1246                         if (ienv->tail == NULL)
1247                                 ienv->head = entry;
1248                         else
1249                                 ienv->tail->next = entry;
1250                         ienv->tail = entry;
1251                 }
1252         }
1253 }
1254
1255 /**
1256  * Inlines all small methods at call sites where the called address comes
1257  * from a Const node that references the entity representing the called
1258  * method.
1259  * The size argument is a rough measure for the code size of the method:
1260  * Methods where the obstack containing the firm graph is smaller than
1261  * size are inlined.
1262  */
1263 void inline_small_irgs(ir_graph *irg, int size) {
1264         ir_graph *rem = current_ir_graph;
1265         inline_env_t env;
1266         call_entry *entry;
1267
1268         current_ir_graph = irg;
1269         /* Handle graph state */
1270         assert(get_irg_phase_state(irg) != phase_building);
1271         free_callee_info(irg);
1272
1273         /* Find Call nodes to inline.
1274            (We can not inline during a walk of the graph, as inlineing the same
1275            method several times changes the visited flag of the walked graph:
1276            after the first inlineing visited of the callee equals visited of
1277            the caller.  With the next inlineing both are increased.) */
1278         obstack_init(&env.obst);
1279         env.head = env.tail = NULL;
1280         irg_walk_graph(irg, NULL, collect_calls, &env);
1281
1282         if (env.head != NULL) {
1283                 /* There are calls to inline */
1284                 collect_phiprojs(irg);
1285                 for (entry = env.head; entry != NULL; entry = entry->next) {
1286                         ir_graph *callee = entry->callee;
1287                         if (((_obstack_memory_used(callee->obst) - (int)obstack_room(callee->obst)) < size) ||
1288                             (get_irg_inline_property(callee) >= irg_inline_forced)) {
1289                                 inline_method(entry->call, callee);
1290                         }
1291                 }
1292         }
1293         obstack_free(&env.obst, NULL);
1294         current_ir_graph = rem;
1295 }
1296
/**
 * Environment for inlining irgs; one is allocated per graph by
 * alloc_inline_irg_env() and filled by the walker collect_calls2().
 */
typedef struct {
        int n_nodes;             /**< Number of nodes in the graph; collect_calls2() skips Proj, Tuple, Sync and Block
                                      nodes, the counter starts at -2 to discount Start and End. */
        int n_blocks;            /**< Number of Blocks in graph without Start and End block. */
        int n_nodes_orig;        /**< for statistics */
        int n_call_nodes;        /**< Number of Call nodes in the graph. */
        int n_call_nodes_orig;   /**< for statistics */
        int n_callers;           /**< Number of collected Call nodes with a known callee that call this graph. */
        int n_callers_orig;      /**< for statistics */
        unsigned got_inline:1;   /**< Set, if at least one call inside this graph was inlined. */
        unsigned local_vars:1;   /**< Set, if an inlined function gets the address of an inlined variable. */
        unsigned recursive:1;    /**< Set, if this function is self recursive. */
        call_entry *call_head;   /**< The head of the list of all call nodes in this graph. */
        call_entry *call_tail;   /**< The tail of the list of all call nodes in this graph. */
        unsigned *local_weights; /**< Once allocated, the beneficial weight for transmitting local addresses. */
} inline_irg_env;
1315
1316 /**
1317  * Allocate a new environment for inlining.
1318  */
1319 static inline_irg_env *alloc_inline_irg_env(void) {
1320         inline_irg_env *env    = obstack_alloc(&temp_obst, sizeof(*env));
1321         env->n_nodes           = -2; /* do not count count Start, End */
1322         env->n_blocks          = -2; /* do not count count Start, End Block */
1323         env->n_nodes_orig      = -2; /* do not count Start, End */
1324         env->call_head         = NULL;
1325         env->call_tail         = NULL;
1326         env->n_call_nodes      = 0;
1327         env->n_call_nodes_orig = 0;
1328         env->n_callers         = 0;
1329         env->n_callers_orig    = 0;
1330         env->got_inline        = 0;
1331         env->local_vars        = 0;
1332         env->recursive         = 0;
1333         env->local_weights     = NULL;
1334         return env;
1335 }
1336
/**
 * Environment handed to the walker collect_calls2().
 */
typedef struct walker_env {
        inline_irg_env *x;     /**< the inline environment */
        call_entry *last_call; /**< points to the last inserted call */
        char ignore_runtime;   /**< if set, calls to entities with mtp_property_runtime are not collected */
        char ignore_callers;   /**< if set, do NOT change the caller counters of the callees */
} wenv_t;
1343
1344 /**
1345  * post-walker: collect all calls in the inline-environment
1346  * of a graph and sum some statistics.
1347  */
1348 static void collect_calls2(ir_node *call, void *ctx) {
1349         wenv_t         *env = ctx;
1350         inline_irg_env *x = env->x;
1351         ir_opcode      code = get_irn_opcode(call);
1352         ir_graph       *callee;
1353         call_entry     *entry;
1354
1355         /* count meaningful nodes in irg */
1356         if (code != iro_Proj && code != iro_Tuple && code != iro_Sync) {
1357                 if (code != iro_Block) {
1358                         ++x->n_nodes;
1359                         ++x->n_nodes_orig;
1360                 } else {
1361                         ++x->n_blocks;
1362                 }
1363         }
1364
1365         if (code != iro_Call) return;
1366
1367         /* check, if it's a runtime call */
1368         if (env->ignore_runtime) {
1369                 ir_node *symc = get_Call_ptr(call);
1370
1371                 if (is_Global(symc)) {
1372                         ir_entity *ent = get_Global_entity(symc);
1373
1374                         if (get_entity_additional_properties(ent) & mtp_property_runtime)
1375                                 return;
1376                 }
1377         }
1378
1379         /* collect all call nodes */
1380         ++x->n_call_nodes;
1381         ++x->n_call_nodes_orig;
1382
1383         callee = get_call_called_irg(call);
1384         if (callee != NULL) {
1385                 if (! env->ignore_callers) {
1386                         inline_irg_env *callee_env = get_irg_link(callee);
1387                         /* count all static callers */
1388                         ++callee_env->n_callers;
1389                         ++callee_env->n_callers_orig;
1390                 }
1391                 if (callee == current_ir_graph)
1392                         x->recursive = 1;
1393
1394                 /* link it in the list of possible inlinable entries */
1395                 entry = obstack_alloc(&temp_obst, sizeof(*entry));
1396                 entry->call       = call;
1397                 entry->callee     = callee;
1398                 entry->next       = NULL;
1399                 entry->loop_depth = get_irn_loop(get_nodes_block(call))->depth;
1400
1401                 /* note: we use call_tail here as a pointer to the last inserted */
1402                 if (x->call_head == NULL) {
1403                         x->call_head = entry;
1404                 } else {
1405                         if (entry->loop_depth == env->last_call->loop_depth) {
1406                                 /* same depth as the last one, enqueue after it */
1407                                 entry->next          = env->last_call->next;
1408                                 env->last_call->next = entry;
1409                         } else if (entry->loop_depth > x->call_head->loop_depth) {
1410                                 /* put first */
1411                                 entry->next  = x->call_head;
1412                                 x->call_head = entry;
1413                         } else {
1414                                 /* search the insertion point */
1415                                 call_entry *p;
1416
1417                                 for (p = x->call_head; p->next != NULL; p = p->next)
1418                                         if (entry->loop_depth > p->next->loop_depth)
1419                                                 break;
1420                                 entry->next = p->next;
1421                                 p->next     = entry;
1422                         }
1423                 }
1424                 env->last_call = entry;
1425                 if (entry->next == NULL) {
1426                         /* keep tail up to date */
1427                         x->call_tail = entry;
1428                 }
1429         }
1430 }
1431
1432 /**
1433  * Returns TRUE if the number of callers is 0 in the irg's environment,
1434  * hence this irg is a leave.
1435  */
1436 INLINE static int is_leave(ir_graph *irg) {
1437         inline_irg_env *env = get_irg_link(irg);
1438         return env->n_call_nodes == 0;
1439 }
1440
1441 /**
1442  * Returns TRUE if the number of nodes in the callee is
1443  * smaller then size in the irg's environment.
1444  */
1445 INLINE static int is_smaller(ir_graph *callee, int size) {
1446         inline_irg_env *env = get_irg_link(callee);
1447         return env->n_nodes < size;
1448 }
1449
1450 /**
1451  * Append the nodes of the list src to the nodes of the list in environment dst.
1452  */
1453 static void append_call_list(inline_irg_env *dst, call_entry *src) {
1454         call_entry *entry, *nentry;
1455
1456         /* Note that the src list points to Call nodes in the inlined graph, but
1457            we need Call nodes in our graph. Luckily the inliner leaves this information
1458            in the link field. */
1459         for (entry = src; entry != NULL; entry = entry->next) {
1460                 nentry = obstack_alloc(&temp_obst, sizeof(*nentry));
1461                 nentry->call         = get_irn_link(entry->call);
1462                 nentry->callee       = entry->callee;
1463                 nentry->next         = NULL;
1464                 nentry->loop_depth   = entry->loop_depth;
1465                 dst->call_tail->next = nentry;
1466                 dst->call_tail       = nentry;
1467         }
1468 }
1469
1470 /**
1471  * Add the nodes of the list src in front to the nodes of the list dst.
1472  */
1473 static call_entry *replace_entry_by_call_list(call_entry *dst, call_entry *src) {
1474         call_entry *entry, *nentry, *head, *tail;
1475
1476         /* Note that the src list points to Call nodes in the inlined graph, but
1477            we need Call nodes in our graph. Luckily the inliner leaves this information
1478            in the link field. */
1479         head = tail = NULL;
1480         for (entry = src; entry != NULL; entry = entry->next) {
1481                 nentry = obstack_alloc(&temp_obst, sizeof(*nentry));
1482                 nentry->call         = get_irn_link(entry->call);
1483                 nentry->callee       = entry->callee;
1484                 nentry->next         = NULL;
1485                 nentry->loop_depth   = entry->loop_depth + dst->loop_depth;
1486                 if (head == NULL)
1487                         head = nentry;
1488                 else
1489                         tail->next = nentry;
1490                 tail = nentry;
1491         }
1492         /* skip the head of dst */
1493         if (head != NULL) {
1494                 tail->next = dst->next;
1495         } else {
1496                 head = dst->next;
1497         }
1498         return head;
1499 }
1500
1501 /*
1502  * Inlines small leave methods at call sites where the called address comes
1503  * from a Const node that references the entity representing the called
1504  * method.
1505  * The size argument is a rough measure for the code size of the method:
1506  * Methods where the obstack containing the firm graph is smaller than
1507  * size are inlined.
1508  */
1509 void inline_leave_functions(int maxsize, int leavesize, int size, int ignore_runtime) {
1510         inline_irg_env   *env;
1511         ir_graph         *irg;
1512         int              i, n_irgs;
1513         ir_graph         *rem;
1514         int              did_inline;
1515         wenv_t           wenv;
1516         call_entry       *entry, *tail;
1517         const call_entry *centry;
1518         pmap             *copied_graphs;
1519         pmap_entry       *pm_entry;
1520
1521         rem = current_ir_graph;
1522         obstack_init(&temp_obst);
1523
1524         /* a map for the copied graphs, used to inline recursive calls */
1525         copied_graphs = pmap_create();
1526
1527         /* extend all irgs by a temporary data structure for inlining. */
1528         n_irgs = get_irp_n_irgs();
1529         for (i = 0; i < n_irgs; ++i)
1530                 set_irg_link(get_irp_irg(i), alloc_inline_irg_env());
1531
1532         /* Precompute information in temporary data structure. */
1533         wenv.ignore_runtime = ignore_runtime;
1534         wenv.ignore_callers = 0;
1535         for (i = 0; i < n_irgs; ++i) {
1536                 ir_graph *irg = get_irp_irg(i);
1537
1538                 assert(get_irg_phase_state(irg) != phase_building);
1539                 free_callee_info(irg);
1540
1541                 assure_cf_loop(irg);
1542                 wenv.x = get_irg_link(irg);
1543                 irg_walk_graph(irg, NULL, collect_calls2, &wenv);
1544         }
1545
1546         /* -- and now inline. -- */
1547
1548         /* Inline leaves recursively -- we might construct new leaves. */
1549         do {
1550                 did_inline = 0;
1551
1552                 for (i = 0; i < n_irgs; ++i) {
1553                         ir_node *call;
1554                         int phiproj_computed = 0;
1555
1556                         current_ir_graph = get_irp_irg(i);
1557                         env = (inline_irg_env *)get_irg_link(current_ir_graph);
1558
1559                         tail = NULL;
1560                         for (entry = env->call_head; entry != NULL; entry = entry->next) {
1561                                 ir_graph *callee;
1562
1563                                 if (env->n_nodes > maxsize) break;
1564
1565                                 call   = entry->call;
1566                                 callee = entry->callee;
1567
1568                                 if (is_leave(callee) && (
1569                                     is_smaller(callee, leavesize) || (get_irg_inline_property(callee) >= irg_inline_forced))) {
1570                                         if (!phiproj_computed) {
1571                                                 phiproj_computed = 1;
1572                                                 collect_phiprojs(current_ir_graph);
1573                                         }
1574                                         did_inline = inline_method(call, callee);
1575
1576                                         if (did_inline) {
1577                                                 inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
1578
1579                                                 /* was inlined, must be recomputed */
1580                                                 phiproj_computed = 0;
1581
1582                                                 /* Do some statistics */
1583                                                 env->got_inline = 1;
1584                                                 --env->n_call_nodes;
1585                                                 env->n_nodes += callee_env->n_nodes;
1586                                                 --callee_env->n_callers;
1587
1588                                                 /* remove this call from the list */
1589                                                 if (tail != NULL)
1590                                                         tail->next = entry->next;
1591                                                 else
1592                                                         env->call_head = entry->next;
1593                                                 continue;
1594                                         }
1595                                 }
1596                                 tail = entry;
1597                         }
1598                         env->call_tail = tail;
1599                 }
1600         } while (did_inline);
1601
1602         /* inline other small functions. */
1603         for (i = 0; i < n_irgs; ++i) {
1604                 ir_node *call;
1605                 int phiproj_computed = 0;
1606
1607                 current_ir_graph = get_irp_irg(i);
1608                 env = (inline_irg_env *)get_irg_link(current_ir_graph);
1609
1610                 /* note that the list of possible calls is updated during the process */
1611                 tail = NULL;
1612                 for (entry = env->call_head; entry != NULL; entry = entry->next) {
1613                         ir_graph   *callee;
1614                         pmap_entry *e;
1615
1616                         call   = entry->call;
1617                         callee = entry->callee;
1618
1619                         e = pmap_find(copied_graphs, callee);
1620                         if (e != NULL) {
1621                                 /*
1622                                  * Remap callee if we have a copy.
1623                                  * FIXME: Should we do this only for recursive Calls ?
1624                                  */
1625                                 callee = e->value;
1626                         }
1627
1628                         if (((is_smaller(callee, size) && (env->n_nodes < maxsize)) ||    /* small function */
1629                                 (get_irg_inline_property(callee) >= irg_inline_forced))) {
1630                                 if (current_ir_graph == callee) {
1631                                         /*
1632                                          * Recursive call: we cannot directly inline because we cannot walk
1633                                          * the graph and change it. So we have to make a copy of the graph
1634                                          * first.
1635                                          */
1636
1637                                         inline_irg_env *callee_env;
1638                                         ir_graph       *copy;
1639
1640                                         /*
1641                                          * No copy yet, create one.
1642                                          * Note that recursive methods are never leaves, so it is sufficient
1643                                          * to test this condition here.
1644                                          */
1645                                         copy = create_irg_copy(callee);
1646
1647                                         /* create_irg_copy() destroys the Proj links, recompute them */
1648                                         phiproj_computed = 0;
1649
1650                                         /* allocate new environment */
1651                                         callee_env = alloc_inline_irg_env();
1652                                         set_irg_link(copy, callee_env);
1653
1654                                         assure_cf_loop(copy);
1655                                         wenv.x              = callee_env;
1656                                         wenv.ignore_callers = 1;
1657                                         irg_walk_graph(copy, NULL, collect_calls2, &wenv);
1658
1659                                         /*
1660                                          * Enter the entity of the original graph. This is needed
1661                                          * for inline_method(). However, note that ent->irg still points
1662                                          * to callee, NOT to copy.
1663                                          */
1664                                         set_irg_entity(copy, get_irg_entity(callee));
1665
1666                                         pmap_insert(copied_graphs, callee, copy);
1667                                         callee = copy;
1668
1669                                         /* we have only one caller: the original graph */
1670                                         callee_env->n_callers      = 1;
1671                                         callee_env->n_callers_orig = 1;
1672                                 }
1673                                 if (! phiproj_computed) {
1674                                         phiproj_computed = 1;
1675                                         collect_phiprojs(current_ir_graph);
1676                                 }
1677                                 did_inline = inline_method(call, callee);
1678                                 if (did_inline) {
1679                                         inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
1680
1681                                         /* was inlined, must be recomputed */
1682                                         phiproj_computed = 0;
1683
1684                                         /* callee was inline. Append it's call list. */
1685                                         env->got_inline = 1;
1686                                         --env->n_call_nodes;
1687                                         append_call_list(env, callee_env->call_head);
1688                                         env->n_call_nodes += callee_env->n_call_nodes;
1689                                         env->n_nodes += callee_env->n_nodes;
1690                                         --callee_env->n_callers;
1691
1692                                         /* after we have inlined callee, all called methods inside callee
1693                                            are now called once more */
1694                                         for (centry = callee_env->call_head; centry != NULL; centry = centry->next) {
1695                                                 inline_irg_env *penv = get_irg_link(centry->callee);
1696                                                 ++penv->n_callers;
1697                                         }
1698
1699                                         /* remove this call from the list */
1700                                         if (tail != NULL)
1701                                                 tail->next = entry->next;
1702                                         else
1703                                                 env->call_head = entry->next;
1704                                         continue;
1705                                 }
1706                         }
1707                         tail = entry;
1708                 }
1709                 env->call_tail = tail;
1710         }
1711
1712         for (i = 0; i < n_irgs; ++i) {
1713                 irg = get_irp_irg(i);
1714                 env = (inline_irg_env *)get_irg_link(irg);
1715
1716                 if (env->got_inline) {
1717                         optimize_graph_df(irg);
1718                         optimize_cf(irg);
1719                 }
1720                 if (env->got_inline || (env->n_callers_orig != env->n_callers)) {
1721                         DB((dbg, LEVEL_1, "Nodes:%3d ->%3d, calls:%3d ->%3d, callers:%3d ->%3d, -- %s\n",
1722                         env->n_nodes_orig, env->n_nodes, env->n_call_nodes_orig, env->n_call_nodes,
1723                         env->n_callers_orig, env->n_callers,
1724                         get_entity_name(get_irg_entity(irg))));
1725                 }
1726         }
1727
1728         /* kill the copied graphs: we don't need them anymore */
1729         foreach_pmap(copied_graphs, pm_entry) {
1730                 ir_graph *copy = pm_entry->value;
1731
1732                 /* reset the entity, otherwise it will be deleted in the next step ... */
1733                 set_irg_entity(copy, NULL);
1734                 free_ir_graph(copy);
1735         }
1736         pmap_destroy(copied_graphs);
1737
1738         obstack_free(&temp_obst, NULL);
1739         current_ir_graph = rem;
1740 }
1741
1742 /**
1743  * Calculate the parameter weights for transmitting the address of a local variable.
1744  */
1745 static unsigned calc_method_local_weight(ir_node *arg) {
1746         int      i, j, k;
1747         unsigned v, weight = 0;
1748
1749         for (i = get_irn_n_outs(arg) - 1; i >= 0; --i) {
1750                 ir_node *succ = get_irn_out(arg, i);
1751
1752                 switch (get_irn_opcode(succ)) {
1753                 case iro_Load:
1754                 case iro_Store:
1755                         /* Loads and Store can be removed */
1756                         weight += 3;
1757                         break;
1758                 case iro_Sel:
1759                         /* check if all args are constant */
1760                         for (j = get_Sel_n_indexs(succ) - 1; j >= 0; --j) {
1761                                 ir_node *idx = get_Sel_index(succ, j);
1762                                 if (! is_Const(idx))
1763                                         return 0;
1764                         }
1765                         /* Check users on this Sel. Note: if a 0 is returned here, there was
1766                            some unsupported node. */
1767                         v = calc_method_local_weight(succ);
1768                         if (v == 0)
1769                                 return 0;
1770                         /* we can kill one Sel with constant indexes, this is cheap */
1771                         weight += v + 1;
1772                         break;
1773                 case iro_Id:
1774                         /* when looking backward we might find Id nodes */
1775                         weight += calc_method_local_weight(succ);
1776                         break;
1777                 case iro_Tuple:
1778                         /* unoptimized tuple */
1779                         for (j = get_Tuple_n_preds(succ) - 1; j >= 0; --j) {
1780                                 ir_node *pred = get_Tuple_pred(succ, j);
1781                                 if (pred == arg) {
1782                                         /* look for Proj(j) */
1783                                         for (k = get_irn_n_outs(succ) - 1; k >= 0; --k) {
1784                                                 ir_node *succ_succ = get_irn_out(succ, k);
1785                                                 if (is_Proj(succ_succ)) {
1786                                                         if (get_Proj_proj(succ_succ) == j) {
1787                                                                 /* found */
1788                                                                 weight += calc_method_local_weight(succ_succ);
1789                                                         }
1790                                                 } else {
1791                                                         /* this should NOT happen */
1792                                                         return 0;
1793                                                 }
1794                                         }
1795                                 }
1796                         }
1797                         break;
1798                 default:
1799                         /* any other node: unsupported yet or bad. */
1800                         return 0;
1801                 }
1802         }
1803         return weight;
1804 }
1805
1806 /**
1807  * Calculate the parameter weights for transmitting the address of a local variable.
1808  */
1809 static void analyze_irg_local_weights(inline_irg_env *env, ir_graph *irg) {
1810         ir_entity *ent = get_irg_entity(irg);
1811         ir_type  *mtp;
1812         int      nparams, i, proj_nr;
1813         ir_node  *irg_args, *arg;
1814
1815         mtp      = get_entity_type(ent);
1816         nparams  = get_method_n_params(mtp);
1817
1818         /* allocate a new array. currently used as 'analysed' flag */
1819         env->local_weights = NEW_ARR_D(unsigned, &temp_obst, nparams);
1820
1821         /* If the method haven't parameters we have nothing to do. */
1822         if (nparams <= 0)
1823                 return;
1824
1825         assure_irg_outs(irg);
1826         irg_args = get_irg_args(irg);
1827         for (i = get_irn_n_outs(irg_args) - 1; i >= 0; --i) {
1828                 arg     = get_irn_out(irg_args, i);
1829                 proj_nr = get_Proj_proj(arg);
1830                 env->local_weights[proj_nr] = calc_method_local_weight(arg);
1831         }
1832 }
1833
1834 /**
1835  * Calculate the benefice for transmitting an local variable address.
1836  * After inlining, the local variable might be transformed into a
1837  * SSA variable by scalar_replacement().
1838  */
1839 static unsigned get_method_local_adress_weight(ir_graph *callee, int pos) {
1840         inline_irg_env *env = get_irg_link(callee);
1841
1842         if (env->local_weights != NULL) {
1843                 if (pos < ARR_LEN(env->local_weights))
1844                         return env->local_weights[pos];
1845                 return 0;
1846         }
1847
1848         analyze_irg_local_weights(env, callee);
1849
1850         if (pos < ARR_LEN(env->local_weights))
1851                 return env->local_weights[pos];
1852         return 0;
1853 }
1854
1855 /**
1856  * calculate a benefice value for inlining the given call.
1857  */
1858 static int calc_inline_benefice(ir_node *call, ir_graph *callee, unsigned *local_adr) {
1859         ir_entity *ent = get_irg_entity(callee);
1860         ir_node   *frame_ptr;
1861         ir_type   *mtp;
1862         int       weight = 0;
1863         int       i, n_params, all_const;
1864         unsigned  cc, v;
1865
1866         inline_irg_env *curr_env, *callee_env;
1867
1868         if (get_entity_additional_properties(ent) & mtp_property_noreturn) {
1869                 /* do NOT inline noreturn calls */
1870                 return INT_MIN;
1871         }
1872
1873         /* costs for every passed parameter */
1874         n_params = get_Call_n_params(call);
1875         mtp      = get_entity_type(ent);
1876         cc       = get_method_calling_convention(mtp);
1877         if (cc & cc_reg_param) {
1878                 /* register parameter, smaller costs for register parameters */
1879                 int max_regs = cc & ~cc_bits;
1880
1881                 if (max_regs < n_params)
1882                         weight += max_regs * 2 + (n_params - max_regs) * 5;
1883                 else
1884                         weight += n_params * 2;
1885         } else {
1886                 /* parameters are passed an stack */
1887                 weight += 5 * n_params;
1888         }
1889
1890         /* constant parameters improve the benefice */
1891         frame_ptr = get_irg_frame(current_ir_graph);
1892         all_const = 1;
1893         for (i = 0; i < n_params; ++i) {
1894                 ir_node *param = get_Call_param(call, i);
1895
1896                 if (is_Const(param))
1897                         weight += get_method_param_weight(ent, i);
1898                 else {
1899                         all_const = 0;
1900                         if (is_SymConst(param))
1901                                 weight += get_method_param_weight(ent, i);
1902                         else if (is_Sel(param) && get_Sel_ptr(param) == frame_ptr) {
1903                                 /*
1904                                  * An address of a local variable is transmitted. After inlining,
1905                                  * scalar_replacement might be able to remove the local variable,
1906                                  * so honor this.
1907                                  */
1908                                 v = get_method_local_adress_weight(callee, i);
1909                                 weight += v;
1910                                 if (v > 0)
1911                                         *local_adr = 1;
1912                         }
1913                 }
1914         }
1915
1916         callee_env = get_irg_link(callee);
1917         if (get_entity_visibility(ent) == visibility_local &&
1918             callee_env->n_callers_orig == 1 &&
1919             callee != current_ir_graph) {
1920                 /* we are the only caller, give big bonus */
1921                 weight += 5000;
1922         }
1923
1924         /* do not inline big functions */
1925         weight -= callee_env->n_nodes;
1926
1927         /* reduce the benefice if the current function is already big */
1928         curr_env = get_irg_link(current_ir_graph);
1929         weight -= curr_env->n_nodes / 50;
1930
1931         /* give a bonus for functions with one block */
1932         if (callee_env->n_blocks == 1)
1933                 weight = weight * 3 / 2;
1934
1935         /* and one for small non-recursive functions: we want them to be inlined in mostly every case */
1936         else if (callee_env->n_nodes < 20 && !callee_env->recursive)
1937                 weight += 5000;
1938
1939         /* and finally for leaves: they do not increase the register pressure
1940            because of callee safe registers */
1941         else if (callee_env->n_call_nodes == 0)
1942                 weight += 25;
1943
1944         /*
1945          * Reduce the weight for recursive function IFF not all arguments are const.
1946          * inlining recursive functions is rarely good.
1947          */
1948         if (callee_env->recursive && !all_const)
1949                 weight -= 500;
1950
1951         /*
1952          * All arguments constant is probably a good sign, give an extra bonus
1953          */
1954         if (all_const)
1955                 weight += 100;
1956
1957         return weight;
1958 }
1959
1960 /**
1961  * Heuristic inliner. Calculates a benefice value for every call and inlines
1962  * those calls with a value higher than the threshold.
1963  */
1964 void inline_functions(int maxsize, int inline_threshold) {
1965         inline_irg_env   *env;
1966         int              i, n_irgs;
1967         ir_graph         *rem;
1968         int              did_inline;
1969         wenv_t           wenv;
1970         call_entry       *curr_call, **last_call;
1971         const call_entry *centry;
1972         pmap             *copied_graphs;
1973         pmap_entry       *pm_entry;
1974
1975         rem = current_ir_graph;
1976         obstack_init(&temp_obst);
1977
1978         /* a map for the copied graphs, used to inline recursive calls */
1979         copied_graphs = pmap_create();
1980
1981         /* extend all irgs by a temporary data structure for inlining. */
1982         n_irgs = get_irp_n_irgs();
1983         for (i = 0; i < n_irgs; ++i)
1984                 set_irg_link(get_irp_irg(i), alloc_inline_irg_env());
1985
1986         /* Precompute information in temporary data structure. */
1987         wenv.ignore_runtime = 0;
1988         wenv.ignore_callers = 0;
1989         for (i = 0; i < n_irgs; ++i) {
1990                 ir_graph *irg = get_irp_irg(i);
1991
1992                 assert(get_irg_phase_state(irg) != phase_building);
1993                 free_callee_info(irg);
1994
1995                 wenv.x         = get_irg_link(irg);
1996                 wenv.last_call = NULL;
1997                 assure_cf_loop(irg);
1998                 irg_walk_graph(irg, NULL, collect_calls2, &wenv);
1999         }
2000
2001         /* -- and now inline. -- */
2002         for (i = 0; i < n_irgs; ++i) {
2003                 int      phiproj_computed = 0;
2004                 ir_node  *call;
2005                 ir_graph *irg = get_irp_irg(i);
2006
2007                 current_ir_graph = irg;
2008                 env = get_irg_link(irg);
2009
2010                 /* note that the list of possible calls is updated during the process */
2011                 last_call = &env->call_head;
2012                 for (curr_call = env->call_head; curr_call != NULL;) {
2013                         ir_graph   *callee;
2014                         pmap_entry *e;
2015                         int        benefice;
2016                         unsigned   local_adr;
2017
2018                         if (env->n_nodes > maxsize) break;
2019
2020                         call   = curr_call->call;
2021                         callee = curr_call->callee;
2022
2023                         e = pmap_find(copied_graphs, callee);
2024                         if (e != NULL) {
2025                                 /*
2026                                 * Remap callee if we have a copy.
2027                                 * FIXME: Should we do this only for recursive Calls ?
2028                                 */
2029                                 callee = e->value;
2030                         }
2031
2032                         /* calculate the benefice on the original call to prevent excessive inlining */
2033                         local_adr = 0;
2034                         benefice = calc_inline_benefice(call, callee, &local_adr);
2035                         DB((dbg, LEVEL_2, "In %+F Call %+F has benefice %d\n", irg, callee, benefice));
2036
2037                         if (benefice > -inline_threshold ||
2038                                 (get_irg_inline_property(callee) >= irg_inline_forced)) {
2039                                 if (current_ir_graph == callee) {
2040                                         /*
2041                                          * Recursive call: we cannot directly inline because we cannot walk
2042                                          * the graph and change it. So we have to make a copy of the graph
2043                                          * first.
2044                                          */
2045
2046                                         inline_irg_env *callee_env;
2047                                         ir_graph       *copy;
2048
2049                                         /*
2050                                          * No copy yet, create one.
2051                                          * Note that recursive methods are never leaves, so it is sufficient
2052                                          * to test this condition here.
2053                                          */
2054                                         copy = create_irg_copy(callee);
2055
2056                                         /* create_irg_copy() destroys the Proj links, recompute them */
2057                                         phiproj_computed = 0;
2058
2059                                         /* allocate new environment */
2060                                         callee_env = alloc_inline_irg_env();
2061                                         set_irg_link(copy, callee_env);
2062
2063                                         assure_cf_loop(copy);
2064                                         wenv.x              = callee_env;
2065                                         wenv.ignore_callers = 1;
2066                                         irg_walk_graph(copy, NULL, collect_calls2, &wenv);
2067
2068                                         /*
2069                                          * Enter the entity of the original graph. This is needed
2070                                          * for inline_method(). However, note that ent->irg still points
2071                                          * to callee, NOT to copy.
2072                                          */
2073                                         set_irg_entity(copy, get_irg_entity(callee));
2074
2075                                         pmap_insert(copied_graphs, callee, copy);
2076                                         callee = copy;
2077
2078                                         /* we have only one caller: the original graph */
2079                                         callee_env->n_callers      = 1;
2080                                         callee_env->n_callers_orig = 1;
2081                                 }
2082                                 if (! phiproj_computed) {
2083                                         phiproj_computed = 1;
2084                                         collect_phiprojs(current_ir_graph);
2085                                 }
2086                                 did_inline = inline_method(call, callee);
2087                                 if (did_inline) {
2088                                         inline_irg_env *callee_env = (inline_irg_env *)get_irg_link(callee);
2089
2090                                         /* was inlined, must be recomputed */
2091                                         phiproj_computed = 0;
2092
2093                                         /* after we have inlined callee, all called methods inside callee
2094                                         are now called once more */
2095                                         for (centry = callee_env->call_head; centry != NULL; centry = centry->next) {
2096                                                 inline_irg_env *penv = get_irg_link(centry->callee);
2097                                                 ++penv->n_callers;
2098                                         }
2099
2100                                         /* callee was inline. Append it's call list. */
2101                                         env->got_inline = 1;
2102                                         if (local_adr)
2103                                                 env->local_vars = 1;
2104                                         --env->n_call_nodes;
2105                                         curr_call = replace_entry_by_call_list(curr_call, callee_env->call_head);
2106                                         env->n_call_nodes += callee_env->n_call_nodes;
2107                                         env->n_nodes += callee_env->n_nodes;
2108                                         --callee_env->n_callers;
2109
2110                                         /* remove the current call entry from the list */
2111                                         *last_call = curr_call;
2112                                         continue;
2113                                 }
2114                         }
2115                         last_call = &curr_call->next;
2116                         curr_call = curr_call->next;
2117                 }
2118
2119                 if (env->got_inline) {
2120                         /* this irg got calls inlined: optimize it */
2121
2122                         /* scalar replacement does not work well with Tuple nodes, so optimize them away */
2123                         optimize_graph_df(irg);
2124
2125                         if (env->local_vars) {
2126                                 if (scalar_replacement_opt(irg)) {
2127                                         optimize_graph_df(irg);
2128                                 }
2129                         }
2130                         optimize_cf(irg);
2131                 }
2132                 if (env->got_inline || (env->n_callers_orig != env->n_callers)) {
2133                         DB((dbg, LEVEL_1, "Nodes:%3d ->%3d, calls:%3d ->%3d, callers:%3d ->%3d, -- %s\n",
2134                         env->n_nodes_orig, env->n_nodes, env->n_call_nodes_orig, env->n_call_nodes,
2135                         env->n_callers_orig, env->n_callers,
2136                         get_entity_name(get_irg_entity(irg))));
2137                 }
2138         }
2139
2140         /* kill the copied graphs: we don't need them anymore */
2141         foreach_pmap(copied_graphs, pm_entry) {
2142                 ir_graph *copy = pm_entry->value;
2143
2144                 /* reset the entity, otherwise it will be deleted in the next step ... */
2145                 set_irg_entity(copy, NULL);
2146                 free_ir_graph(copy);
2147         }
2148         pmap_destroy(copied_graphs);
2149
2150         obstack_free(&temp_obst, NULL);
2151         current_ir_graph = rem;
2152 }
2153
2154 void firm_init_inline(void) {
2155         FIRM_DBG_REGISTER(dbg, "firm.opt.inline");
2156 }