nsz Git - libfirm/blob - ir/opt/cfopt.c

   1 /*
   2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
   3  *
   4  * This file is part of libFirm.
   5  *
   6  * This file may be distributed and/or modified under the terms of the
   7  * GNU General Public License version 2 as published by the Free Software
   8  * Foundation and appearing in the file LICENSE.GPL included in the
   9  * packaging of this file.
  10  *
  11  * Licensees holding valid libFirm Professional Edition licenses may use
  12  * this file in accordance with the libFirm Commercial License.
  13  * Agreement provided with the Software.
  14  *
  15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  17  * PURPOSE.
  18  */
  19
  20 /**
  21  * @file
  22  * @brief   Control flow optimizations.
  23  * @author  Goetz Lindenmaier, Michael Beck, Sebastian Hack
  24  * @version $Id$
  25  */
  26 #include "config.h"
  27
  28 #include "iroptimize.h"
  29
  30 #include <assert.h>
  31
  32 #include "plist.h"
  33 #include "xmalloc.h"
  34 #include "irnode_t.h"
  35 #include "irgraph_t.h"
  36 #include "irprog_t.h"
  37
  38 #include "ircons.h"
  39 #include "iropt_t.h"
  40 #include "irgwalk.h"
  41 #include "irgmod.h"
  42 #include "irdump.h"
  43 #include "irverify.h"
  44 #include "iredges.h"
  45
  46 #include "array_t.h"
  47
  48 #include "irouts.h"
  49 #include "irbackedge_t.h"
  50
  51 #include "irflag_t.h"
  52 #include "firmstat.h"
  53 #include "irpass.h"
  54
  55 #include "iropt_dbg.h"
  56
  57 /*------------------------------------------------------------------*/
  58 /* Control flow optimization.                                       */
  59 /*                                                                  */
  60 /* Removes Bad control flow predecessors and empty blocks.  A block */
  61 /* is empty if it contains only a Jmp node.                         */
  62 /* Blocks can only be removed if they are not needed for the        */
  63 /* semantics of Phi nodes.                                          */
  64 /* Further, we NEVER remove labeled blocks (even if we could move   */
  65 /* the label.                                                       */
  66 /*------------------------------------------------------------------*/
  67
  68 #define set_Block_removable(block)      set_Block_mark(block, 1)
  69 #define set_Block_non_removable(block)  set_Block_mark(block, 0)
  70 #define is_Block_removable(block)       (get_Block_mark(block) != 0)
  71
  72 /**
  73  * Replace binary Conds that jumps twice into the same block
  74  * by a simple Jmp.
  75  * E.g.
  76  * @verbatim
  77  *               Cond                     Jmp  Bad
  78  *             /       \                   |   /
  79  *       ProjX True   ProjX False  ==>     |  /
  80  *             \       /                   | /
  81  *               Block                    Block
  82  * @endverbatim
  83  *
  84  * Such pattern are the result of if-conversion.
  85  *
  86  * Note that the simple case that Block has only these two
  87  * predecessors are already handled in equivalent_node_Block().
  88  */
  89 static int remove_senseless_conds(ir_node *bl)
  90 {
  91         int i, j;
  92         int n = get_Block_n_cfgpreds(bl);
  93         int changed = 0;
  94
  95         for (i = 0; i < n; ++i) {
  96                 ir_node *pred_i = get_Block_cfgpred(bl, i);
  97                 ir_node *cond_i = skip_Proj(pred_i);
  98
  99                 /* binary Cond */
 100                 if (is_Cond(cond_i) && get_irn_mode(get_Cond_selector(cond_i)) == mode_b) {
 101
 102                         for (j = i + 1; j < n; ++j) {
 103                                 ir_node *pred_j = get_Block_cfgpred(bl, j);
 104                                 ir_node *cond_j = skip_Proj(pred_j);
 105
 106                                 if (cond_j == cond_i) {
 107                                         ir_graph *irg = get_irn_irg(bl);
 108                                         ir_node  *jmp = new_r_Jmp(get_nodes_block(cond_i));
 109                                         set_irn_n(bl, i, jmp);
 110                                         set_irn_n(bl, j, new_r_Bad(irg));
 111
 112                                         DBG_OPT_IFSIM2(cond_i, jmp);
 113                                         changed = 1;
 114                                         break;
 115                                 }
 116                         }
 117                 }
 118         }
 119         return changed;
 120 }
 121
 122 /** An environment for merge_blocks and collect nodes. */
 123 typedef struct merge_env {
 124         int changed;    /**< Set if the graph was changed. */
 125         int phis_moved; /**< Set if Phi nodes were moved. */
 126         plist_t *list;  /**< Helper list for all found Switch Conds. */
 127 } merge_env;
 128
 129 /**
 130  * Removes Tuples from Block control flow predecessors.
 131  * Optimizes blocks with equivalent_node().  This is tricky,
 132  * as we want to avoid nodes that have as block predecessor Bads.
 133  * Therefore we also optimize at control flow operations, depending
 134  * how we first reach the Block.
 135  */
 136 static void merge_blocks(ir_node *node, void *ctx)
 137 {
 138         int i;
 139         ir_node *new_block;
 140         merge_env *env = (merge_env*)ctx;
 141
 142         /* clear the link field for ALL nodes first */
 143         set_irn_link(node, NULL);
 144
 145         if (is_Block(node)) {
 146                 /* Remove Tuples */
 147                 for (i = get_Block_n_cfgpreds(node) - 1; i >= 0; --i) {
 148                         ir_node *pred = get_Block_cfgpred(node, i);
 149                         ir_node *skipped = skip_Tuple(pred);
 150                         if (pred != skipped) {
 151                                 set_Block_cfgpred(node, i, skipped);
 152                                 env->changed = 1;
 153                         }
 154                 }
 155
 156                 /* see below */
 157                 new_block = equivalent_node(node);
 158                 if (new_block != node && ! is_Block_dead(new_block)) {
 159                         exchange(node, new_block);
 160                         env->changed = 1;
 161                 }
 162
 163         } else if (get_opt_optimize() && (get_irn_mode(node) == mode_X)) {
 164                 /* We will soon visit a block.  Optimize it before visiting! */
 165                 ir_node *b = get_nodes_block(skip_Proj(node));
 166
 167                 if (!is_Block_dead(b)) {
 168                         new_block = equivalent_node(b);
 169
 170                         while (!irn_visited(b) && !is_Block_dead(new_block) && new_block != b) {
 171                                 /* We would have to run gigo() if new is bad, so we
 172                                    promote it directly below. Nevertheless, we sometimes reach a block
 173                                    the first time through a dataflow node.  In this case we optimized the
 174                                    block as such and have to promote the Bad here. */
 175                                 exchange(b, new_block);
 176                                 env->changed = 1;
 177                                 b = new_block;
 178                                 new_block = equivalent_node(b);
 179                         }
 180
 181                         /* normally, we would create a Bad block here, but this must be
 182                          * prevented, so just set its cf to Bad.
 183                          */
 184                         if (is_Block_dead(new_block)) {
 185                                 ir_graph *irg = get_irn_irg(node);
 186                                 exchange(node, new_r_Bad(irg));
 187                                 env->changed = 1;
 188                         }
 189                 }
 190         }
 191 }
 192
 193 /**
 194  * Block walker removing control flow from dead block by
 195  * inspecting dominance info.
 196  * Do not replace blocks by Bad.  This optimization shall
 197  * ensure, that all Bad control flow predecessors are
 198  * removed, and no new other Bads are introduced.
 199  * Further removed useless Conds and clear the mark of all blocks.
 200  *
 201  * Must be run in the post walker.
 202  */
 203 static void remove_unreachable_blocks_and_conds(ir_node *block, void *env)
 204 {
 205         int i;
 206         int *changed = (int*)env;
 207
 208         /* Check block predecessors and turn control flow into bad.
 209            Beware of Tuple, kill them. */
 210         for (i = get_Block_n_cfgpreds(block) - 1; i >= 0; --i) {
 211                 ir_node *pred_X  = get_Block_cfgpred(block, i);
 212                 ir_node *skipped = skip_Tuple(pred_X);
 213
 214                 if (! is_Bad(skipped)) {
 215                         ir_node *pred_bl = get_nodes_block(skip_Proj(skipped));
 216
 217                         if (is_Block_dead(pred_bl) || (get_Block_dom_depth(pred_bl) < 0)) {
 218                                 ir_graph *irg = get_irn_irg(block);
 219                                 set_Block_dead(pred_bl);
 220                                 exchange(pred_X, new_r_Bad(irg));
 221                                 *changed = 1;
 222                         } else if (skipped != pred_X) {
 223                                 set_Block_cfgpred(block, i, skipped);
 224                                 *changed = 1;
 225                         }
 226                 }
 227         }
 228
 229         *changed |= remove_senseless_conds(block);
 230
 231         /* clear the block mark of all non labeled blocks */
 232         if (has_Block_entity(block))
 233                 set_Block_non_removable(block);
 234         else
 235                 set_Block_removable(block);
 236 }
 237
 238 /**
 239  * Collects all Phi nodes in link list of Block.
 240  * Marks all blocks "non_removable" if they contain a node other
 241  * than Jmp (and Proj).
 242  * Links all Proj nodes to their predecessors.
 243  * Collects all switch-Conds in a list.
 244  */
 245 static void collect_nodes(ir_node *n, void *ctx)
 246 {
 247         unsigned   code = get_irn_opcode(n);
 248         merge_env *env  = (merge_env*)ctx;
 249
 250         if (code == iro_Block) {
 251                 /* mark the block as non-removable if it is labeled */
 252                 if (has_Block_entity(n))
 253                         set_Block_non_removable(n);
 254         } else {
 255                 ir_node *b = get_nodes_block(n);
 256
 257                 if (code == iro_Phi && get_irn_arity(n) > 0) {
 258                         /* Collect Phi nodes to compact ins along with block's ins. */
 259                         set_irn_link(n, get_irn_link(b));
 260                         set_irn_link(b, n);
 261                 } else if (code != iro_Jmp && !is_Bad(b)) {  /* Check for non-empty block. */
 262                         set_Block_non_removable(b);
 263
 264                         if (code == iro_Proj) {               /* link Proj nodes */
 265                                 ir_node *pred = get_Proj_pred(n);
 266
 267                                 set_irn_link(n, get_irn_link(pred));
 268                                 set_irn_link(pred, n);
 269                         } else if (code == iro_Cond) {
 270                                 ir_node *sel = get_Cond_selector(n);
 271                                 if (mode_is_int(get_irn_mode(sel))) {
 272                                         /* found a switch-Cond, collect */
 273                                         plist_insert_back(env->list, n);
 274                                 }
 275                         }
 276                 }
 277         }
 278 }
 279
 280 /** Returns true if pred is predecessor of block. */
 281 static int is_pred_of(ir_node *pred, ir_node *b)
 282 {
 283         int i;
 284
 285         for (i = get_Block_n_cfgpreds(b) - 1; i >= 0; --i) {
 286                 ir_node *b_pred = get_Block_cfgpred_block(b, i);
 287                 if (b_pred == pred)
 288                         return 1;
 289         }
 290         return 0;
 291 }
 292
 293 /** Test whether we can optimize away pred block pos of b.
 294  *
 295  *  @param  b    A block node.
 296  *  @param  pos  The position of the predecessor block to judge about.
 297  *
 298  *  @returns     The number of predecessors
 299  *
 300  *  The test is rather tricky.
 301  *
 302  *  The situation is something like the following:
 303  *  @verbatim
 304  *                 if-block
 305  *                  /   \
 306  *              then-b  else-b
 307  *                  \   /
 308  *                    b
 309  *  @endverbatim
 310  *
 311  *  b merges the control flow of an if-then-else.  We may not remove
 312  *  the 'then' _and_ the 'else' block of an 'if' if there is a Phi
 313  *  node in b, even if both are empty.  The destruction of this Phi
 314  *  requires that a copy is added before the merge.  We have to
 315  *  keep one of the case blocks to place the copies in.
 316  *
 317  *  To perform the test for pos, we must regard predecessors before pos
 318  *  as already removed.
 319  **/
 320 static int test_whether_dispensable(ir_node *b, int pos)
 321 {
 322         int i, j, n_preds = 1;
 323         ir_node *pred = get_Block_cfgpred_block(b, pos);
 324
 325         /* Bad blocks will be optimized away, so we don't need space for them */
 326         if (is_Block_dead(pred))
 327                 return 0;
 328
 329         if (is_Block_removable(pred)) {
 330                 /* Seems to be empty. At least we detected this in collect_nodes. */
 331                 if (get_irn_link(b) == NULL) {
 332                         /* There are no Phi nodes ==> all predecessors are dispensable. */
 333                         n_preds = get_Block_n_cfgpreds(pred);
 334                 } else {
 335                         /* b's pred blocks and pred's pred blocks must be pairwise disjunct.
 336                            Handle all pred blocks with preds < pos as if they were already removed. */
 337                         for (i = 0; i < pos; i++) {
 338                                 ir_node *b_pred = get_Block_cfgpred_block(b, i);
 339                                 if (! is_Block_dead(b_pred) && is_Block_removable(b_pred)) {
 340                                         for (j = get_Block_n_cfgpreds(b_pred) - 1; j >= 0; --j) {
 341                                                 ir_node *b_pred_pred = get_Block_cfgpred_block(b_pred, j);
 342                                                 if (is_pred_of(b_pred_pred, pred))
 343                                                         goto non_dispensable;
 344                                         }
 345                                 } else {
 346                                         if (is_pred_of(b_pred, pred))
 347                                                 goto non_dispensable;
 348                                 }
 349                         }
 350                         for (i = pos +1; i < get_Block_n_cfgpreds(b); i++) {
 351                                 ir_node *b_pred = get_Block_cfgpred_block(b, i);
 352                                 if (is_pred_of(b_pred, pred))
 353                                         goto non_dispensable;
 354                         }
 355                         /* if we get here, the block is dispensable */
 356                         n_preds = get_Block_n_cfgpreds(pred);
 357                 }
 358         }
 359
 360         return n_preds;
 361
 362 non_dispensable:
 363         set_Block_non_removable(pred);
 364         return 1;
 365 }
 366
 367 /**
 368  * This method removed Bad cf predecessors from Blocks and Phis, and removes
 369  * empty blocks.  A block is empty if it only contains Phi and Jmp nodes.
 370  *
 371  * We first adapt Phi nodes, then Block nodes, as we need the old ins
 372  * of the Block to adapt the Phi nodes.  We do this by computing new
 373  * in arrays, and then replacing the old ones.  So far we compute new in arrays
 374  * for all nodes, not regarding whether there is a possibility for optimization.
 375  *
 376  * For each predecessor p of a Block b there are three cases:
 377  *  -1. The predecessor p is a Bad node:  just skip it.  The in array of b shrinks by one.
 378  *  -2. The predecessor p is empty.  Remove p.  All predecessors of p are now
 379  *      predecessors of b.
 380  *  -3. The predecessor p is a block containing useful code.  Just keep p as is.
 381  *
 382  * For Phi nodes f we have to check the conditions at the Block of f.
 383  * For cases 1 and 3 we proceed as for Blocks.  For case 2 we can have two
 384  * cases:
 385  *  -2a: The old predecessor of the Phi f is a Phi pred_f IN THE BLOCK REMOVED.  In this
 386  *      case we proceed as for blocks. We remove pred_f.  All
 387  *      predecessors of pred_f now are predecessors of f.
 388  *  -2b: The old predecessor of f is NOT in the block removed. It might be a Phi, too.
 389  *      We have to replicate f for each predecessor of the removed block. Or, with
 390  *      other words, the removed predecessor block has exactly one predecessor.
 391  *
 392  * Further there is a special case for self referencing blocks:
 393  * @verbatim
 394  *
 395  *    then_b     else_b                              then_b  else_b
 396  *       \      /                                      \      /
 397  *        \    /                                        |    /
 398  *        pred_b                                        |   /
 399  *         |   ____                                     |  /  ____
 400  *         |  |    |                                    |  | |    |
 401  *         |  |    |       === optimized to ===>        \  | |    |
 402  *        loop_b   |                                     loop_b   |
 403  *         |  |    |                                      |  |    |
 404  *         |  |____|                                      |  |____|
 405  *         |                                              |
 406  * @endverbatim
 407  *
 408  * If there is a Phi in pred_b, but we remove pred_b, we have to generate a
 409  * Phi in loop_b, that has the ins of the Phi in pred_b and a self referencing
 410  * backedge.
 411  * @@@ It is negotiable whether we should do this ... there might end up a copy
 412  * from the Phi in the loop when removing the Phis.
 413  */
 414 static void optimize_blocks(ir_node *b, void *ctx)
 415 {
 416         int i, j, k, n, max_preds, n_preds, p_preds = -1;
 417         ir_node *pred, *phi, *next;
 418         ir_node **in;
 419         merge_env *env = (merge_env*)ctx;
 420
 421         /* Count the number of predecessor if this block is merged with pred blocks
 422            that are empty. */
 423         max_preds = 0;
 424         for (i = 0, k = get_Block_n_cfgpreds(b); i < k; ++i) {
 425                 max_preds += test_whether_dispensable(b, i);
 426         }
 427         in = XMALLOCN(ir_node*, max_preds);
 428
 429         /*- Fix the Phi nodes of the current block -*/
 430         for (phi = (ir_node*)get_irn_link(b); phi != NULL; phi = (ir_node*)next) {
 431                 assert(is_Phi(phi));
 432                 next = (ir_node*)get_irn_link(phi);
 433
 434                 /* Find the new predecessors for the Phi */
 435                 p_preds = 0;
 436                 for (i = 0, n = get_Block_n_cfgpreds(b); i < n; ++i) {
 437                         pred = get_Block_cfgpred_block(b, i);
 438
 439                         if (is_Block_dead(pred)) {
 440                                 /* case Phi 1: Do nothing */
 441                         } else if (is_Block_removable(pred) && !Block_block_visited(pred)) {
 442                                 /* case Phi 2: It's an empty block and not yet visited. */
 443                                 ir_node *phi_pred = get_Phi_pred(phi, i);
 444
 445                                 for (j = 0, k = get_Block_n_cfgpreds(pred); j < k; j++) {
 446                                         /* because of breaking loops, not all predecessors are Bad-clean,
 447                                          * so we must check this here again */
 448                                         if (! is_Bad(get_Block_cfgpred(pred, j))) {
 449                                                 if (get_nodes_block(phi_pred) == pred) {
 450                                                         /* case Phi 2a: */
 451                                                         assert(is_Phi(phi_pred));  /* Block is empty!! */
 452
 453                                                         in[p_preds++] = get_Phi_pred(phi_pred, j);
 454                                                 } else {
 455                                                         /* case Phi 2b: */
 456                                                         in[p_preds++] = phi_pred;
 457                                                 }
 458                                         }
 459                                 }
 460                         } else {
 461                                 /* case Phi 3: */
 462                                 in[p_preds++] = get_Phi_pred(phi, i);
 463                         }
 464                 }
 465                 assert(p_preds <= max_preds);
 466
 467                 /* Fix the node */
 468                 if (p_preds == 1)
 469                         /* By removal of Bad ins the Phi might be degenerated. */
 470                         exchange(phi, in[0]);
 471                 else
 472                         set_irn_in(phi, p_preds, in);
 473                 env->changed = 1;
 474         }
 475
 476         /*- This happens only if merge between loop backedge and single loop entry.
 477             Moreover, it is only needed if predb is the direct dominator of b, else there can be no uses
 478             of the Phi's in predb ... -*/
 479         for (k = 0, n = get_Block_n_cfgpreds(b); k < n; ++k) {
 480                 ir_node *predb = get_nodes_block(get_Block_cfgpred(b, k));
 481
 482                 if (is_Block_removable(predb) && !Block_block_visited(predb)) {
 483                         ir_node *next_phi;
 484
 485                         /* we found a predecessor block at position k that will be removed */
 486                         for (phi = (ir_node*)get_irn_link(predb); phi; phi = next_phi) {
 487                                 int q_preds = 0;
 488                                 next_phi = (ir_node*)get_irn_link(phi);
 489
 490                                 assert(is_Phi(phi));
 491
 492                                 if (get_Block_idom(b) != predb) {
 493                                         /* predb is not the dominator. There can't be uses of pred's Phi nodes, kill them .*/
 494                                         ir_graph *irg = get_irn_irg(b);
 495                                         exchange(phi, new_r_Bad(irg));
 496                                 } else {
 497                                         /* predb is the direct dominator of b. There might be uses of the Phi nodes from
 498                                            predb in further block, so move this phi from the predecessor into the block b */
 499                                         set_nodes_block(phi, b);
 500                                         set_irn_link(phi, get_irn_link(b));
 501                                         set_irn_link(b, phi);
 502                                         env->phis_moved = 1;
 503
 504                                         /* first, copy all 0..k-1 predecessors */
 505                                         for (i = 0; i < k; i++) {
 506                                                 pred = get_Block_cfgpred_block(b, i);
 507
 508                                                 if (is_Block_dead(pred)) {
 509                                                         /* Do nothing */
 510                                                 } else if (is_Block_removable(pred) && !Block_block_visited(pred)) {
 511                                                         /* It's an empty block and not yet visited. */
 512                                                         for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
 513                                                                 if (! is_Bad(get_Block_cfgpred(pred, j)))
 514                                                                         in[q_preds++] = phi;
 515                                                         }
 516                                                 } else {
 517                                                         in[q_preds++] = phi;
 518                                                 }
 519                                         }
 520
 521                                         /* now we are at k, copy the phi predecessors */
 522                                         pred = get_nodes_block(get_Block_cfgpred(b, k));
 523                                         for (i = 0; i < get_Phi_n_preds(phi); i++) {
 524                                                 if (! is_Bad(get_Block_cfgpred(pred, i)))
 525                                                         in[q_preds++] = get_Phi_pred(phi, i);
 526                                         }
 527
 528                                         /* and now all the rest */
 529                                         for (i = k+1; i < get_Block_n_cfgpreds(b); i++) {
 530                                                 pred = get_Block_cfgpred_block(b, i);
 531
 532                                                 if (is_Block_dead(pred)) {
 533                                                         /* Do nothing */
 534                                                 } else if (is_Block_removable(pred) && !Block_block_visited(pred)) {
 535                                                         /* It's an empty block and not yet visited. */
 536                                                         for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
 537                                                                 if (! is_Bad(get_Block_cfgpred(pred, j)))
 538                                                                         in[q_preds++] = phi;
 539                                                         }
 540                                                 } else {
 541                                                         in[q_preds++] = phi;
 542                                                 }
 543                                         }
 544
 545                                         /* Fix the node */
 546                                         if (q_preds == 1)
 547                                                 exchange(phi, in[0]);
 548                                         else
 549                                                 set_irn_in(phi, q_preds, in);
 550                                         env->changed = 1;
 551
 552                                         assert(q_preds <= max_preds);
 553                                         // assert(p_preds == q_preds && "Wrong Phi Fix");
 554                                 }
 555                         }
 556                 }
 557         }
 558
 559         /*- Fix the block -*/
 560         n_preds = 0;
 561         for (i = 0; i < get_Block_n_cfgpreds(b); i++) {
 562                 pred = get_Block_cfgpred_block(b, i);
 563
 564                 if (is_Block_dead(pred)) {
 565                         /* case 1: Do nothing */
 566                 } else if (is_Block_removable(pred) && !Block_block_visited(pred)) {
 567                         /* case 2: It's an empty block and not yet visited. */
 568                         assert(get_Block_n_cfgpreds(b) > 1 || has_Block_entity(b));
 569                         /* Else it should be optimized by equivalent_node. */
 570                         for (j = 0; j < get_Block_n_cfgpreds(pred); j++) {
 571                                 ir_node *pred_X = get_Block_cfgpred(pred, j);
 572
 573                                 /* because of breaking loops, not all predecessors are Bad-clean,
 574                                  * so we must check this here again */
 575                                 if (! is_Bad(pred_X))
 576                                         in[n_preds++] = pred_X;
 577                         }
 578                         /* Remove block as it might be kept alive. */
 579                         exchange(pred, b/*new_r_Bad(irg)*/);
 580                 } else {
 581                         /* case 3: */
 582                         in[n_preds++] = get_Block_cfgpred(b, i);
 583                 }
 584         }
 585         assert(n_preds <= max_preds);
 586
 587         set_irn_in(b, n_preds, in);
 588         env->changed = 1;
 589
 590         assert(get_irn_link(b) == NULL || p_preds == -1 || (n_preds == p_preds && "Wrong Phi Fix"));
 591         xfree(in);
 592 }
 593
 594 /**
 595  * Block walker: optimize all blocks using the default optimizations.
 596  * This removes Blocks that with only a Jmp predecessor.
 597  */
 598 static void remove_simple_blocks(ir_node *block, void *ctx)
 599 {
 600         merge_env *env = (merge_env*)ctx;
 601         ir_node   *new_blk = equivalent_node(block);
 602
 603         if (new_blk != block) {
 604                 exchange(block, new_blk);
 605                 env->changed = 1;
 606         }
 607 }
 608
 609 /**
 610  * Handle pre-optimized table switch Cond's.
 611  * During iropt, all Projs from a switch-Cond are already removed except
 612  * the defProj and maybe the taken one.
 613  * The defProj cannot be removed WITHOUT looking backwards, so we do this here.
 614  *
 615  * @param cond the switch-Cond
 616  *
 617  * @return non-zero if a switch-Cond was optimized
 618  *
 619  * Expects all Proj's linked to the cond node
 620  */
 621 static int handle_switch_cond(ir_node *cond)
 622 {
 623         ir_node *sel = get_Cond_selector(cond);
 624
 625         ir_node *proj1 = (ir_node*)get_irn_link(cond);
 626         ir_node *proj2 = (ir_node*)get_irn_link(proj1);
 627         ir_node *jmp, *blk;
 628
 629         blk = get_nodes_block(cond);
 630
 631         if (proj2 == NULL) {
 632                 /* this Cond has only one Proj: must be the defProj */
 633                 assert(get_Cond_default_proj(cond) == get_Proj_proj(proj1));
 634                 /* convert it into a Jmp */
 635                 jmp = new_r_Jmp(blk);
 636                 exchange(proj1, jmp);
 637                 return 1;
 638         } else if (get_irn_link(proj2) == NULL) {
 639                 /* We have two Proj's here. Check if the Cond has
 640                    a constant argument */
 641                 ir_tarval *tv = value_of(sel);
 642
 643                 if (tv != tarval_bad) {
 644                         /* we have a constant switch */
 645                         long      num     = get_tarval_long(tv);
 646                         long      def_num = get_Cond_default_proj(cond);
 647                         ir_graph *irg     = get_irn_irg(cond);
 648
 649                         if (def_num == get_Proj_proj(proj1)) {
 650                                 /* first one is the defProj */
 651                                 if (num == get_Proj_proj(proj2)) {
 652                                         jmp = new_r_Jmp(blk);
 653                                         exchange(proj2, jmp);
 654                                         exchange(proj1, new_r_Bad(irg));
 655                                         return 1;
 656                                 }
 657                         } else if (def_num == get_Proj_proj(proj2)) {
 658                                 /* second one is the defProj */
 659                                 if (num == get_Proj_proj(proj1)) {
 660                                         jmp = new_r_Jmp(blk);
 661                                         exchange(proj1, jmp);
 662                                         exchange(proj2, new_r_Bad(irg));
 663                                         return 1;
 664                                 }
 665                         } else {
 666                                 /* neither: strange, Cond was not optimized so far */
 667                                 if (num == get_Proj_proj(proj1)) {
 668                                         jmp = new_r_Jmp(blk);
 669                                         exchange(proj1, jmp);
 670                                         exchange(proj2, new_r_Bad(irg));
 671                                         return 1;
 672                                 } else if (num == get_Proj_proj(proj2)) {
 673                                         jmp = new_r_Jmp(blk);
 674                                         exchange(proj2, jmp);
 675                                         exchange(proj1, new_r_Bad(irg));
 676                                         return 1;
 677                                 }
 678                         }
 679                 }
 680         }
 681         return 0;
 682 }
 683
 684 /* Optimizations of the control flow that also require changes of Phi nodes.
 685  *
 686  * This optimization performs two passes over the graph.
 687  *
 688  * The first pass collects all Phi nodes in a link list in the block
 689  * nodes.  Further it performs simple control flow optimizations.
 690  * Finally it marks all blocks that do not contain useful
 691  * computations, i.e., these blocks might be removed.
 692  *
 693  * The second pass performs the optimizations intended by this algorithm.
 694  * It walks only over block nodes and adapts these and the Phi nodes in these blocks,
 695  * which it finds in a linked list computed by the first pass.
 696  *
 697  * We use the mark flag to mark removable blocks in the first
 698  * phase.
 699  */
 700 void optimize_cf(ir_graph *irg)
 701 {
 702         int i, j, n, changed;
 703         ir_node **in = NULL;
 704         ir_node *cond, *end = get_irg_end(irg);
 705         plist_element_t *el;
 706         merge_env env;
 707
 708         assert(get_irg_phase_state(irg) != phase_building);
 709
 710         /* if the graph is not pinned, we cannot determine empty blocks */
 711         assert(get_irg_pinned(irg) != op_pin_state_floats &&
 712                "Control flow optimization need a pinned graph");
 713
 714         /* FIXME: control flow opt destroys block edges. So edges are deactivated here. Fix the edges! */
 715         edges_deactivate(irg);
 716
 717         /* we use the mark flag to mark removable blocks */
 718         ir_reserve_resources(irg, IR_RESOURCE_BLOCK_MARK);
 719 restart:
 720         env.changed    = 0;
 721         env.phis_moved = 0;
 722
 723         /* ALWAYS kill unreachable control flow. Backend cannot handle it anyway.
 724            Use dominator info to kill blocks. Also optimize useless Conds. */
 725         assure_doms(irg);
 726         irg_block_walk_graph(irg, NULL, remove_unreachable_blocks_and_conds, &env.changed);
 727
 728         /* fix the keep-alives */
 729         changed = 0;
 730         for (i = 0, n = get_End_n_keepalives(end); i < n; ++i) {
 731                 ir_node *ka = get_End_keepalive(end, i);
 732
 733                 if (is_Block(ka)) {
 734                         /* do NOT keep dead blocks */
 735                         if (is_Block_dead(ka) || get_Block_dom_depth(ka) < 0) {
 736                                 set_End_keepalive(end, i, new_r_Bad(irg));
 737                                 changed = 1;
 738                         }
 739                 } else {
 740                         ir_node *block = get_nodes_block(ka);
 741
 742                         if (is_Bad(block) || is_Block_dead(block) || get_Block_dom_depth(block) < 0) {
 743                                 /* do NOT keep nodes in dead blocks */
 744                                 set_End_keepalive(end, i, new_r_Bad(irg));
 745                                 changed = 1;
 746                         }
 747                 }
 748         }
 749         env.changed |= changed;
 750
 751         ir_reserve_resources(irg, IR_RESOURCE_IRN_LINK);
 752
 753         env.list = plist_new();
 754         irg_walk(end, merge_blocks, collect_nodes, &env);
 755
 756         ir_free_resources(irg, IR_RESOURCE_IRN_LINK);
 757
 758         if (env.changed) {
 759                 /* Handle graph state if was changed. */
 760                 set_irg_outs_inconsistent(irg);
 761                 set_irg_doms_inconsistent(irg);
 762                 set_irg_extblk_inconsistent(irg);
 763                 set_irg_loopinfo_inconsistent(irg);
 764                 set_irg_entity_usage_state(irg, ir_entity_usage_not_computed);
 765                 env.changed = 0;
 766         }
 767
 768         /* handle all collected switch-Conds */
 769         foreach_plist(env.list, el) {
 770                 cond = (ir_node*)plist_element_get_value(el);
 771                 env.changed |= handle_switch_cond(cond);
 772         }
 773         plist_free(env.list);
 774
 775         if (env.changed) {
 776                 /* The Cond optimization might generate unreachable code, so restart if
 777                    it happens. */
 778                 goto restart;
 779         }
 780
 781         /* Optimize the standard code. */
 782         env.changed = 0;
 783         assure_doms(irg);
 784         irg_block_walk_graph(irg, optimize_blocks, remove_simple_blocks, &env);
 785
 786         /* in rare cases a node may be kept alive more than once, use the visited flag to detect this */
 787         ir_reserve_resources(irg, IR_RESOURCE_IRN_VISITED);
 788         inc_irg_visited(irg);
 789
 790         /* fix the keep-alives again */
 791         changed = 0;
 792         for (i = 0, n = get_End_n_keepalives(end); i < n; ++i) {
 793                 ir_node *ka = get_End_keepalive(end, i);
 794
 795                 if (is_Block(ka)) {
 796                         /* do NOT keep dead blocks */
 797                         if (is_Block_dead(ka) || get_Block_dom_depth(ka) < 0) {
 798                                 set_End_keepalive(end, i, new_r_Bad(irg));
 799                                 changed = 1;
 800                         }
 801                 } else {
 802                         ir_node *block = get_nodes_block(ka);
 803
 804                         if (is_Bad(block) || is_Block_dead(block) || get_Block_dom_depth(block) < 0) {
 805                                 /* do NOT keep nodes in dead blocks */
 806                                 set_End_keepalive(end, i, new_r_Bad(irg));
 807                                 changed = 1;
 808                         }
 809                 }
 810         }
 811         env.changed |= changed;
 812
 813         remove_End_Bads_and_doublets(end);
 814
 815
 816         ir_free_resources(irg, IR_RESOURCE_BLOCK_MARK | IR_RESOURCE_IRN_VISITED);
 817
 818         if (env.phis_moved) {
 819                 /* Bad: when we moved Phi's, we might produce dead Phi nodes
 820                    that are kept-alive.
 821                    Some other phases cannot copy with this, so will them.
 822                  */
 823                 n = get_End_n_keepalives(end);
 824                 if (n > 0) {
 825                         NEW_ARR_A(ir_node *, in, n);
 826                         if (env.changed) {
 827                                 /* Handle graph state if was changed. */
 828                                 set_irg_outs_inconsistent(irg);
 829                         }
 830                         assure_irg_outs(irg);
 831
 832                         for (i = j = 0; i < n; ++i) {
 833                                 ir_node *ka = get_End_keepalive(end, i);
 834
 835                                 if (is_Phi(ka)) {
 836                                         int k;
 837
 838                                         for (k = get_irn_n_outs(ka) - 1; k >= 0; --k) {
 839                                                 ir_node *user = get_irn_out(ka, k);
 840
 841                                                 if (user != ka && user != end) {
 842                                                         /* Is it a real user or just a self loop ? */
 843                                                         break;
 844                                                 }
 845                                         }
 846                                         if (k >= 0)
 847                                                 in[j++] = ka;
 848                                 } else
 849                                         in[j++] = ka;
 850                         }
 851                         if (j != n) {
 852                                 set_End_keepalives(end, j, in);
 853                                 env.changed = 1;
 854                         }
 855                 }
 856         }
 857
 858         if (env.changed) {
 859                 /* Handle graph state if was changed. */
 860                 set_irg_outs_inconsistent(irg);
 861                 set_irg_doms_inconsistent(irg);
 862                 set_irg_extblk_inconsistent(irg);
 863                 set_irg_loopinfo_inconsistent(irg);
 864                 set_irg_entity_usage_state(irg, ir_entity_usage_not_computed);
 865         }
 866
 867
 868         /* the verifier doesn't work yet with floating nodes */
 869         if (get_irg_pinned(irg) == op_pin_state_pinned) {
 870                 /* after optimize_cf(), only Bad data flow may remain. */
 871                 if (irg_verify_bads(irg, BAD_DF | BAD_BLOCK | TUPLE)) {
 872                         dump_ir_graph(irg, "-verify-cf");
 873                         fprintf(stderr, "VERIFY_BAD in optimize_cf()\n");
 874                 }
 875         }
 876 }
 877
 878 /* Creates an ir_graph pass for optimize_cf. */
 879 ir_graph_pass_t *optimize_cf_pass(const char *name)
 880 {
 881         return def_graph_pass(name ? name : "optimize_cf", optimize_cf);
 882 }  /* optimize_cf_pass */