nsz Git - libfirm/blob - ir/opt/return.c

   1 /*
   2  * Project:     libFIRM
   3  * File name:   ir/opt/return.c
   4  * Purpose:     normalize returns
   5  * Author:
   6  * Created:
   7  * CVS-ID:      $Id$
   8  * Copyright:   (c) 1998-2005 Universität Karlsruhe
   9  * Licence:     This file protected by GPL -  GNU GENERAL PUBLIC LICENSE.
  10  */
  11 #ifdef HAVE_CONFIG_H
  12 #include "config.h"
  13 #endif
  14
  15 #ifdef HAVE_ALLOCA_H
  16 # include <alloca.h>
  17 #endif
  18 #ifdef HAVE_MALLOC_H
  19 # include <malloc.h>
  20 #endif
  21
  22 #include "irgraph_t.h"
  23 #include "ircons_t.h"
  24 #include "irnode_t.h"
  25 #include "irgmod.h"
  26
  27 #define set_bit(n)      (returns[(n) >> 3] |= 1 << ((n) & 7))
  28 #define get_bit(n)      (returns[(n) >> 3] & (1 << ((n) & 7)))
  29
  30 #undef IMAX
  31 #define IMAX(a, b)       ((a) > (b) ? (a) : (b))
  32
  33 /*
  34  * Normalize the Returns of a graph by creating a new End block
  35  * with One Return(Phi).
  36  * This is the prefered input for the if-conversion.
  37  *
  38  * In pseudocode, it means:
  39  *
  40  * if (a)
  41  *   return b;
  42  * else
  43  *   return c;
  44  *
  45  * is transformed into
  46  *
  47  * if (a)
  48  *   res = b;
  49  * else
  50  *   res = c;
  51  * return res;
  52  */
  53 void normalize_one_return(ir_graph *irg)
  54 {
  55   ir_node *endbl = get_irg_end_block(irg);
  56   int i, j, k, n, last_idx, n_rets, n_ret_vals = -1;
  57   unsigned char *returns;
  58   ir_node **in, **retvals;
  59
  60   ir_node *block, *new_ret;
  61
  62   /* look, if we have more than one return */
  63   n       = get_Block_n_cfgpreds(endbl);
  64   returns = alloca((n + 7) >> 3);
  65   memset(returns, 0, (n + 7) >> 3);
  66
  67   for (n_rets = i = 0; i < n; ++i) {
  68     ir_node *node = get_Block_cfgpred(endbl, i);
  69
  70     if (get_irn_op(node) == op_Return) {
  71       ++n_rets;
  72
  73       set_bit(i);
  74
  75       if (n_ret_vals < 0)
  76         n_ret_vals = get_irn_arity(node);
  77     }
  78   }
  79
  80   /* there should be at least one Return node in Firm */
  81   if (n_rets <= 1)
  82     return;
  83
  84   in      = alloca(sizeof(*in) * IMAX(n_rets, n_ret_vals));
  85   retvals = alloca(sizeof(*in) * n_rets * n_ret_vals);
  86
  87   for (j = i = 0; i < n; ++i) {
  88     if (get_bit(i)) {
  89       ir_node *ret  = get_Block_cfgpred(endbl, i);
  90       ir_node *block = get_nodes_block(ret);
  91
  92       /* create a new Jmp for every Ret and place the in in */
  93       in[j] = new_r_Jmp(irg, block);
  94
  95       /* save the return values and shuffle them */
  96       for (k = 0; k < n_ret_vals; ++k)
  97         retvals[j + k*n_ret_vals] = get_irn_n(ret, k);
  98
  99       ++j;
 100
 101       set_Block_cfgpred(endbl, i, new_r_Bad(irg));
 102       last_idx = i;
 103     }
 104   }
 105
 106   /* ok, create a new block with all created in's */
 107   block = new_r_Block(irg, n_rets, in);
 108
 109   /* now create the Phi nodes */
 110   for (j = i = 0; i < n_ret_vals; ++i, j += n_rets) {
 111     /* the return values are already shuffled */
 112     in[i] = new_r_Phi(irg, block, n_rets, &retvals[j], get_irn_mode(retvals[j]));
 113   }
 114
 115   new_ret = new_r_Return(irg, block, in[0], n_ret_vals-1, &in[1]);
 116
 117   set_Block_cfgpred(endbl, last_idx, new_ret);
 118
 119   /* invalidate analysis information:
 120    * a new Block was added, so dominator, outs and loop are inconsistent,
 121    * trouts and callee-state should be still valid
 122    */
 123   set_irg_dom_inconsistent(irg);
 124   set_irg_outs_inconsistent(irg);
 125   set_irg_loopinfo_state(current_ir_graph, loopinfo_cf_inconsistent);
 126 }
 127
 128 /**
 129  * check, whether a Ret can be moved on block upwards.
 130  *
 131  * In a block with a Return, all live nodes must be linked
 132  * with the Return, otherwise they are dead (because the Return leaves
 133  * the graph, so no more users of the other nodes can exists.
 134  *
 135  * We can move a Return, if it's predecessors are Phi nodes or
 136  * comes from another block. In the later case, it is always possible
 137  * to move the Return one block up, because the predecessor block must
 138  * dominate the Return block (SSA) and then it dominates the predecessor
 139  * block of the Return block as well.
 140  *
 141  * All predecessors of the Return block must be Jmp's of course, or we
 142  * cannot move it up, so we check this either.
 143  */
 144 static int can_move_ret(ir_node *ret)
 145 {
 146   ir_node *retbl = get_nodes_block(ret);
 147   int i, n = get_irn_arity(ret);
 148
 149   for (i = 0; i < n; ++i) {
 150     ir_node *pred = get_irn_n(ret, i);
 151
 152     if (! is_Phi(pred) && retbl == get_nodes_block(pred)) {
 153       /* first condition failed, found a non-Phi predecessor
 154        * then is in the Return block */
 155       return 0;
 156     }
 157   }
 158
 159   /* check, that predecessors are Jmps */
 160   n = get_Block_n_cfgpreds(retbl);
 161   for (i = 0; i < n; ++i)
 162     if (get_irn_op(get_Block_cfgpred(retbl, i)) != op_Jmp)
 163       return 0;
 164
 165   /* if we have 0 control flow predecessors, we cannot move :-) */
 166   return n > 0;
 167 }
 168
 169 /*
 170  * Normalize the Returns of a graph by moving
 171  * the Returns upwards as much as possible.
 172  * This might be prefered for code generation.
 173  *
 174  * In pseudocode, it means:
 175  *
 176  * if (a)
 177  *   res = b;
 178  * else
 179  *   res = c;
 180  * return res;
 181  *
 182  * is transformed into
 183  *
 184  * if (a)
 185  *   return b;
 186  * else
 187  *   return c;
 188  */
 189 void normalize_n_returns(ir_graph *irg)
 190 {
 191   int i, j, n, n_rets, n_finals, n_ret_vals;
 192   ir_node *list  = NULL;
 193   ir_node *final = NULL;
 194   ir_node **in;
 195   ir_node *endbl = get_irg_end_block(irg);
 196   ir_node *end;
 197
 198   /* first, link all returns */
 199   n = get_Block_n_cfgpreds(endbl);
 200   for (n_finals = n_rets = i = 0; i < n; ++i) {
 201     ir_node *ret = get_Block_cfgpred(endbl, i);
 202
 203     if (get_irn_op(ret) == op_Return && can_move_ret(ret)) {
 204       /*
 205        * Ok, all conditions met, we can move this Return, put it
 206        * on our work list.
 207        */
 208       set_irn_link(ret, list);
 209       list = ret;
 210       ++n_rets;
 211     }
 212     else {
 213       /* Put all nodes that are not changed on the final list. */
 214       set_irn_link(ret, final);
 215       final = ret;
 216       ++n_finals;
 217     }
 218   }
 219
 220   if (n_rets <= 0)
 221     return;
 222
 223   /*
 224    * Now move the Returns upwards. We move always one block up (and create n
 225    * new Returns), than we check if a newly created Return can be moved even further.
 226    * If yes, we simply add it to our work list, else to the final list.
 227    */
 228   end        = get_irg_end(irg);
 229   n_ret_vals = get_irn_arity(list);
 230   in         = alloca(sizeof(*in) * n_ret_vals);
 231   while (list) {
 232     ir_node *ret   = list;
 233     ir_node *block = get_nodes_block(ret);
 234     ir_node *phiM;
 235
 236     list = get_irn_link(ret);
 237     --n_rets;
 238
 239     n = get_Block_n_cfgpreds(block);
 240     for (i = 0; i < n; ++i) {
 241       ir_node *jmp    = get_Block_cfgpred(block, i);
 242       ir_node *new_bl = get_nodes_block(jmp);
 243       ir_node *new_ret;
 244
 245       /* create the in-array for the new Ret */
 246       for (j = 0; j < n_ret_vals; ++j) {
 247         ir_node *pred = get_irn_n(ret, j);
 248
 249         in[j] = is_Phi(pred) ? get_Phi_pred(pred, i) : pred;
 250       }
 251
 252       new_ret = new_r_Return(irg, new_bl, in[0], n_ret_vals - 1, &in[1]);
 253
 254       if (! is_Bad(new_ret)) {
 255         /*
 256          * The newly created node might be bad, if we
 257          * create it in a block with only Bad predecessors.
 258          * In that case ignore this block.
 259          *
 260          * We could even kill the jmp then ...
 261          */
 262         if (can_move_ret(new_ret)) {
 263           set_irn_link(new_ret, list);
 264           list = new_ret;
 265           ++n_rets;
 266         }
 267         else {
 268           set_irn_link(new_ret, final);
 269           final = new_ret;
 270           ++n_finals;
 271         }
 272       }
 273     }
 274
 275     /*
 276      * if the memory of the old Return is a PhiM, remove it
 277      * from the keep-alives, or it will keep the block which
 278      * will crash the dominator algorithm.
 279      */
 280     phiM = get_Return_mem(ret);
 281     if (is_Phi(phiM)) {
 282       n = get_End_n_keepalives(end);
 283       for (i = 0; i < n; ++i) {
 284         if (get_End_keepalive(end, i) == phiM) {
 285           set_End_keepalive(end, i, new_r_Bad(irg));
 286           break;
 287         }
 288       }
 289     }
 290   }
 291
 292   /*
 293    * Last step: Create a new endblock, with all nodes on the final
 294    * list as predecessors.
 295    */
 296   in = alloca(sizeof(*in) * n_finals);
 297
 298   for (i = 0; final; ++i, final = get_irn_link(final))
 299     in[i] = final;
 300
 301   exchange(endbl, new_r_Block(irg, n_finals, in));
 302
 303   /* the end block is not automatically skiped, so do it here */
 304   set_irg_end_block(irg, skip_Id(get_irg_end_block(irg)));
 305
 306   /* Invalidate analysis information:
 307    * Blocks become dead and new Eeturns were deleted, so dominator, outs and loop are inconsistent,
 308    * trouts and callee-state should be still valid
 309    */
 310   set_irg_dom_inconsistent(irg);
 311   set_irg_outs_inconsistent(irg);
 312   set_irg_loopinfo_state(current_ir_graph, loopinfo_cf_inconsistent);
 313 }