nsz Git - libfirm/blob - ir/ir/iropt.c

   1 /*
   2  * Project:     libFIRM
   3  * File name:   ir/ir/iropt.c
   4  * Purpose:     iropt --- optimizations intertwined with IR construction.
   5  * Author:      Christian Schaefer
   6  * Modified by: Goetz Lindenmaier, Michael Beck
   7  * Created:
   8  * CVS-ID:      $Id$
   9  * Copyright:   (c) 1998-2005 Universität Karlsruhe
  10  * Licence:     This file protected by GPL -  GNU GENERAL PUBLIC LICENSE.
  11  */
  12
  13 #ifdef HAVE_CONFIG_H
  14 # include "config.h"
  15 #endif
  16
  17 #ifdef HAVE_ALLOCA_H
  18 #include <alloca.h>
  19 #endif
  20 #ifdef HAVE_MALLOC_H
  21 #include <malloc.h>
  22 #endif
  23 #ifdef HAVE_STRING_H
  24 #include <string.h>
  25 #endif
  26
  27 #include "irnode_t.h"
  28 #include "irgraph_t.h"
  29 #include "iredges_t.h"
  30 #include "irmode_t.h"
  31 #include "iropt_t.h"
  32 #include "ircons_t.h"
  33 #include "irgmod.h"
  34 #include "irvrfy.h"
  35 #include "tv_t.h"
  36 #include "dbginfo_t.h"
  37 #include "iropt_dbg.h"
  38 #include "irflag_t.h"
  39 #include "irhooks.h"
  40 #include "irarch.h"
  41 #include "hashptr.h"
  42 #include "archop.h"
  43 #include "opt_polymorphy.h"
  44 #include "opt_confirms.h"
  45
  46 /* Make types visible to allow most efficient access */
  47 # include "entity_t.h"
  48
  49 /**
  50  * return the value of a Constant
  51  */
  52 static tarval *computed_value_Const(ir_node *n)
  53 {
  54   return get_Const_tarval(n);
  55 }
  56
  57 /**
  58  * return the value of a 'sizeof' SymConst
  59  */
  60 static tarval *computed_value_SymConst(ir_node *n)
  61 {
  62   ir_type *type;
  63
  64   switch (get_SymConst_kind(n)) {
  65   case symconst_type_size:
  66     type = get_SymConst_type(n);
  67     if (get_type_state(type) == layout_fixed)
  68       return new_tarval_from_long(get_type_size_bytes(type), get_irn_mode(n));
  69     break;
  70   case symconst_type_align:
  71     type = get_SymConst_type(n);
  72     if (get_type_state(type) == layout_fixed)
  73       return new_tarval_from_long(get_type_alignment_bytes(type), get_irn_mode(n));
  74     break;
  75   default:
  76     break;
  77   }
  78   return tarval_bad;
  79 }
  80
  81 /**
  82  * return the value of an Add
  83  */
  84 static tarval *computed_value_Add(ir_node *n)
  85 {
  86   ir_node *a = get_Add_left(n);
  87   ir_node *b = get_Add_right(n);
  88
  89   tarval *ta = value_of(a);
  90   tarval *tb = value_of(b);
  91
  92   if ((ta != tarval_bad) && (tb != tarval_bad) && (get_irn_mode(a) == get_irn_mode(b)))
  93     return tarval_add(ta, tb);
  94
  95   return tarval_bad;
  96 }
  97
  98 /**
  99  * return the value of a Sub
 100  * Special case: a - a
 101  */
 102 static tarval *computed_value_Sub(ir_node *n)
 103 {
 104   ir_node *a = get_Sub_left(n);
 105   ir_node *b = get_Sub_right(n);
 106   tarval *ta;
 107   tarval *tb;
 108
 109   /* a - a */
 110   if (a == b && !is_Bad(a))
 111     return get_mode_null(get_irn_mode(n));
 112
 113   ta = value_of(a);
 114   tb = value_of(b);
 115
 116   if ((ta != tarval_bad) && (tb != tarval_bad) && (get_irn_mode(a) == get_irn_mode(b)))
 117     return tarval_sub(ta, tb);
 118
 119   return tarval_bad;
 120 }
 121
 122 /**
 123  * return the value of a Carry
 124  * Special : a op 0, 0 op b
 125  */
 126 static tarval *computed_value_Carry(ir_node *n)
 127 {
 128   ir_node *a = get_binop_left(n);
 129   ir_node *b = get_binop_right(n);
 130   ir_mode *m = get_irn_mode(n);
 131
 132   tarval *ta = value_of(a);
 133   tarval *tb = value_of(b);
 134
 135   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 136     tarval_add(ta, tb);
 137     return tarval_carry() ? get_mode_one(m) : get_mode_null(m);
 138   } else {
 139     if (   (classify_tarval(ta) == TV_CLASSIFY_NULL)
 140         || (classify_tarval(tb) == TV_CLASSIFY_NULL))
 141       return get_mode_null(m);
 142   }
 143   return tarval_bad;
 144 }
 145
 146 /**
 147  * return the value of a Borrow
 148  * Special : a op 0
 149  */
 150 static tarval *computed_value_Borrow(ir_node *n)
 151 {
 152   ir_node *a = get_binop_left(n);
 153   ir_node *b = get_binop_right(n);
 154   ir_mode *m = get_irn_mode(n);
 155
 156   tarval *ta = value_of(a);
 157   tarval *tb = value_of(b);
 158
 159   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 160     return tarval_cmp(ta, tb) == pn_Cmp_Lt ? get_mode_one(m) : get_mode_null(m);
 161   } else if (classify_tarval(ta) == TV_CLASSIFY_NULL) {
 162       return get_mode_null(m);
 163   }
 164   return tarval_bad;
 165 }
 166
 167 /**
 168  * return the value of an unary Minus
 169  */
 170 static tarval *computed_value_Minus(ir_node *n)
 171 {
 172   ir_node *a = get_Minus_op(n);
 173   tarval *ta = value_of(a);
 174
 175   if ((ta != tarval_bad) && mode_is_signed(get_irn_mode(a)))
 176     return tarval_neg(ta);
 177
 178   return tarval_bad;
 179 }
 180
 181 /**
 182  * return the value of a Mul
 183  */
 184 static tarval *computed_value_Mul(ir_node *n)
 185 {
 186   ir_node *a = get_Mul_left(n);
 187   ir_node *b = get_Mul_right(n);
 188
 189   tarval *ta = value_of(a);
 190   tarval *tb = value_of(b);
 191
 192   if ((ta != tarval_bad) && (tb != tarval_bad) && (get_irn_mode(a) == get_irn_mode(b))) {
 193     return tarval_mul(ta, tb);
 194   } else {
 195     /* a*0 = 0 or 0*b = 0:
 196        calls computed_value recursive and returns the 0 with proper
 197        mode. */
 198     if ((ta != tarval_bad) && (ta == get_mode_null(get_tarval_mode(ta))))
 199       return ta;
 200     if ((tb != tarval_bad) && (tb == get_mode_null(get_tarval_mode(tb))))
 201       return tb;
 202   }
 203   return tarval_bad;
 204 }
 205
 206 /**
 207  * return the value of a floating point Quot
 208  */
 209 static tarval *computed_value_Quot(ir_node *n)
 210 {
 211   ir_node *a = get_Quot_left(n);
 212   ir_node *b = get_Quot_right(n);
 213
 214   tarval *ta = value_of(a);
 215   tarval *tb = value_of(b);
 216
 217   /* This was missing in original implementation. Why? */
 218   if ((ta != tarval_bad) && (tb != tarval_bad) && (get_irn_mode(a) == get_irn_mode(b))) {
 219     if (tb != get_mode_null(get_tarval_mode(tb)))   /* div by zero: return tarval_bad */
 220       return tarval_quo(ta, tb);
 221   }
 222   return tarval_bad;
 223 }
 224
 225 /**
 226  * calculate the value of an integer Div of two nodes
 227  * Special case: 0 / b
 228  */
 229 static tarval *do_computed_value_Div(ir_node *a, ir_node *b)
 230 {
 231   tarval *ta = value_of(a);
 232   tarval *tb = value_of(b);
 233
 234   /* Compute c1 / c2 or 0 / a, a != 0 */
 235   if (ta != tarval_bad) {
 236     if ((tb != tarval_bad) && (tb != get_mode_null(get_irn_mode(b))))   /* div by zero: return tarval_bad */
 237       return tarval_div(ta, tb);
 238     else if (ta == get_mode_null(get_tarval_mode(ta)))  /* 0 / b == 0 */
 239       return ta;
 240   }
 241   return tarval_bad;
 242 }
 243
 244 /**
 245  * return the value of an integer Div
 246  */
 247 static tarval *computed_value_Div(ir_node *n)
 248 {
 249   return do_computed_value_Div(get_Div_left(n), get_Div_right(n));
 250 }
 251
 252 /**
 253  * calculate the value of an integer Mod of two nodes
 254  * Special case: a % 1
 255  */
 256 static tarval *do_computed_value_Mod(ir_node *a, ir_node *b)
 257 {
 258   tarval *ta = value_of(a);
 259   tarval *tb = value_of(b);
 260
 261   /* Compute c1 % c2 or a % 1 */
 262   if (tb != tarval_bad) {
 263     if ((ta != tarval_bad) && (tb != get_mode_null(get_tarval_mode(tb))))   /* div by zero: return tarval_bad */
 264       return tarval_mod(ta, tb);
 265     else if (tb == get_mode_one(get_tarval_mode(tb)))    /* x mod 1 == 0 */
 266       return get_mode_null(get_irn_mode(a));
 267   }
 268
 269   return tarval_bad;
 270 }
 271
 272 /**
 273  * return the value of an integer Mod
 274  */
 275 static tarval *computed_value_Mod(ir_node *n)
 276 {
 277   return do_computed_value_Mod(get_Mod_left(n), get_Mod_right(n));
 278 }
 279
 280 /**
 281  * return the value of an Abs
 282  */
 283 static tarval *computed_value_Abs(ir_node *n)
 284 {
 285   ir_node *a = get_Abs_op(n);
 286   tarval *ta = value_of(a);
 287
 288   if (ta != tarval_bad)
 289     return tarval_abs(ta);
 290
 291   return tarval_bad;
 292 }
 293
 294 /**
 295  * return the value of an And
 296  * Special case: a & 0, 0 & b
 297  */
 298 static tarval *computed_value_And(ir_node *n)
 299 {
 300   ir_node *a = get_And_left(n);
 301   ir_node *b = get_And_right(n);
 302
 303   tarval *ta = value_of(a);
 304   tarval *tb = value_of(b);
 305
 306   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 307     return tarval_and (ta, tb);
 308   } else {
 309     tarval *v;
 310
 311     if (   (classify_tarval ((v = ta)) == TV_CLASSIFY_NULL)
 312         || (classify_tarval ((v = tb)) == TV_CLASSIFY_NULL)) {
 313       return v;
 314     }
 315   }
 316   return tarval_bad;
 317 }
 318
 319 /**
 320  * return the value of an Or
 321  * Special case: a | 1...1, 1...1 | b
 322  */
 323 static tarval *computed_value_Or(ir_node *n)
 324 {
 325   ir_node *a = get_Or_left(n);
 326   ir_node *b = get_Or_right(n);
 327
 328   tarval *ta = value_of(a);
 329   tarval *tb = value_of(b);
 330
 331   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 332     return tarval_or (ta, tb);
 333   } else {
 334     tarval *v;
 335     if (   (classify_tarval ((v = ta)) == TV_CLASSIFY_ALL_ONE)
 336         || (classify_tarval ((v = tb)) == TV_CLASSIFY_ALL_ONE)) {
 337       return v;
 338     }
 339   }
 340   return tarval_bad;
 341 }
 342
 343 /**
 344  * return the value of an Eor
 345  */
 346 static tarval *computed_value_Eor(ir_node *n)
 347 {
 348   ir_node *a = get_Eor_left(n);
 349   ir_node *b = get_Eor_right(n);
 350
 351   tarval *ta, *tb;
 352
 353   if (a == b)
 354     return get_mode_null(get_irn_mode(n));
 355
 356   ta = value_of(a);
 357   tb = value_of(b);
 358
 359   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 360     return tarval_eor (ta, tb);
 361   }
 362   return tarval_bad;
 363 }
 364
 365 /**
 366  * return the value of a Not
 367  */
 368 static tarval *computed_value_Not(ir_node *n)
 369 {
 370   ir_node *a = get_Not_op(n);
 371   tarval *ta = value_of(a);
 372
 373   if (ta != tarval_bad)
 374     return tarval_not(ta);
 375
 376   return tarval_bad;
 377 }
 378
 379 /**
 380  * return the value of a Shl
 381  */
 382 static tarval *computed_value_Shl(ir_node *n)
 383 {
 384   ir_node *a = get_Shl_left(n);
 385   ir_node *b = get_Shl_right(n);
 386
 387   tarval *ta = value_of(a);
 388   tarval *tb = value_of(b);
 389
 390   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 391     return tarval_shl (ta, tb);
 392   }
 393   return tarval_bad;
 394 }
 395
 396 /**
 397  * return the value of a Shr
 398  */
 399 static tarval *computed_value_Shr(ir_node *n)
 400 {
 401   ir_node *a = get_Shr_left(n);
 402   ir_node *b = get_Shr_right(n);
 403
 404   tarval *ta = value_of(a);
 405   tarval *tb = value_of(b);
 406
 407   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 408     return tarval_shr (ta, tb);
 409   }
 410   return tarval_bad;
 411 }
 412
 413 /**
 414  * return the value of a Shrs
 415  */
 416 static tarval *computed_value_Shrs(ir_node *n)
 417 {
 418   ir_node *a = get_Shrs_left(n);
 419   ir_node *b = get_Shrs_right(n);
 420
 421   tarval *ta = value_of(a);
 422   tarval *tb = value_of(b);
 423
 424   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 425     return tarval_shrs (ta, tb);
 426   }
 427   return tarval_bad;
 428 }
 429
 430 /**
 431  * return the value of a Rot
 432  */
 433 static tarval *computed_value_Rot(ir_node *n)
 434 {
 435   ir_node *a = get_Rot_left(n);
 436   ir_node *b = get_Rot_right(n);
 437
 438   tarval *ta = value_of(a);
 439   tarval *tb = value_of(b);
 440
 441   if ((ta != tarval_bad) && (tb != tarval_bad)) {
 442     return tarval_rot (ta, tb);
 443   }
 444   return tarval_bad;
 445 }
 446
 447 /**
 448  * return the value of a Conv
 449  */
 450 static tarval *computed_value_Conv(ir_node *n)
 451 {
 452   ir_node *a = get_Conv_op(n);
 453   tarval *ta = value_of(a);
 454
 455   if (ta != tarval_bad)
 456     return tarval_convert_to(ta, get_irn_mode(n));
 457
 458   return tarval_bad;
 459 }
 460
 461 /**
 462  * return the value of a Proj(Cmp)
 463  *
 464  * This performs a first step of unreachable code elimination.
 465  * Proj can not be computed, but folding a Cmp above the Proj here is
 466  * not as wasteful as folding a Cmp into a Tuple of 16 Consts of which
 467  * only 1 is used.
 468  * There are several case where we can evaluate a Cmp node, see later.
 469  */
 470 static tarval *computed_value_Proj_Cmp(ir_node *n)
 471 {
 472   ir_node *a   = get_Proj_pred(n);
 473   ir_node *aa  = get_Cmp_left(a);
 474   ir_node *ab  = get_Cmp_right(a);
 475   long proj_nr = get_Proj_proj(n);
 476
 477   /*
 478    * BEWARE: a == a is NOT always True for floating Point values, as
 479    * NaN != NaN is defined, so we must check this here.
 480    */
 481   if (aa == ab && (
 482       !mode_is_float(get_irn_mode(aa)) || proj_nr == pn_Cmp_Lt ||  proj_nr == pn_Cmp_Gt)
 483       ) { /* 1.: */
 484
 485     /* This is a trick with the bits used for encoding the Cmp
 486        Proj numbers, the following statement is not the same:
 487     return new_tarval_from_long (proj_nr == pn_Cmp_Eq, mode_b) */
 488     return new_tarval_from_long (proj_nr & pn_Cmp_Eq, mode_b);
 489   }
 490   else {
 491     tarval *taa = value_of(aa);
 492     tarval *tab = value_of(ab);
 493     ir_mode *mode = get_irn_mode(aa);
 494
 495     /*
 496      * The predecessors of Cmp are target values.  We can evaluate
 497      * the Cmp.
 498      */
 499     if ((taa != tarval_bad) && (tab != tarval_bad)) {
 500       /* strange checks... */
 501       pn_Cmp flags = tarval_cmp(taa, tab);
 502       if (flags != pn_Cmp_False) {
 503         return new_tarval_from_long (proj_nr & flags, mode_b);
 504       }
 505     }
 506     /* for integer values, we can check against MIN/MAX */
 507     else if (mode_is_int(mode)) {
 508       /* MIN <=/> x.  This results in true/false. */
 509       if (taa == get_mode_min(mode)) {
 510         /* a compare with the MIN value */
 511         if (proj_nr == pn_Cmp_Le)
 512           return get_tarval_b_true();
 513         else if (proj_nr == pn_Cmp_Gt)
 514           return get_tarval_b_false();
 515       }
 516       /* x >=/< MIN.  This results in true/false. */
 517       else
 518       if (tab == get_mode_min(mode)) {
 519         /* a compare with the MIN value */
 520         if (proj_nr == pn_Cmp_Ge)
 521           return get_tarval_b_true();
 522         else if (proj_nr == pn_Cmp_Lt)
 523           return get_tarval_b_false();
 524       }
 525       /* MAX >=/< x.  This results in true/false. */
 526       else if (taa == get_mode_max(mode)) {
 527         if (proj_nr == pn_Cmp_Ge)
 528           return get_tarval_b_true();
 529         else if (proj_nr == pn_Cmp_Lt)
 530           return get_tarval_b_false();
 531       }
 532       /* x <=/> MAX.  This results in true/false. */
 533       else if (tab == get_mode_max(mode)) {
 534         if (proj_nr == pn_Cmp_Le)
 535           return get_tarval_b_true();
 536         else if (proj_nr == pn_Cmp_Gt)
 537           return get_tarval_b_false();
 538       }
 539     }
 540     /*
 541      * The predecessors are Allocs or (void*)(0) constants.  Allocs never
 542      * return NULL, they raise an exception.   Therefore we can predict
 543      * the Cmp result.
 544      */
 545     else {
 546       ir_node *aaa = skip_Id(skip_Proj(aa));
 547       ir_node *aba = skip_Id(skip_Proj(ab));
 548
 549       if (   (   (/* aa is ProjP and aaa is Alloc */
 550                      (get_irn_op(aa) == op_Proj)
 551                   && (mode_is_reference(get_irn_mode(aa)))
 552                   && (get_irn_op(aaa) == op_Alloc))
 553               && (   (/* ab is NULL */
 554                          (get_irn_op(ab) == op_Const)
 555                       && (mode_is_reference(get_irn_mode(ab)))
 556                       && (get_Const_tarval(ab) == get_mode_null(get_irn_mode(ab))))
 557                   || (/* ab is other Alloc */
 558                          (get_irn_op(ab) == op_Proj)
 559                       && (mode_is_reference(get_irn_mode(ab)))
 560                       && (get_irn_op(aba) == op_Alloc)
 561                       && (aaa != aba))))
 562           || (/* aa is NULL and aba is Alloc */
 563                  (get_irn_op(aa) == op_Const)
 564               && (mode_is_reference(get_irn_mode(aa)))
 565               && (get_Const_tarval(aa) == get_mode_null(get_irn_mode(aa)))
 566               && (get_irn_op(ab) == op_Proj)
 567               && (mode_is_reference(get_irn_mode(ab)))
 568               && (get_irn_op(aba) == op_Alloc)))
 569         /* 3.: */
 570         return new_tarval_from_long(proj_nr & pn_Cmp_Ne, mode_b);
 571     }
 572   }
 573   return computed_value_Cmp_Confirm(a, aa, ab, proj_nr);
 574 }
 575
 576 /**
 577  * return the value of a Proj, handle Proj(Cmp), Proj(Div), Proj(Mod), Proj(DivMod)
 578  */
 579 static tarval *computed_value_Proj(ir_node *n)
 580 {
 581   ir_node *a = get_Proj_pred(n);
 582   long proj_nr;
 583
 584   switch (get_irn_opcode(a)) {
 585   case iro_Cmp:
 586     return computed_value_Proj_Cmp(n);
 587
 588   case iro_DivMod:
 589     /* compute either the Div or the Mod part */
 590     proj_nr = get_Proj_proj(n);
 591     if (proj_nr == pn_DivMod_res_div)
 592       return do_computed_value_Div(get_DivMod_left(a), get_DivMod_right(a));
 593     else if (proj_nr == pn_DivMod_res_mod)
 594       return do_computed_value_Mod(get_DivMod_left(a), get_DivMod_right(a));
 595     break;
 596
 597   case iro_Div:
 598     if (get_Proj_proj(n) == pn_Div_res)
 599       return computed_value(a);
 600     break;
 601
 602   case iro_Mod:
 603     if (get_Proj_proj(n) == pn_Mod_res)
 604       return computed_value(a);
 605     break;
 606
 607   default:
 608     return tarval_bad;
 609   }
 610   return tarval_bad;
 611 }
 612
 613 /**
 614  * calculate the value of a Mux: can be evaluated, if the
 615  * sel and the right input are known
 616  */
 617 static tarval *computed_value_Mux(ir_node *n)
 618 {
 619   ir_node *sel = get_Mux_sel(n);
 620   tarval *ts = value_of(sel);
 621
 622   if (ts == get_tarval_b_true()) {
 623     ir_node *v = get_Mux_true(n);
 624     return value_of(v);
 625   }
 626   else if (ts == get_tarval_b_false()) {
 627     ir_node *v = get_Mux_false(n);
 628     return value_of(v);
 629   }
 630   return tarval_bad;
 631 }
 632
 633 /**
 634  * Calculate the value of a Psi: can be evaluated, if a condition is true
 635  * and all previous conditions are false. If all conditions are false
 636  * we evaluate to the default one.
 637  */
 638 static tarval *computed_value_Psi(ir_node *n)
 639 {
 640   if (is_Mux(n))
 641     return computed_value_Mux(n);
 642   return tarval_bad;
 643 }
 644
 645 /**
 646  * calculate the value of a Confirm: can be evaluated,
 647  * if it has the form Confirm(x, '=', Const).
 648  */
 649 static tarval *computed_value_Confirm(ir_node *n)
 650 {
 651   return get_Confirm_cmp(n) == pn_Cmp_Eq ?
 652     value_of(get_Confirm_bound(n)) : tarval_bad;
 653 }
 654
 655 /**
 656  * If the parameter n can be computed, return its value, else tarval_bad.
 657  * Performs constant folding.
 658  *
 659  * @param n  The node this should be evaluated
 660  */
 661 tarval *computed_value(ir_node *n)
 662 {
 663   if (n->op->ops.computed_value)
 664     return n->op->ops.computed_value(n);
 665   return tarval_bad;
 666 }
 667
 668 /**
 669  * set the default computed_value evaluator in an ir_op_ops.
 670  *
 671  * @param code   the opcode for the default operation
 672  * @param ops    the operations initialized
 673  *
 674  * @return
 675  *    The operations.
 676  */
 677 static ir_op_ops *firm_set_default_computed_value(opcode code, ir_op_ops *ops)
 678 {
 679 #define CASE(a)                               \
 680   case iro_##a:                               \
 681     ops->computed_value  = computed_value_##a; \
 682     break
 683
 684   switch (code) {
 685   CASE(Const);
 686   CASE(SymConst);
 687   CASE(Add);
 688   CASE(Sub);
 689   CASE(Minus);
 690   CASE(Mul);
 691   CASE(Quot);
 692   CASE(Div);
 693   CASE(Mod);
 694   CASE(Abs);
 695   CASE(And);
 696   CASE(Or);
 697   CASE(Eor);
 698   CASE(Not);
 699   CASE(Shl);
 700   CASE(Shr);
 701   CASE(Shrs);
 702   CASE(Rot);
 703   CASE(Carry);
 704   CASE(Borrow);
 705   CASE(Conv);
 706   CASE(Proj);
 707   CASE(Mux);
 708   CASE(Psi);
 709   CASE(Confirm);
 710   default:
 711     /* leave NULL */;
 712   }
 713
 714   return ops;
 715 #undef CASE
 716 }
 717
 718 /**
 719  * Returns a equivalent block for another block.
 720  * If the block has only one predecessor, this is
 721  * the equivalent one. If the only predecessor of a block is
 722  * the block itself, this is a dead block.
 723  *
 724  * If both predecessors of a block are the branches of a binary
 725  * Cond, the equivalent block is Cond's block.
 726  *
 727  * If all predecessors of a block are bad or lies in a dead
 728  * block, the current block is dead as well.
 729  *
 730  * Note, that blocks are NEVER turned into Bad's, instead
 731  * the dead_block flag is set. So, never test for is_Bad(block),
 732  * always use is_dead_Block(block).
 733  */
 734 static ir_node *equivalent_node_Block(ir_node *n)
 735 {
 736   ir_node *oldn = n;
 737   int n_preds   = get_Block_n_cfgpreds(n);
 738
 739   /* The Block constructor does not call optimize, but mature_immBlock
 740      calls the optimization. */
 741   assert(get_Block_matured(n));
 742
 743   /* Straightening: a single entry Block following a single exit Block
 744      can be merged, if it is not the Start block. */
 745   /* !!! Beware, all Phi-nodes of n must have been optimized away.
 746      This should be true, as the block is matured before optimize is called.
 747      But what about Phi-cycles with the Phi0/Id that could not be resolved?
 748      Remaining Phi nodes are just Ids. */
 749    if ((n_preds == 1) && (get_irn_op(get_Block_cfgpred(n, 0)) == op_Jmp)) {
 750      ir_node *predblock = get_nodes_block(get_Block_cfgpred(n, 0));
 751      if (predblock == oldn) {
 752        /* Jmp jumps into the block it is in -- deal self cycle. */
 753        n = set_Block_dead(n);
 754        DBG_OPT_DEAD_BLOCK(oldn, n);
 755      } else if (get_opt_control_flow_straightening()) {
 756        n = predblock;
 757        DBG_OPT_STG(oldn, n);
 758      }
 759    }
 760    else if ((n_preds == 1) &&
 761             (get_irn_op(skip_Proj(get_Block_cfgpred(n, 0))) == op_Cond)) {
 762      ir_node *predblock = get_Block_cfgpred_block(n, 0);
 763      if (predblock == oldn) {
 764        /* Jmp jumps into the block it is in -- deal self cycle. */
 765        n = set_Block_dead(n);
 766        DBG_OPT_DEAD_BLOCK(oldn, n);
 767      }
 768    }
 769    else if ((n_preds == 2) &&
 770             (get_opt_control_flow_weak_simplification())) {
 771     /* Test whether Cond jumps twice to this block
 772      * The more general case which more than 2 predecessors is handles
 773      * in optimize_cf(), we handle only this special case for speed here.
 774      */
 775     ir_node *a = get_Block_cfgpred(n, 0);
 776     ir_node *b = get_Block_cfgpred(n, 1);
 777
 778     if ((get_irn_op(a) == op_Proj) &&
 779         (get_irn_op(b) == op_Proj) &&
 780         (get_Proj_pred(a) == get_Proj_pred(b)) &&
 781         (get_irn_op(get_Proj_pred(a)) == op_Cond) &&
 782         (get_irn_mode(get_Cond_selector(get_Proj_pred(a))) == mode_b)) {
 783       /* Also a single entry Block following a single exit Block.  Phis have
 784          twice the same operand and will be optimized away. */
 785       n = get_nodes_block(get_Proj_pred(a));
 786       DBG_OPT_IFSIM1(oldn, a, b, n);
 787     }
 788   }
 789   else if (get_opt_unreachable_code() &&
 790            (n != get_irg_start_block(current_ir_graph)) &&
 791            (n != get_irg_end_block(current_ir_graph))    ) {
 792     int i;
 793
 794     /* If all inputs are dead, this block is dead too, except if it is
 795        the start or end block.  This is one step of unreachable code
 796        elimination */
 797     for (i = get_Block_n_cfgpreds(n) - 1; i >= 0; --i) {
 798       ir_node *pred = get_Block_cfgpred(n, i);
 799       ir_node *pred_blk;
 800
 801       if (is_Bad(pred)) continue;
 802       pred_blk = get_nodes_block(skip_Proj(pred));
 803
 804       if (is_Block_dead(pred_blk)) continue;
 805
 806       if (pred_blk != n) {
 807         /* really found a living input */
 808         break;
 809       }
 810     }
 811     if (i < 0) {
 812       n = set_Block_dead(n);
 813       DBG_OPT_DEAD_BLOCK(oldn, n);
 814     }
 815   }
 816
 817   return n;
 818 }
 819
 820 /**
 821  * Returns a equivalent node for a Jmp, a Bad :-)
 822  * Of course this only happens if the Block of the Jmp is dead.
 823  */
 824 static ir_node *equivalent_node_Jmp(ir_node *n)
 825 {
 826   /* unreachable code elimination */
 827   if (is_Block_dead(get_nodes_block(n)))
 828     n = new_Bad();
 829
 830   return n;
 831 }
 832
 833 /** Raise is handled in the same way as Jmp. */
 834 #define equivalent_node_Raise   equivalent_node_Jmp
 835
 836
 837 /* We do not evaluate Cond here as we replace it by a new node, a Jmp.
 838    See transform_node_Proj_Cond(). */
 839
 840 /**
 841  * optimize operations that are commutative and have neutral 0,
 842  * so a op 0 = 0 op a = a.
 843  */
 844 static ir_node *equivalent_node_neutral_zero(ir_node *n)
 845 {
 846   ir_node *oldn = n;
 847
 848   ir_node *a = get_binop_left(n);
 849   ir_node *b = get_binop_right(n);
 850
 851   tarval *tv;
 852   ir_node *on;
 853
 854   /* After running compute_node there is only one constant predecessor.
 855      Find this predecessors value and remember the other node: */
 856   if ((tv = value_of(a)) != tarval_bad) {
 857     on = b;
 858   } else if ((tv = value_of(b)) != tarval_bad) {
 859     on = a;
 860   } else
 861     return n;
 862
 863   /* If this predecessors constant value is zero, the operation is
 864    * unnecessary. Remove it.
 865    *
 866    * Beware: If n is a Add, the mode of on and n might be different
 867    * which happens in this rare construction: NULL + 3.
 868    * Then, a Conv would be needed which we cannot include here.
 869    */
 870   if (classify_tarval (tv) == TV_CLASSIFY_NULL) {
 871     if (get_irn_mode(on) == get_irn_mode(n)) {
 872       n = on;
 873
 874       DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_NEUTRAL_0);
 875     }
 876   }
 877
 878   return n;
 879 }
 880
 881 /**
 882  * Eor is commutative and has neutral 0.
 883  */
 884 #define equivalent_node_Eor  equivalent_node_neutral_zero
 885
 886 /*
 887  * Optimize a - 0 and (a - x) + x (for modes with wrap-around).
 888  *
 889  * The second one looks strange, but this construct
 890  * is used heavily in the LCC sources :-).
 891  *
 892  * Beware: The Mode of an Add may be different than the mode of its
 893  * predecessors, so we could not return a predecessors in all cases.
 894  */
 895 static ir_node *equivalent_node_Add(ir_node *n)
 896 {
 897   ir_node *oldn = n;
 898   ir_node *left, *right;
 899
 900   n = equivalent_node_neutral_zero(n);
 901   if (n != oldn)
 902     return n;
 903
 904   left  = get_Add_left(n);
 905   right = get_Add_right(n);
 906
 907   if (get_irn_op(left) == op_Sub) {
 908     if (get_Sub_right(left) == right) {
 909       /* (a - x) + x */
 910
 911       n = get_Sub_left(left);
 912       if (get_irn_mode(oldn) == get_irn_mode(n)) {
 913         DBG_OPT_ALGSIM1(oldn, left, right, n, FS_OPT_ADD_SUB);
 914         return n;
 915       }
 916     }
 917   }
 918   if (get_irn_op(right) == op_Sub) {
 919     if (get_Sub_right(right) == left) {
 920       /* x + (a - x) */
 921
 922       n = get_Sub_left(right);
 923       if (get_irn_mode(oldn) == get_irn_mode(n)) {
 924         DBG_OPT_ALGSIM1(oldn, left, right, n, FS_OPT_ADD_SUB);
 925         return n;
 926       }
 927     }
 928   }
 929   return n;
 930 }
 931
 932 /**
 933  * optimize operations that are not commutative but have neutral 0 on left,
 934  * so a op 0 = a.
 935  */
 936 static ir_node *equivalent_node_left_zero(ir_node *n)
 937 {
 938   ir_node *oldn = n;
 939
 940   ir_node *a = get_binop_left(n);
 941   ir_node *b = get_binop_right(n);
 942
 943   if (classify_tarval(value_of(b)) == TV_CLASSIFY_NULL) {
 944     n = a;
 945
 946     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_NEUTRAL_0);
 947   }
 948
 949   return n;
 950 }
 951
 952 #define equivalent_node_Shl   equivalent_node_left_zero
 953 #define equivalent_node_Shr   equivalent_node_left_zero
 954 #define equivalent_node_Shrs  equivalent_node_left_zero
 955 #define equivalent_node_Rot   equivalent_node_left_zero
 956
 957 /**
 958  * Optimize a - 0 and (a + x) - x (for modes with wrap-around).
 959  *
 960  * The second one looks strange, but this construct
 961  * is used heavily in the LCC sources :-).
 962  *
 963  * Beware: The Mode of a Sub may be different than the mode of its
 964  * predecessors, so we could not return a predecessors in all cases.
 965  */
 966 static ir_node *equivalent_node_Sub(ir_node *n)
 967 {
 968   ir_node *oldn = n;
 969
 970   ir_node *a = get_Sub_left(n);
 971   ir_node *b = get_Sub_right(n);
 972
 973   /* Beware: modes might be different */
 974   if (classify_tarval(value_of(b)) == TV_CLASSIFY_NULL) {
 975     if (get_irn_mode(n) == get_irn_mode(a)) {
 976       n = a;
 977
 978       DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_NEUTRAL_0);
 979     }
 980   }
 981   else if (get_irn_op(a) == op_Add) {
 982     ir_mode *mode = get_irn_mode(n);
 983
 984     if (mode_wrap_around(mode)) {
 985       ir_node *left  = get_Add_left(a);
 986       ir_node *right = get_Add_right(a);
 987
 988       if (left == b) {
 989         if (get_irn_mode(n) == get_irn_mode(right)) {
 990           n = right;
 991           DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_ADD_SUB);
 992         }
 993       }
 994       else if (right == b) {
 995         if (get_irn_mode(n) == get_irn_mode(left)) {
 996           n = left;
 997           DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_ADD_SUB);
 998         }
 999       }
1000     }
1001   }
1002
1003   return n;
1004 }
1005
1006
1007 /**
1008  * Optimize an "idempotent unary op", ie op(op(n)) = n.
1009  *
1010  * @todo
1011  *   -(-a) == a, but might overflow two times.
1012  *   We handle it anyway here but the better way would be a
1013  *   flag. This would be needed for Pascal for instance.
1014  */
1015 static ir_node *equivalent_node_idempotent_unop(ir_node *n)
1016 {
1017   ir_node *oldn = n;
1018   ir_node *pred = get_unop_op(n);
1019
1020   /* optimize symmetric unop */
1021   if (get_irn_op(pred) == get_irn_op(n)) {
1022     n = get_unop_op(pred);
1023     DBG_OPT_ALGSIM2(oldn, pred, n);
1024   }
1025   return n;
1026 }
1027
1028 /** Not(Not(x)) == x */
1029 #define equivalent_node_Not    equivalent_node_idempotent_unop
1030
1031 /** --x == x       ??? Is this possible or can --x raise an
1032                        out of bounds exception if min =! max? */
1033 #define equivalent_node_Minus  equivalent_node_idempotent_unop
1034
1035 /**
1036  * Optimize a * 1 = 1 * a = a.
1037  */
1038 static ir_node *equivalent_node_Mul(ir_node *n)
1039 {
1040   ir_node *oldn = n;
1041
1042   ir_node *a = get_Mul_left(n);
1043   ir_node *b = get_Mul_right(n);
1044
1045   /* Mul is commutative and has again an other neutral element. */
1046   if (classify_tarval(value_of(a)) == TV_CLASSIFY_ONE) {
1047     n = b;
1048     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_NEUTRAL_1);
1049   } else if (classify_tarval(value_of(b)) == TV_CLASSIFY_ONE) {
1050     n = a;
1051     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_NEUTRAL_1);
1052   }
1053   return n;
1054 }
1055
1056 /**
1057  * Optimize a / 1 = a.
1058  */
1059 static ir_node *equivalent_node_Div(ir_node *n)
1060 {
1061   ir_node *a = get_Div_left(n);
1062   ir_node *b = get_Div_right(n);
1063
1064   /* Div is not commutative. */
1065   if (classify_tarval(value_of(b)) == TV_CLASSIFY_ONE) { /* div(x, 1) == x */
1066     /* Turn Div into a tuple (mem, bad, a) */
1067     ir_node *mem = get_Div_mem(n);
1068     turn_into_tuple(n, pn_Div_max);
1069     set_Tuple_pred(n, pn_Div_M,        mem);
1070     set_Tuple_pred(n, pn_Div_X_except, new_Bad());        /* no exception */
1071     set_Tuple_pred(n, pn_Div_res,      a);
1072   }
1073   return n;
1074 }
1075
1076 /**
1077  * Optimize a / 1 = a.
1078  */
1079 static ir_node *equivalent_node_DivMod(ir_node *n)
1080 {
1081   ir_node *a = get_DivMod_left(n);
1082   ir_node *b = get_DivMod_right(n);
1083
1084   /* Div is not commutative. */
1085   if (classify_tarval(value_of(b)) == TV_CLASSIFY_ONE) { /* div(x, 1) == x */
1086     /* Turn DivMod into a tuple (mem, bad, a, 0) */
1087     ir_node *mem = get_Div_mem(n);
1088     ir_mode *mode = get_irn_mode(b);
1089
1090     turn_into_tuple(n, pn_DivMod_max);
1091     set_Tuple_pred(n, pn_DivMod_M,        mem);
1092     set_Tuple_pred(n, pn_DivMod_X_except, new_Bad());        /* no exception */
1093     set_Tuple_pred(n, pn_DivMod_res_div,  a);
1094     set_Tuple_pred(n, pn_DivMod_res_mod,  new_Const(mode, get_mode_null(mode)));
1095   }
1096   return n;
1097 }
1098
1099 /**
1100  * Use algebraic simplification a | a = a | 0 = 0 | a = a.
1101  */
1102 static ir_node *equivalent_node_Or(ir_node *n)
1103 {
1104   ir_node *oldn = n;
1105
1106   ir_node *a = get_Or_left(n);
1107   ir_node *b = get_Or_right(n);
1108
1109   if (a == b) {
1110     n = a;    /* Or has it's own neutral element */
1111     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_OR);
1112   } else if (classify_tarval(value_of(a)) == TV_CLASSIFY_NULL) {
1113     n = b;
1114     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_OR);
1115   } else if (classify_tarval(value_of(b)) == TV_CLASSIFY_NULL) {
1116     n = a;
1117     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_OR);
1118   }
1119
1120   return n;
1121 }
1122
1123 /**
1124  * Optimize a & 0b1...1 = 0b1...1 & a =  a & a = a.
1125  */
1126 static ir_node *equivalent_node_And(ir_node *n)
1127 {
1128   ir_node *oldn = n;
1129
1130   ir_node *a = get_And_left(n);
1131   ir_node *b = get_And_right(n);
1132
1133   if (a == b) {
1134     n = a;    /* And has it's own neutral element */
1135     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_AND);
1136   } else if (classify_tarval(value_of(a)) == TV_CLASSIFY_ALL_ONE) {
1137     n = b;
1138     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_AND);
1139   } else if (classify_tarval(value_of(b)) == TV_CLASSIFY_ALL_ONE) {
1140     n = a;
1141     DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_AND);
1142   }
1143   return n;
1144 }
1145
1146 /**
1147  * Try to remove useless Conv's:
1148  */
1149 static ir_node *equivalent_node_Conv(ir_node *n)
1150 {
1151   ir_node *oldn = n;
1152   ir_node *a = get_Conv_op(n);
1153   ir_node *b;
1154
1155   ir_mode *n_mode = get_irn_mode(n);
1156   ir_mode *a_mode = get_irn_mode(a);
1157
1158   if (n_mode == a_mode) { /* No Conv necessary */
1159     n = a;
1160     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_CONV);
1161   } else if (get_irn_op(a) == op_Conv) { /* Conv(Conv(b)) */
1162     ir_mode *b_mode;
1163
1164     b = get_Conv_op(a);
1165     n_mode = get_irn_mode(n);
1166     b_mode = get_irn_mode(b);
1167
1168     if (n_mode == b_mode) {
1169       if (n_mode == mode_b) {
1170         n = b; /* Convb(Conv*(xxxb(...))) == xxxb(...) */
1171         DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_CONV);
1172       }
1173       else if (mode_is_int(n_mode) || mode_is_character(n_mode)) {
1174         if (smaller_mode(b_mode, a_mode)){
1175           n = b;        /* ConvS(ConvL(xxxS(...))) == xxxS(...) */
1176           DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_CONV);
1177         }
1178       }
1179     }
1180   }
1181   return n;
1182 }
1183
1184 /**
1185  * A Cast may be removed if the type of the previous node
1186  * is already the type of the Cast.
1187  */
1188 static ir_node *equivalent_node_Cast(ir_node *n) {
1189   ir_node *oldn = n;
1190   ir_node *pred = get_Cast_op(n);
1191
1192   if (get_irn_type(pred) == get_Cast_type(n)) {
1193     n = pred;
1194     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_CAST);
1195   }
1196   return n;
1197 }
1198
1199 /**
1200   Several optimizations:
1201    - no Phi in start block.
1202    - remove Id operators that are inputs to Phi
1203    - fold Phi-nodes, iff they have only one predecessor except
1204            themselves.
1205  */
1206 static ir_node *equivalent_node_Phi(ir_node *n)
1207 {
1208   int i, n_preds;
1209
1210   ir_node *oldn = n;
1211   ir_node *block = NULL;     /* to shutup gcc */
1212   ir_node *first_val = NULL; /* to shutup gcc */
1213
1214   if (!get_opt_normalize()) return n;
1215
1216   n_preds = get_Phi_n_preds(n);
1217
1218   block = get_nodes_block(n);
1219   /* @@@ fliegt 'raus, sollte aber doch immer wahr sein!!!
1220      assert(get_irn_arity(block) == n_preds && "phi in wrong block!"); */
1221   if ((is_Block_dead(block)) ||                  /* Control dead */
1222       (block == get_irg_start_block(current_ir_graph)))  /* There should be no Phi nodes */
1223     return new_Bad();                                    /* in the Start Block. */
1224
1225   if (n_preds == 0) return n;           /* Phi of dead Region without predecessors. */
1226
1227   /* If the Block has a Bad pred, we also have one. */
1228   for (i = 0;  i < n_preds;  ++i)
1229     if (is_Bad(get_Block_cfgpred(block, i)))
1230       set_Phi_pred(n, i, new_Bad());
1231
1232   /* Find first non-self-referencing input */
1233   for (i = 0; i < n_preds; ++i) {
1234     first_val = get_Phi_pred(n, i);
1235     if (   (first_val != n)                            /* not self pointer */
1236 #if 1
1237         && (! is_Bad(first_val))
1238 #endif
1239            ) {        /* value not dead */
1240       break;          /* then found first value. */
1241     }
1242   }
1243
1244   if (i >= n_preds) {
1245     /* A totally Bad or self-referencing Phi (we didn't break the above loop) */
1246     return new_Bad();
1247   }
1248
1249   /* search for rest of inputs, determine if any of these
1250      are non-self-referencing */
1251   while (++i < n_preds) {
1252     ir_node *scnd_val = get_Phi_pred(n, i);
1253     if (   (scnd_val != n)
1254         && (scnd_val != first_val)
1255 #if 1
1256         && (! is_Bad(scnd_val))
1257 #endif
1258            ) {
1259       break;
1260     }
1261   }
1262
1263   if (i >= n_preds) {
1264     /* Fold, if no multiple distinct non-self-referencing inputs */
1265     n = first_val;
1266     DBG_OPT_PHI(oldn, n);
1267   }
1268   return n;
1269 }
1270
1271 /**
1272   Several optimizations:
1273    - no Sync in start block.
1274    - fold Sync-nodes, iff they have only one predecessor except
1275            themselves.
1276   @fixme: are there loop's in Sync's
1277  */
1278 static ir_node *equivalent_node_Sync(ir_node *n)
1279 {
1280   int i, n_preds;
1281
1282   ir_node *oldn = n;
1283   ir_node *first_val = NULL; /* to shutup gcc */
1284
1285   if (!get_opt_normalize()) return n;
1286
1287   n_preds = get_Sync_n_preds(n);
1288
1289   /* Find first non-self-referencing input */
1290   for (i = 0; i < n_preds; ++i) {
1291     first_val = get_Sync_pred(n, i);
1292     if ((first_val != n)  /* not self pointer */ &&
1293         (! is_Bad(first_val))
1294        ) {            /* value not dead */
1295       break;          /* then found first value. */
1296     }
1297   }
1298
1299   if (i >= n_preds)
1300     /* A totally Bad or self-referencing Sync (we didn't break the above loop) */
1301     return new_Bad();
1302
1303   /* search the rest of inputs, determine if any of these
1304      are non-self-referencing */
1305   while (++i < n_preds) {
1306     ir_node *scnd_val = get_Sync_pred(n, i);
1307     if ((scnd_val != n) &&
1308         (scnd_val != first_val) &&
1309         (! is_Bad(scnd_val))
1310        )
1311       break;
1312   }
1313
1314   if (i >= n_preds) {
1315     /* Fold, if no multiple distinct non-self-referencing inputs */
1316     n = first_val;
1317     DBG_OPT_SYNC(oldn, n);
1318   }
1319   return n;
1320 }
1321
1322 /**
1323  * optimize Proj(Tuple) and gigo() for ProjX in Bad block,
1324  * ProjX(Load) and ProjX(Store)
1325  */
1326 static ir_node *equivalent_node_Proj(ir_node *n)
1327 {
1328   ir_node *oldn = n;
1329
1330   ir_node *a = get_Proj_pred(n);
1331
1332   if ( get_irn_op(a) == op_Tuple) {
1333     /* Remove the Tuple/Proj combination. */
1334     if ( get_Proj_proj(n) <= get_Tuple_n_preds(a) ) {
1335       n = get_Tuple_pred(a, get_Proj_proj(n));
1336       DBG_OPT_TUPLE(oldn, a, n);
1337     } else {
1338       assert(0); /* This should not happen! */
1339       n = new_Bad();
1340     }
1341   }
1342   else if (get_irn_mode(n) == mode_X) {
1343     if (is_Block_dead(get_nodes_block(skip_Proj(n)))) {
1344       /* Remove dead control flow -- early gigo(). */
1345       n = new_Bad();
1346     }
1347     else if (get_opt_ldst_only_null_ptr_exceptions()) {
1348       ir_op *op = get_irn_op(a);
1349
1350       if (op == op_Load || op == op_Store) {
1351         /* get the load/store address */
1352         ir_node *addr = get_irn_n(a, 1);
1353         if (value_not_null(addr)) {
1354           /* this node may float if it did not depend on a Confirm */
1355           set_irn_pinned(a, op_pin_state_floats);
1356           DBG_OPT_EXC_REM(n);
1357           return new_Bad();
1358         }
1359       }
1360     }
1361   }
1362
1363   return n;
1364 }
1365
1366 /**
1367  * Remove Id's.
1368  */
1369 static ir_node *equivalent_node_Id(ir_node *n)
1370 {
1371   ir_node *oldn = n;
1372
1373   do {
1374     n = get_Id_pred(n);
1375   } while (get_irn_op(n) == op_Id);
1376
1377   DBG_OPT_ID(oldn, n);
1378   return n;
1379 }
1380
1381 /**
1382  * optimize a Mux
1383  */
1384 static ir_node *equivalent_node_Mux(ir_node *n)
1385 {
1386   ir_node *oldn = n, *sel = get_Mux_sel(n);
1387   tarval *ts = value_of(sel);
1388
1389   /* Mux(true, f, t) == t */
1390   if (ts == tarval_b_true) {
1391     n = get_Mux_true(n);
1392     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_C);
1393   }
1394   /* Mux(false, f, t) == f */
1395   else if (ts == tarval_b_false) {
1396     n = get_Mux_false(n);
1397     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_C);
1398   }
1399   /* Mux(v, x, x) == x */
1400   else if (get_Mux_false(n) == get_Mux_true(n)) {
1401     n = get_Mux_true(n);
1402     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_EQ);
1403   }
1404   else if (get_irn_op(sel) == op_Proj && !mode_honor_signed_zeros(get_irn_mode(n))) {
1405     ir_node *cmp = get_Proj_pred(sel);
1406     long proj_nr = get_Proj_proj(sel);
1407     ir_node *b   = get_Mux_false(n);
1408     ir_node *a   = get_Mux_true(n);
1409
1410     /*
1411      * Note: normalization puts the constant on the right site,
1412      * so we check only one case.
1413      *
1414      * Note further that these optimization work even for floating point
1415      * with NaN's because -NaN == NaN.
1416      * However, if +0 and -0 is handled differently, we cannot use the first one.
1417      */
1418     if (get_irn_op(cmp) == op_Cmp && get_Cmp_left(cmp) == a) {
1419       if (classify_Const(get_Cmp_right(cmp)) == CNST_NULL) {
1420         /* Mux(a CMP 0, X, a) */
1421         if (get_irn_op(b) == op_Minus && get_Minus_op(b) == a) {
1422           /* Mux(a CMP 0, -a, a) */
1423           if (proj_nr == pn_Cmp_Eq) {
1424             /* Mux(a == 0, -a, a)  ==>  -a */
1425             n = b;
1426             DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_TRANSFORM);
1427           }
1428           else if (proj_nr == pn_Cmp_Lg || proj_nr == pn_Cmp_Ne) {
1429             /* Mux(a != 0, -a, a)  ==> a */
1430             n = a;
1431             DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_TRANSFORM);
1432           }
1433         }
1434         else if (classify_Const(b) == CNST_NULL) {
1435           /* Mux(a CMP 0, 0, a) */
1436           if (proj_nr == pn_Cmp_Lg || proj_nr == pn_Cmp_Ne) {
1437             /* Mux(a != 0, 0, a) ==> a */
1438             n = a;
1439             DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_TRANSFORM);
1440           }
1441           else if (proj_nr == pn_Cmp_Eq) {
1442             /* Mux(a == 0, 0, a) ==> 0 */
1443             n = b;
1444             DBG_OPT_ALGSIM0(oldn, n, FS_OPT_MUX_TRANSFORM);
1445           }
1446         }
1447       }
1448     }
1449   }
1450   return n;
1451 }
1452
1453 /**
1454  * Returns a equivalent node of a Psi: if a condition is true
1455  * and all previous conditions are false we know its value.
1456  * If all conditions are false its value is the default one.
1457  */
1458 static ir_node *equivalent_node_Psi(ir_node *n) {
1459   if (is_Mux(n))
1460     return equivalent_node_Mux(n);
1461   return n;
1462 }
1463
1464 /**
1465  * Optimize -a CMP -b into b CMP a.
1466  * This works only for for modes where unary Minus
1467  * cannot Overflow.
1468  * Note that two-complement integers can Overflow
1469  * so it will NOT work.
1470  */
1471 static ir_node *equivalent_node_Cmp(ir_node *n)
1472 {
1473   ir_node *left  = get_Cmp_left(n);
1474   ir_node *right = get_Cmp_right(n);
1475
1476   if (get_irn_op(left) == op_Minus && get_irn_op(right) == op_Minus &&
1477       !mode_overflow_on_unary_Minus(get_irn_mode(left))) {
1478     left  = get_Minus_op(left);
1479     right = get_Minus_op(right);
1480     set_Cmp_left(n, right);
1481     set_Cmp_right(n, left);
1482   }
1483   return n;
1484 }
1485
1486 /**
1487  * Remove Confirm nodes if setting is on.
1488  * Replace Confirms(x, '=', Constlike) by Constlike.
1489  */
1490 static ir_node *equivalent_node_Confirm(ir_node *n)
1491 {
1492   ir_node *pred = get_Confirm_value(n);
1493   pn_Cmp  pnc   = get_Confirm_cmp(n);
1494
1495   if (get_irn_op(pred) == op_Confirm && pnc == get_Confirm_cmp(pred)) {
1496     /*
1497      * rare case: two identical Confirms one after another,
1498      * replace the second one with the first.
1499      */
1500     n = pred;
1501   }
1502   if (pnc == pn_Cmp_Eq) {
1503     ir_node *bound = get_Confirm_bound(n);
1504
1505     /*
1506      * Optimize a rare case:
1507      * Confirm(x, '=', Constlike) ==> Constlike
1508      */
1509     if (is_irn_constlike(bound)) {
1510       DBG_OPT_CONFIRM(n, bound);
1511       return bound;
1512     }
1513   }
1514   return get_opt_remove_confirm() ? get_Confirm_value(n) : n;
1515 }
1516
1517 /**
1518  * Optimize CopyB(mem, x, x) into a Nop
1519  */
1520 static ir_node *equivalent_node_CopyB(ir_node *n)
1521 {
1522   ir_node *a = get_CopyB_dst(n);
1523   ir_node *b = get_CopyB_src(n);
1524
1525   if (a == b) {
1526     /* Turn CopyB into a tuple (mem, bad, bad) */
1527     ir_node *mem = get_CopyB_mem(n);
1528     turn_into_tuple(n, pn_CopyB_max);
1529     set_Tuple_pred(n, pn_CopyB_M,        mem);
1530     set_Tuple_pred(n, pn_CopyB_X_except, new_Bad());        /* no exception */
1531     set_Tuple_pred(n, pn_CopyB_M_except, new_Bad());
1532   }
1533   return n;
1534 }
1535
1536 /**
1537  * Optimize Bounds(idx, idx, upper) into idx.
1538  */
1539 static ir_node *equivalent_node_Bound(ir_node *n)
1540 {
1541   ir_node *idx   = get_Bound_index(n);
1542   ir_node *lower = get_Bound_lower(n);
1543   int ret_tuple = 0;
1544
1545   /* By definition lower < upper, so if idx == lower -->
1546      lower <= idx && idx < upper */
1547   if (idx == lower) {
1548     /* Turn Bound into a tuple (mem, bad, idx) */
1549     ret_tuple = 1;
1550   }
1551   else {
1552     ir_node *pred = skip_Proj(idx);
1553
1554     if (get_irn_op(pred) == op_Bound) {
1555       /*
1556        * idx was Bounds_check previously, it is still valid if
1557        * lower <= pred_lower && pred_upper <= upper.
1558        */
1559       ir_node *upper = get_Bound_upper(n);
1560       if (get_Bound_lower(pred) == lower &&
1561           get_Bound_upper(pred) == upper) {
1562         /*
1563          * One could expect that we simply return the previous
1564          * Bound here. However, this would be wrong, as we could
1565          * add an exception Proj to a new location than.
1566          * So, we must turn in into a tuple
1567          */
1568         ret_tuple = 1;
1569       }
1570     }
1571   }
1572   if (ret_tuple) {
1573     /* Turn Bound into a tuple (mem, bad, idx) */
1574     ir_node *mem = get_Bound_mem(n);
1575     turn_into_tuple(n, pn_Bound_max);
1576     set_Tuple_pred(n, pn_Bound_M_regular, mem);
1577     set_Tuple_pred(n, pn_Bound_X_except,  new_Bad());       /* no exception */
1578     set_Tuple_pred(n, pn_Bound_res,       idx);
1579     set_Tuple_pred(n, pn_Bound_M_except,  mem);
1580   }
1581   return n;
1582 }
1583
1584 /**
1585  * equivalent_node() returns a node equivalent to input n. It skips all nodes that
1586  * perform no actual computation, as, e.g., the Id nodes.  It does not create
1587  * new nodes.  It is therefore safe to free n if the node returned is not n.
1588  * If a node returns a Tuple we can not just skip it.  If the size of the
1589  * in array fits, we transform n into a tuple (e.g., Div).
1590  */
1591 ir_node *
1592 equivalent_node(ir_node *n)
1593 {
1594   if (n->op->ops.equivalent_node)
1595     return n->op->ops.equivalent_node(n);
1596   return n;
1597 }
1598
1599 /**
1600  * sets the default equivalent node operation for an ir_op_ops.
1601  *
1602  * @param code   the opcode for the default operation
1603  * @param ops    the operations initialized
1604  *
1605  * @return
1606  *    The operations.
1607  */
1608 static ir_op_ops *firm_set_default_equivalent_node(opcode code, ir_op_ops *ops)
1609 {
1610 #define CASE(a)                                 \
1611   case iro_##a:                                 \
1612     ops->equivalent_node  = equivalent_node_##a; \
1613     break
1614
1615   switch (code) {
1616   CASE(Block);
1617   CASE(Jmp);
1618   CASE(Raise);
1619   CASE(Or);
1620   CASE(Add);
1621   CASE(Eor);
1622   CASE(Sub);
1623   CASE(Shl);
1624   CASE(Shr);
1625   CASE(Shrs);
1626   CASE(Rot);
1627   CASE(Not);
1628   CASE(Minus);
1629   CASE(Mul);
1630   CASE(Div);
1631   CASE(DivMod);
1632   CASE(And);
1633   CASE(Conv);
1634   CASE(Cast);
1635   CASE(Phi);
1636   CASE(Sync);
1637   CASE(Proj);
1638   CASE(Id);
1639   CASE(Mux);
1640   CASE(Psi);
1641   CASE(Cmp);
1642   CASE(Confirm);
1643   CASE(CopyB);
1644   CASE(Bound);
1645   default:
1646     /* leave NULL */;
1647   }
1648
1649   return ops;
1650 #undef CASE
1651 }
1652
1653 /**
1654  * Do node specific optimizations of nodes predecessors.
1655  */
1656 static void
1657 optimize_preds(ir_node *n) {
1658   ir_node *a = NULL, *b = NULL;
1659
1660   /* get the operands we will work on for simple cases. */
1661   if (is_binop(n)) {
1662     a = get_binop_left(n);
1663     b = get_binop_right(n);
1664   } else if (is_unop(n)) {
1665     a = get_unop_op(n);
1666   }
1667
1668   switch (get_irn_opcode(n)) {
1669
1670   case iro_Cmp:
1671     /* We don't want Cast as input to Cmp. */
1672     if (get_irn_op(a) == op_Cast) {
1673       a = get_Cast_op(a);
1674       set_Cmp_left(n, a);
1675     }
1676     if (get_irn_op(b) == op_Cast) {
1677       b = get_Cast_op(b);
1678       set_Cmp_right(n, b);
1679     }
1680     break;
1681
1682   default: break;
1683   } /* end switch */
1684 }
1685
1686 /**
1687  * Returns non-zero if all Phi predecessors are constants
1688  */
1689 static int is_const_Phi(ir_node *phi) {
1690   int i;
1691
1692   for (i = get_irn_arity(phi) - 1; i >= 0; --i)
1693     if (! is_Const(get_irn_n(phi, i)))
1694       return 0;
1695   return 1;
1696 }
1697
1698 /**
1699  * Transform AddP(P, ConvIs(Iu)), AddP(P, ConvIu(Is)) and
1700  * SubP(P, ConvIs(Iu)), SubP(P, ConvIu(Is)).
1701  * If possible, remove the Conv's.
1702  */
1703 static ir_node *transform_node_AddSub(ir_node *n)
1704 {
1705   ir_mode *mode = get_irn_mode(n);
1706
1707   if (mode_is_reference(mode)) {
1708     ir_node *left  = get_binop_left(n);
1709     ir_node *right = get_binop_right(n);
1710     int ref_bits   = get_mode_size_bits(mode);
1711
1712     if (get_irn_op(left) == op_Conv) {
1713       ir_mode *mode = get_irn_mode(left);
1714       int bits      = get_mode_size_bits(mode);
1715
1716       if (ref_bits == bits &&
1717           mode_is_int(mode) &&
1718           get_mode_arithmetic(mode) == irma_twos_complement) {
1719         ir_node *pre      = get_Conv_op(left);
1720         ir_mode *pre_mode = get_irn_mode(pre);
1721
1722         if (mode_is_int(pre_mode) &&
1723             get_mode_size_bits(pre_mode) == bits &&
1724             get_mode_arithmetic(pre_mode) == irma_twos_complement) {
1725           /* ok, this conv just changes to sign, moreover the calculation
1726            * is done with same number of bits as our address mode, so
1727            * we can ignore the conv as address calculation can be viewed
1728            * as either signed or unsigned
1729            */
1730           set_binop_left(n, pre);
1731         }
1732       }
1733     }
1734
1735     if (get_irn_op(right) == op_Conv) {
1736       ir_mode *mode = get_irn_mode(right);
1737       int bits      = get_mode_size_bits(mode);
1738
1739       if (ref_bits == bits &&
1740           mode_is_int(mode) &&
1741           get_mode_arithmetic(mode) == irma_twos_complement) {
1742         ir_node *pre      = get_Conv_op(right);
1743         ir_mode *pre_mode = get_irn_mode(pre);
1744
1745         if (mode_is_int(pre_mode) &&
1746             get_mode_size_bits(pre_mode) == bits &&
1747             get_mode_arithmetic(pre_mode) == irma_twos_complement) {
1748           /* ok, this conv just changes to sign, moreover the calculation
1749            * is done with same number of bits as our address mode, so
1750            * we can ignore the conv as address calculation can be viewed
1751            * as either signed or unsigned
1752            */
1753           set_binop_right(n, pre);
1754         }
1755       }
1756     }
1757   }
1758   return n;
1759 }
1760
1761 /**
1762  * Do the AddSub optimization, then Transform
1763  *   Add(a,a)          -> Mul(a, 2)
1764  *   Add(Mul(a, x), a) -> Mul(a, x+1)
1765  * if the mode is integer or float.
1766  * Transform Add(a,-b) into Sub(a,b).
1767  * Reassociation might fold this further.
1768  */
1769 static ir_node *transform_node_Add(ir_node *n)
1770 {
1771   ir_mode *mode;
1772   ir_node *oldn = n;
1773
1774   n = transform_node_AddSub(n);
1775
1776   mode = get_irn_mode(n);
1777   if (mode_is_num(mode)) {
1778     ir_node *a = get_Add_left(n);
1779     ir_node *b = get_Add_right(n);
1780
1781     if (a == b) {
1782       ir_node *block = get_irn_n(n, -1);
1783
1784       n = new_rd_Mul(
1785             get_irn_dbg_info(n),
1786             current_ir_graph,
1787             block,
1788             a,
1789             new_r_Const_long(current_ir_graph, block, mode, 2),
1790             mode);
1791       DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_A_A);
1792     }
1793     else if (get_irn_op(a) == op_Minus) {
1794       n = new_rd_Sub(
1795           get_irn_dbg_info(n),
1796           current_ir_graph,
1797           get_irn_n(n, -1),
1798           b,
1799           get_Minus_op(a),
1800           mode);
1801       DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_A_MINUS_B);
1802     }
1803     else if (get_irn_op(b) == op_Minus) {
1804       n = new_rd_Sub(
1805           get_irn_dbg_info(n),
1806           current_ir_graph,
1807           get_irn_n(n, -1),
1808           a,
1809           get_Minus_op(b),
1810           mode);
1811       DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_A_MINUS_B);
1812     }
1813     /* do NOT execute this code if reassociation is enabled, it does the inverse! */
1814     else if (!get_opt_reassociation() && get_irn_op(a) == op_Mul) {
1815       ir_node *ma = get_Mul_left(a);
1816       ir_node *mb = get_Mul_right(a);
1817
1818       if (b == ma) {
1819         ir_node *blk = get_irn_n(n, -1);
1820         n = new_rd_Mul(
1821           get_irn_dbg_info(n), current_ir_graph, blk,
1822           ma,
1823           new_rd_Add(
1824             get_irn_dbg_info(n), current_ir_graph, blk,
1825             mb,
1826             new_r_Const_long(current_ir_graph, blk, mode, 1),
1827             mode),
1828           mode);
1829         DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_MUL_A_X_A);
1830       }
1831       else if (b == mb) {
1832         ir_node *blk = get_irn_n(n, -1);
1833         n = new_rd_Mul(
1834           get_irn_dbg_info(n), current_ir_graph, blk,
1835           mb,
1836           new_rd_Add(
1837             get_irn_dbg_info(n), current_ir_graph, blk,
1838             ma,
1839             new_r_Const_long(current_ir_graph, blk, mode, 1),
1840             mode),
1841           mode);
1842         DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_MUL_A_X_A);
1843       }
1844     }
1845     /* do NOT execute this code if reassociation is enabled, it does the inverse! */
1846     else if (!get_opt_reassociation() && get_irn_op(b) == op_Mul) {
1847       ir_node *ma = get_Mul_left(b);
1848       ir_node *mb = get_Mul_right(b);
1849
1850       if (a == ma) {
1851         ir_node *blk = get_irn_n(n, -1);
1852         n = new_rd_Mul(
1853           get_irn_dbg_info(n), current_ir_graph, blk,
1854           ma,
1855           new_rd_Add(
1856             get_irn_dbg_info(n), current_ir_graph, blk,
1857             mb,
1858             new_r_Const_long(current_ir_graph, blk, mode, 1),
1859             mode),
1860           mode);
1861         DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_MUL_A_X_A);
1862       }
1863       else if (a == mb) {
1864         ir_node *blk = get_irn_n(n, -1);
1865         n = new_rd_Mul(
1866           get_irn_dbg_info(n), current_ir_graph, blk,
1867           mb,
1868           new_rd_Add(
1869             get_irn_dbg_info(n), current_ir_graph, blk,
1870             ma,
1871             new_r_Const_long(current_ir_graph, blk, mode, 1),
1872             mode),
1873           mode);
1874         DBG_OPT_ALGSIM0(oldn, n, FS_OPT_ADD_MUL_A_X_A);
1875       }
1876     }
1877   }
1878   return n;
1879 }
1880
1881 /**
1882  * Do the AddSub optimization, then Transform
1883  *   Sub(0,a)          -> Minus(a)
1884  *   Sub(Mul(a, x), a) -> Mul(a, x-1)
1885  */
1886 static ir_node *transform_node_Sub(ir_node *n)
1887 {
1888   ir_mode *mode;
1889   ir_node *oldn = n;
1890   ir_node *a, *b;
1891
1892   n = transform_node_AddSub(n);
1893
1894   mode = get_irn_mode(n);
1895   a    = get_Sub_left(n);
1896   b    = get_Sub_right(n);
1897   if (mode_is_num(mode) && (classify_Const(a) == CNST_NULL)) {
1898     n = new_rd_Minus(
1899           get_irn_dbg_info(n),
1900           current_ir_graph,
1901           get_irn_n(n, -1),
1902           b,
1903           mode);
1904     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_SUB_0_A);
1905   }
1906   /* do NOT execute this code if reassociation is enabled, it does the inverse! */
1907   else if (get_opt_reassociation() && get_irn_op(a) == op_Mul) {
1908     ir_node *ma = get_Mul_left(a);
1909     ir_node *mb = get_Mul_right(a);
1910
1911     if (ma == b) {
1912       ir_node *blk = get_irn_n(n, -1);
1913       n = new_rd_Mul(
1914         get_irn_dbg_info(n),
1915         current_ir_graph, blk,
1916         ma,
1917         new_rd_Sub(
1918           get_irn_dbg_info(n),
1919           current_ir_graph, blk,
1920           mb,
1921           new_r_Const_long(current_ir_graph, blk, mode, 1),
1922           mode),
1923         mode);
1924       DBG_OPT_ALGSIM0(oldn, n, FS_OPT_SUB_MUL_A_X_A);
1925     }
1926     else if (mb == b) {
1927       ir_node *blk = get_irn_n(n, -1);
1928       n = new_rd_Mul(
1929         get_irn_dbg_info(n),
1930         current_ir_graph, blk,
1931         mb,
1932         new_rd_Sub(
1933           get_irn_dbg_info(n),
1934           current_ir_graph, blk,
1935           ma,
1936           new_r_Const_long(current_ir_graph, blk, mode, 1),
1937           mode),
1938         mode);
1939       DBG_OPT_ALGSIM0(oldn, n, FS_OPT_SUB_MUL_A_X_A);
1940     }
1941   }
1942
1943   return n;
1944 }
1945
1946 /**
1947  * Transform Mul(a,-1) into -a.
1948  * Do architecture dependent optimizations on Mul nodes
1949  */
1950 static ir_node *transform_node_Mul(ir_node *n) {
1951   ir_node *oldn = n;
1952   ir_mode *mode = get_irn_mode(n);
1953
1954   if (mode_is_signed(mode)) {
1955     ir_node *r = NULL;
1956     ir_node *a = get_Mul_left(n);
1957     ir_node *b = get_Mul_right(n);
1958
1959     if (value_of(a) == get_mode_minus_one(mode))
1960       r = b;
1961     else if (value_of(b) == get_mode_minus_one(mode))
1962       r = a;
1963     if (r) {
1964       n = new_rd_Minus(get_irn_dbg_info(n), current_ir_graph, get_irn_n(n, -1), r, mode);
1965       DBG_OPT_ALGSIM1(oldn, a, b, n, FS_OPT_MUL_MINUS_1);
1966       return n;
1967     }
1968   }
1969   return arch_dep_replace_mul_with_shifts(n);
1970 }
1971
1972 /**
1973  * transform a Div Node
1974  */
1975 static ir_node *transform_node_Div(ir_node *n)
1976 {
1977   tarval *tv = value_of(n);
1978   ir_node *value = n;
1979
1980   /* BEWARE: it is NOT possible to optimize a/a to 1, as this may cause a exception */
1981
1982   if (tv != tarval_bad) {
1983     value = new_Const(get_tarval_mode(tv), tv);
1984
1985     DBG_OPT_CSTEVAL(n, value);
1986   }
1987   else /* Try architecture dependent optimization */
1988     value = arch_dep_replace_div_by_const(n);
1989
1990   if (value != n) {
1991     /* Turn Div into a tuple (mem, bad, value) */
1992     ir_node *mem = get_Div_mem(n);
1993
1994     turn_into_tuple(n, pn_Div_max);
1995     set_Tuple_pred(n, pn_Div_M, mem);
1996     set_Tuple_pred(n, pn_Div_X_except, new_Bad());
1997     set_Tuple_pred(n, pn_Div_res, value);
1998   }
1999   return n;
2000 }
2001
2002 /**
2003  * transform a Mod node
2004  */
2005 static ir_node *transform_node_Mod(ir_node *n)
2006 {
2007   tarval *tv = value_of(n);
2008   ir_node *value = n;
2009
2010   /* BEWARE: it is NOT possible to optimize a%a to 0, as this may cause a exception */
2011
2012   if (tv != tarval_bad) {
2013     value = new_Const(get_tarval_mode(tv), tv);
2014
2015     DBG_OPT_CSTEVAL(n, value);
2016   }
2017   else /* Try architecture dependent optimization */
2018     value = arch_dep_replace_mod_by_const(n);
2019
2020   if (value != n) {
2021     /* Turn Mod into a tuple (mem, bad, value) */
2022     ir_node *mem = get_Mod_mem(n);
2023
2024     turn_into_tuple(n, pn_Mod_max);
2025     set_Tuple_pred(n, pn_Mod_M, mem);
2026     set_Tuple_pred(n, pn_Mod_X_except, new_Bad());
2027     set_Tuple_pred(n, pn_Mod_res, value);
2028   }
2029   return n;
2030 }
2031
2032 /**
2033  * transform a DivMod node
2034  */
2035 static ir_node *transform_node_DivMod(ir_node *n)
2036 {
2037   int evaluated = 0;
2038
2039   ir_node *a = get_DivMod_left(n);
2040   ir_node *b = get_DivMod_right(n);
2041   ir_mode *mode = get_irn_mode(a);
2042   tarval *ta = value_of(a);
2043   tarval *tb = value_of(b);
2044
2045   if (!(mode_is_int(mode) && mode_is_int(get_irn_mode(b))))
2046     return n;
2047
2048   /* BEWARE: it is NOT possible to optimize a/a to 1, as this may cause a exception */
2049
2050   if (tb != tarval_bad) {
2051     if (tb == get_mode_one(get_tarval_mode(tb))) {
2052       b = new_Const (mode, get_mode_null(mode));
2053       evaluated = 1;
2054
2055       DBG_OPT_CSTEVAL(n, b);
2056     }
2057     else if (ta != tarval_bad) {
2058       tarval *resa, *resb;
2059       resa = tarval_div (ta, tb);
2060       if (resa == tarval_bad) return n; /* Causes exception!!! Model by replacing through
2061                                         Jmp for X result!? */
2062       resb = tarval_mod (ta, tb);
2063       if (resb == tarval_bad) return n; /* Causes exception! */
2064       a = new_Const (mode, resa);
2065       b = new_Const (mode, resb);
2066       evaluated = 1;
2067
2068       DBG_OPT_CSTEVAL(n, a);
2069       DBG_OPT_CSTEVAL(n, b);
2070     }
2071     else { /* Try architecture dependent optimization */
2072       arch_dep_replace_divmod_by_const(&a, &b, n);
2073       evaluated = a != NULL;
2074     }
2075   } else if (ta == get_mode_null(mode)) {
2076     /* 0 / non-Const = 0 */
2077     b = a;
2078     evaluated = 1;
2079   }
2080
2081   if (evaluated) { /* replace by tuple */
2082     ir_node *mem = get_DivMod_mem(n);
2083     turn_into_tuple(n, pn_DivMod_max);
2084     set_Tuple_pred(n, pn_DivMod_M,        mem);
2085     set_Tuple_pred(n, pn_DivMod_X_except, new_Bad());  /* no exception */
2086     set_Tuple_pred(n, pn_DivMod_res_div,  a);
2087     set_Tuple_pred(n, pn_DivMod_res_mod,  b);
2088   }
2089
2090   return n;
2091 }
2092
2093 /**
2094  * Optimize Abs(x) into  x if x is Confirmed >= 0
2095  * Optimize Abs(x) into -x if x is Confirmed <= 0
2096  */
2097 static ir_node *transform_node_Abs(ir_node *n)
2098 {
2099   ir_node        *oldn = n;
2100   ir_node        *a = get_Abs_op(n);
2101   value_classify sign = classify_value_sign(a);
2102
2103   if (sign == VALUE_NEGATIVE) {
2104     ir_mode *mode = get_irn_mode(n);
2105
2106     /*
2107      * We can replace the Abs by -x here.
2108      * We even could add a new Confirm here.
2109      *
2110      * Note that -x would create a new node, so we could
2111      * not run it in the equivalent_node() context.
2112      */
2113     n = new_rd_Minus(get_irn_dbg_info(n), current_ir_graph,
2114                      get_irn_n(n, -1), a, mode);
2115
2116     DBG_OPT_CONFIRM(oldn, n);
2117   }
2118   else if (sign == VALUE_POSITIVE) {
2119     /* n is positive, Abs is not needed */
2120     n = a;
2121
2122     DBG_OPT_CONFIRM(oldn, n);
2123   }
2124
2125   return n;
2126 }
2127
2128 /**
2129  * transform a Cond node
2130  */
2131 static ir_node *transform_node_Cond(ir_node *n)
2132 {
2133   /* Replace the Cond by a Jmp if it branches on a constant
2134      condition. */
2135   ir_node *jmp;
2136   ir_node *a = get_Cond_selector(n);
2137   tarval *ta = value_of(a);
2138
2139   /* we need block info which is not available in floating irgs */
2140   if (get_irg_pinned(current_ir_graph) == op_pin_state_floats)
2141      return n;
2142
2143   if ((ta != tarval_bad) &&
2144       (get_irn_mode(a) == mode_b) &&
2145       (get_opt_unreachable_code())) {
2146     /* It's a boolean Cond, branching on a boolean constant.
2147                Replace it by a tuple (Bad, Jmp) or (Jmp, Bad) */
2148     jmp = new_r_Jmp(current_ir_graph, get_nodes_block(n));
2149     turn_into_tuple(n, pn_Cond_max);
2150     if (ta == tarval_b_true) {
2151       set_Tuple_pred(n, pn_Cond_false, new_Bad());
2152       set_Tuple_pred(n, pn_Cond_true, jmp);
2153     } else {
2154       set_Tuple_pred(n, pn_Cond_false, jmp);
2155       set_Tuple_pred(n, pn_Cond_true, new_Bad());
2156     }
2157     /* We might generate an endless loop, so keep it alive. */
2158     add_End_keepalive(get_irg_end(current_ir_graph), get_nodes_block(n));
2159   }
2160   return n;
2161 }
2162
2163 /**
2164  * Transform an Eor.
2165  */
2166 static ir_node *transform_node_Eor(ir_node *n)
2167 {
2168   ir_node *oldn = n;
2169   ir_node *a = get_Eor_left(n);
2170   ir_node *b = get_Eor_right(n);
2171   ir_mode *mode = get_irn_mode(n);
2172
2173   if (a == b) {
2174     /* a ^ a = 0 */
2175     n = new_rd_Const(get_irn_dbg_info(n), current_ir_graph, get_irn_n(n, -1),
2176                      mode, get_mode_null(mode));
2177     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_EOR_A_A);
2178   }
2179   else if ((mode == mode_b)
2180       && (get_irn_op(a) == op_Proj)
2181       && (get_irn_mode(a) == mode_b)
2182       && (classify_tarval (value_of(b)) == TV_CLASSIFY_ONE)
2183       && (get_irn_op(get_Proj_pred(a)) == op_Cmp)) {
2184     /* The Eor negates a Cmp. The Cmp has the negated result anyways! */
2185     n = new_r_Proj(current_ir_graph, get_irn_n(n, -1), get_Proj_pred(a),
2186                    mode_b, get_negated_pnc(get_Proj_proj(a), mode));
2187
2188     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_EOR_TO_NOT_BOOL);
2189   }
2190   else if ((mode == mode_b)
2191         && (classify_tarval (value_of(b)) == TV_CLASSIFY_ONE)) {
2192     /* The Eor is a Not. Replace it by a Not. */
2193     /*   ????!!!Extend to bitfield 1111111. */
2194     n = new_r_Not(current_ir_graph, get_irn_n(n, -1), a, mode_b);
2195
2196     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_EOR_TO_NOT);
2197   }
2198
2199   return n;
2200 }
2201
2202 /**
2203  * Transform a boolean Not.
2204  */
2205 static ir_node *transform_node_Not(ir_node *n)
2206 {
2207   ir_node *oldn = n;
2208   ir_node *a = get_Not_op(n);
2209
2210   if (   (get_irn_mode(n) == mode_b)
2211       && (get_irn_op(a) == op_Proj)
2212       && (get_irn_mode(a) == mode_b)
2213       && (get_irn_op(get_Proj_pred(a)) == op_Cmp)) {
2214     /* We negate a Cmp. The Cmp has the negated result anyways! */
2215     n = new_r_Proj(current_ir_graph, get_irn_n(n, -1), get_Proj_pred(a),
2216                    mode_b, get_negated_pnc(get_Proj_proj(a), mode_b));
2217     DBG_OPT_ALGSIM0(oldn, n, FS_OPT_NOT_CMP);
2218   }
2219
2220   return n;
2221 }
2222
2223 /**
2224  * Transform a Cast_type(Const) into a new Const_type
2225  */
2226 static ir_node *transform_node_Cast(ir_node *n) {
2227   ir_node *oldn = n;
2228   ir_node *pred = get_Cast_op(n);
2229   ir_type *tp = get_irn_type(n);
2230
2231   if (get_irn_op(pred) == op_Const && get_Const_type(pred) != tp) {
2232     n = new_rd_Const_type(NULL, current_ir_graph, get_irn_n(pred, -1), get_irn_mode(pred),
2233               get_Const_tarval(pred), tp);
2234     DBG_OPT_CSTEVAL(oldn, n);
2235   } else if ((get_irn_op(pred) == op_SymConst) && (get_SymConst_value_type(pred) != tp)) {
2236     n = new_rd_SymConst_type(NULL, current_ir_graph, get_irn_n(pred, -1), get_SymConst_symbol(pred),
2237                  get_SymConst_kind(pred), tp);
2238     DBG_OPT_CSTEVAL(oldn, n);
2239   }
2240
2241   return n;
2242 }
2243
2244 /**
2245  * Transform a Proj(Div) with a non-zero value.
2246  * Removes the exceptions and routes the memory to the NoMem node.
2247  */
2248 static ir_node *transform_node_Proj_Div(ir_node *proj)
2249 {
2250   ir_node *n = get_Proj_pred(proj);
2251   ir_node *b = get_Div_right(n);
2252   long proj_nr;
2253
2254   if (value_not_zero(b)) {
2255     /* div(x, y) && y != 0 */
2256     proj_nr = get_Proj_proj(proj);
2257
2258     /* this node may float if it did not depend on a Confirm */
2259     set_irn_pinned(n, op_pin_state_floats);
2260
2261     if (proj_nr == pn_Div_X_except) {
2262       /* we found an exception handler, remove it */
2263       DBG_OPT_EXC_REM(proj);
2264       return new_Bad();
2265     }
2266     else if (proj_nr == pn_Div_M) {
2267       ir_node *res = get_Div_mem(n);
2268       /* the memory Proj can only be removed if we divide by a
2269          real constant, but the node never produce a new memory */
2270       if (value_of(b) != tarval_bad) {
2271         /* this is a Div by a const, we can remove the memory edge */
2272         set_Div_mem(n, get_irg_no_mem(current_ir_graph));
2273       }
2274       return res;
2275     }
2276   }
2277   return proj;
2278 }
2279
2280 /**
2281  * Transform a Proj(Mod) with a non-zero value.
2282  * Removes the exceptions and routes the memory to the NoMem node.
2283  */
2284 static ir_node *transform_node_Proj_Mod(ir_node *proj)
2285 {
2286   ir_node *n = get_Proj_pred(proj);
2287   ir_node *b = get_Mod_right(n);
2288   long proj_nr;
2289
2290   if (value_not_zero(b)) {
2291     /* mod(x, y) && y != 0 */
2292     proj_nr = get_Proj_proj(proj);
2293
2294     /* this node may float if it did not depend on a Confirm */
2295     set_irn_pinned(n, op_pin_state_floats);
2296
2297     if (proj_nr == pn_Mod_X_except) {
2298       /* we found an exception handler, remove it */
2299       DBG_OPT_EXC_REM(proj);
2300       return new_Bad();
2301     } else if (proj_nr == pn_Mod_M) {
2302       ir_node *res = get_Mod_mem(n);
2303       /* the memory Proj can only be removed if we divide by a
2304          real constant, but the node never produce a new memory */
2305       if (value_of(b) != tarval_bad) {
2306         /* this is a Mod by a const, we can remove the memory edge */
2307         set_Mod_mem(n, get_irg_no_mem(current_ir_graph));
2308       }
2309       return res;
2310     }
2311     else if (proj_nr == pn_Mod_res && get_Mod_left(n) == b) {
2312       /* a % a = 0 if a != 0 */
2313       ir_mode *mode = get_irn_mode(proj);
2314       ir_node *res  = new_Const(mode, get_mode_null(mode));
2315
2316       DBG_OPT_CSTEVAL(n, res);
2317       return res;
2318     }
2319   }
2320   return proj;
2321 }
2322
2323 /**
2324  * Transform a Proj(DivMod) with a non-zero value.
2325  * Removes the exceptions and routes the memory to the NoMem node.
2326  */
2327 static ir_node *transform_node_Proj_DivMod(ir_node *proj)
2328 {
2329   ir_node *n = get_Proj_pred(proj);
2330   ir_node *b = get_DivMod_right(n);
2331   long proj_nr;
2332
2333   if (value_not_zero(b)) {
2334     /* DivMod(x, y) && y != 0 */
2335     proj_nr = get_Proj_proj(proj);
2336
2337     /* this node may float if it did not depend on a Confirm */
2338     set_irn_pinned(n, op_pin_state_floats);
2339
2340     if (proj_nr == pn_DivMod_X_except) {
2341       /* we found an exception handler, remove it */
2342       DBG_OPT_EXC_REM(proj);
2343       return new_Bad();
2344     }
2345     else if (proj_nr == pn_DivMod_M) {
2346       ir_node *res = get_DivMod_mem(n);
2347       /* the memory Proj can only be removed if we divide by a
2348          real constant, but the node never produce a new memory */
2349       if (value_of(b) != tarval_bad) {
2350         /* this is a DivMod by a const, we can remove the memory edge */
2351         set_DivMod_mem(n, get_irg_no_mem(current_ir_graph));
2352       }
2353       return res;
2354     }
2355     else if (proj_nr == pn_DivMod_res_mod && get_DivMod_left(n) == b) {
2356       /* a % a = 0 if a != 0 */
2357       ir_mode *mode = get_irn_mode(proj);
2358       ir_node *res  = new_Const(mode, get_mode_null(mode));
2359
2360       DBG_OPT_CSTEVAL(n, res);
2361       return res;
2362     }
2363   }
2364   return proj;
2365 }
2366
2367 /**
2368  * Optimizes jump tables (CondIs or CondIu) by removing all impossible cases.
2369  */
2370 static ir_node *transform_node_Proj_Cond(ir_node *proj)
2371 {
2372   if (get_opt_unreachable_code()) {
2373     ir_node *n = get_Proj_pred(proj);
2374     ir_node *b = get_Cond_selector(n);
2375
2376     if (mode_is_int(get_irn_mode(b))) {
2377       tarval *tb = value_of(b);
2378
2379       if (tb != tarval_bad) {
2380         /* we have a constant switch */
2381         long num = get_Proj_proj(proj);
2382
2383         if (num != get_Cond_defaultProj(n)) { /* we cannot optimize default Proj's yet */
2384           if (get_tarval_long(tb) == num) {
2385             /* Do NOT create a jump here, or we will have 2 control flow ops
2386              * in a block. This case is optimized away in optimize_cf(). */
2387             return proj;
2388           }
2389           else {
2390             /* this case will NEVER be taken, kill it */
2391             return new_Bad();
2392           }
2393         }
2394       }
2395     }
2396   }
2397   return proj;
2398 }
2399
2400 /**
2401  * Normalizes and optimizes Cmp nodes.
2402  */
2403 static ir_node *transform_node_Proj_Cmp(ir_node *proj)
2404 {
2405   if (get_opt_reassociation()) {
2406     ir_node *n     = get_Proj_pred(proj);
2407     ir_node *left  = get_Cmp_left(n);
2408     ir_node *right = get_Cmp_right(n);
2409     ir_node *c     = NULL;
2410     tarval *tv     = NULL;
2411     int changed    = 0;
2412     ir_mode *mode  = NULL;
2413     long proj_nr   = get_Proj_proj(proj);
2414
2415     /*
2416      * First step: normalize the compare op
2417      * by placing the constant on the right site
2418      * or moving the lower address node to the left.
2419      * We ignore the case that both are constants
2420      * this case should be optimized away.
2421      */
2422     if (get_irn_op(right) == op_Const)
2423       c = right;
2424     else if (get_irn_op(left) == op_Const) {
2425       c     = left;
2426       left  = right;
2427       right = c;
2428
2429       proj_nr = get_inversed_pnc(proj_nr);
2430       changed |= 1;
2431     }
2432     else if (get_irn_idx(left) > get_irn_idx(right)) {
2433       ir_node *t = left;
2434
2435       left  = right;
2436       right = t;
2437
2438       proj_nr = get_inversed_pnc(proj_nr);
2439       changed |= 1;
2440     }
2441
2442     /*
2443      * Second step: Try to reduce the magnitude
2444      * of a constant. This may help to generate better code
2445      * later and may help to normalize more compares.
2446      * Of course this is only possible for integer values.
2447      */
2448     if (c) {
2449       mode = get_irn_mode(c);
2450       tv = get_Const_tarval(c);
2451
2452       if (tv != tarval_bad) {
2453         /* the following optimization is possible on modes without Overflow
2454          * on Unary Minus or on == and !=:
2455          * -a CMP c  ==>  a swap(CMP) -c
2456          *
2457          * Beware: for two-complement Overflow may occur, so only == and != can
2458          * be optimized, see this:
2459          * -MININT < 0 =/=> MININT > 0 !!!
2460          */
2461         if (get_opt_constant_folding() && get_irn_op(left) == op_Minus &&
2462             (!mode_overflow_on_unary_Minus(mode) ||
2463              (mode_is_int(mode) && (proj_nr == pn_Cmp_Eq || proj_nr == pn_Cmp_Lg)))) {
2464           left = get_Minus_op(left);
2465           tv = tarval_sub(get_mode_null(mode), tv);
2466
2467           proj_nr = get_inversed_pnc(proj_nr);
2468           changed |= 2;
2469         }
2470
2471         /* for integer modes, we have more */
2472         if (mode_is_int(mode)) {
2473           /* Ne includes Unordered which is not possible on integers.
2474            * However, frontends often use this wrong, so fix it here */
2475           if (proj_nr & pn_Cmp_Uo) {
2476             proj_nr &= ~pn_Cmp_Uo;
2477             set_Proj_proj(proj, proj_nr);
2478           }
2479
2480           /* c > 0 : a < c  ==>  a <= (c-1)    a >= c  ==>  a > (c-1) */
2481           if ((proj_nr == pn_Cmp_Lt || proj_nr == pn_Cmp_Ge) &&
2482               tarval_cmp(tv, get_mode_null(mode)) == pn_Cmp_Gt) {
2483             tv = tarval_sub(tv, get_mode_one(mode));
2484
2485             proj_nr ^= pn_Cmp_Eq;
2486             changed |= 2;
2487           }
2488           /* c < 0 : a > c  ==>  a >= (c+1)    a <= c  ==>  a < (c+1) */
2489           else if ((proj_nr == pn_Cmp_Gt || proj_nr == pn_Cmp_Le) &&
2490               tarval_cmp(tv, get_mode_null(mode)) == pn_Cmp_Lt) {
2491             tv = tarval_add(tv, get_mode_one(mode));
2492
2493             proj_nr ^= pn_Cmp_Eq;
2494             changed |= 2;
2495           }
2496
2497           /* the following reassociations work only for == and != */
2498           if (proj_nr == pn_Cmp_Eq || proj_nr == pn_Cmp_Lg) {
2499
2500             /* a-b == 0  ==>  a == b,  a-b != 0  ==>  a != b */
2501             if (classify_tarval(tv) == TV_CLASSIFY_NULL && get_irn_op(left) == op_Sub) {
2502               right = get_Sub_right(left);
2503               left  = get_Sub_left(left);
2504
2505               tv = value_of(right);
2506               changed = 1;
2507             }
2508
2509             if (tv != tarval_bad) {
2510               ir_op *op = get_irn_op(left);
2511
2512               /* a-c1 == c2  ==>  a == c2+c1,  a-c1 != c2  ==>  a != c2+c1 */
2513               if (op == op_Sub) {
2514                 ir_node *c1 = get_Sub_right(left);
2515                 tarval *tv2 = value_of(c1);
2516
2517                 if (tv2 != tarval_bad) {
2518                   tv2 = tarval_add(tv, value_of(c1));
2519
2520                   if (tv2 != tarval_bad) {
2521                     left    = get_Sub_left(left);
2522                     tv      = tv2;
2523                     changed |= 2;
2524                   }
2525                 }
2526               }
2527               /* a+c1 == c2  ==>  a == c2-c1,  a+c1 != c2  ==>  a != c2-c1 */
2528               else if (op == op_Add) {
2529                 ir_node *a_l = get_Add_left(left);
2530                 ir_node *a_r = get_Add_right(left);
2531                 ir_node *a;
2532                 tarval *tv2;
2533
2534                 if (get_irn_op(a_l) == op_Const) {
2535                   a = a_r;
2536                   tv2 = value_of(a_l);
2537                 }
2538                 else {
2539                   a = a_l;
2540                   tv2 = value_of(a_r);
2541                 }
2542
2543                 if (tv2 != tarval_bad) {
2544                   tv2 = tarval_sub(tv, tv2);
2545
2546                   if (tv2 != tarval_bad) {
2547                     left    = a;
2548                     tv      = tv2;
2549                     changed |= 2;
2550                   }
2551                 }
2552               }
2553               /* -a == c ==> a == -c, -a != c ==> a != -c */
2554               else if (op == op_Minus) {
2555                 tarval *tv2 = tarval_sub(get_mode_null(mode), tv);
2556
2557                 if (tv2 != tarval_bad) {
2558                   left    = get_Minus_op(left);
2559                   tv      = tv2;
2560                   changed |= 2;
2561                 }
2562               }
2563             }
2564           } /* == or != */
2565           /* the following reassociations work only for <= */
2566           else if (proj_nr == pn_Cmp_Le || proj_nr == pn_Cmp_Lt) {
2567             if (tv != tarval_bad) {
2568               ir_op *op = get_irn_op(left);
2569
2570               /* c >= 0 : Abs(a) <= c  ==>  (unsigned)(a + c) <= 2*c */
2571               if (op == op_Abs) {
2572               }
2573             }
2574           }
2575         } /* mode_is_int */
2576
2577         /*
2578          * optimization for AND:
2579          * Optimize:
2580          *   And(x, C) == C  ==>  And(x, C) != 0
2581          *   And(x, C) != C  ==>  And(X, C) == 0
2582          *
2583          * if C is a single Bit constant.
2584          */
2585         if ((proj_nr == pn_Cmp_Eq || proj_nr == pn_Cmp_Lg) &&
2586             (get_irn_op(left) == op_And)) {
2587           if (is_single_bit_tarval(tv)) {
2588             /* check for Constant's match. We have check hare the tarvals,
2589                because our const might be changed */
2590             ir_node *la = get_And_left(left);
2591             ir_node *ra = get_And_right(left);
2592             if ((is_Const(la) && get_Const_tarval(la) == tv) ||
2593                 (is_Const(ra) && get_Const_tarval(ra) == tv)) {
2594               /* fine: do the transformation */
2595               tv = get_mode_null(get_tarval_mode(tv));
2596               proj_nr ^= pn_Cmp_Leg;
2597               changed |= 2;
2598             }
2599           }
2600         }
2601       } /* tarval != bad */
2602     }
2603
2604     if (changed) {
2605       ir_node *block = get_irn_n(n, -1); /* Beware of get_nodes_Block() */
2606
2607       if (changed & 2)      /* need a new Const */
2608         right = new_Const(mode, tv);
2609
2610       /* create a new compare */
2611       n = new_rd_Cmp(get_irn_dbg_info(n), current_ir_graph, block,
2612             left, right);
2613
2614       set_Proj_pred(proj, n);
2615       set_Proj_proj(proj, proj_nr);
2616     }
2617   }
2618   return proj;
2619 }
2620
2621 /**
2622  * Does all optimizations on nodes that must be done on it's Proj's
2623  * because of creating new nodes.
2624  */
2625 static ir_node *transform_node_Proj(ir_node *proj)
2626 {
2627   ir_node *n = get_Proj_pred(proj);
2628
2629   switch (get_irn_opcode(n)) {
2630   case iro_Div:
2631     return transform_node_Proj_Div(proj);
2632
2633   case iro_Mod:
2634     return transform_node_Proj_Mod(proj);
2635
2636   case iro_DivMod:
2637     return transform_node_Proj_DivMod(proj);
2638
2639   case iro_Cond:
2640     return transform_node_Proj_Cond(proj);
2641
2642   case iro_Cmp:
2643     return transform_node_Proj_Cmp(proj);
2644
2645   case iro_Tuple:
2646     /* should not happen, but if it does will be optimized away */
2647     return equivalent_node_Proj(proj);
2648
2649   default:
2650     /* do nothing */
2651     return proj;
2652   }
2653 }
2654
2655 /**
2656  * Move Confirms down through Phi nodes.
2657  */
2658 static ir_node *transform_node_Phi(ir_node *phi) {
2659   int i, n;
2660   ir_mode *mode = get_irn_mode(phi);
2661
2662   if (mode_is_reference(mode)) {
2663     n = get_irn_arity(phi);
2664
2665     /* Beware of Phi0 */
2666     if (n > 0) {
2667       ir_node *pred = get_irn_n(phi, 0);
2668       ir_node *bound;
2669       pn_Cmp  pnc;
2670
2671       if (! is_Confirm(pred))
2672         return phi;
2673
2674       bound = get_Confirm_bound(pred);
2675       pnc   = get_Confirm_cmp(pred);
2676
2677       for (i = 1; i < n; ++i) {
2678         pred = get_irn_n(phi, i);
2679
2680         if (! is_Confirm(pred) ||
2681             get_Confirm_bound(pred) != bound ||
2682             get_Confirm_cmp(pred) != pnc)
2683           return phi;
2684       }
2685       return new_r_Confirm(current_ir_graph, get_irn_n(phi, -1), phi, bound, pnc);
2686     }
2687   }
2688   return phi;
2689 }
2690
2691 /**
2692  * returns the operands of a commutative bin-op, if one operand is
2693  * a const, it is returned as the second one.
2694  */
2695 static void get_comm_Binop_Ops(ir_node *binop, ir_node **a, ir_node **c)
2696 {
2697   ir_node *op_a = get_binop_left(binop);
2698   ir_node *op_b = get_binop_right(binop);
2699
2700   assert(is_op_commutative(get_irn_op(binop)));
2701
2702   if (get_irn_op(op_a) == op_Const) {
2703     *a = op_b;
2704     *c = op_a;
2705   }
2706   else {
2707     *a = op_a;
2708     *c = op_b;
2709   }
2710 }
2711
2712 /**
2713  * Optimize a Or(And(Or(And(v,c4),c3),c2),c1) pattern if possible.
2714  * Such pattern may arise in bitfield stores.
2715  *
2716  * value  c4                  value      c4 & c2
2717  *    AND     c3                    AND           c1 | c3
2718  *        OR     c2      ===>               OR
2719  *           AND    c1
2720  *               OR
2721  */
2722 static ir_node *transform_node_Or_bf_store(ir_node *or)
2723 {
2724   ir_node *and, *c1;
2725   ir_node *or_l, *c2;
2726   ir_node *and_l, *c3;
2727   ir_node *value, *c4;
2728   ir_node *new_and, *new_const, *block;
2729   ir_mode *mode = get_irn_mode(or);
2730
2731   tarval *tv1, *tv2, *tv3, *tv4, *tv, *n_tv4, *n_tv2;
2732
2733   get_comm_Binop_Ops(or, &and, &c1);
2734   if ((get_irn_op(c1) != op_Const) || (get_irn_op(and) != op_And))
2735     return or;
2736
2737   get_comm_Binop_Ops(and, &or_l, &c2);
2738   if ((get_irn_op(c2) != op_Const) || (get_irn_op(or_l) != op_Or))
2739     return or;
2740
2741   get_comm_Binop_Ops(or_l, &and_l, &c3);
2742   if ((get_irn_op(c3) != op_Const) || (get_irn_op(and_l) != op_And))
2743     return or;
2744
2745   get_comm_Binop_Ops(and_l, &value, &c4);
2746   if (get_irn_op(c4) != op_Const)
2747     return or;
2748
2749   /* ok, found the pattern, check for conditions */
2750   assert(mode == get_irn_mode(and));
2751   assert(mode == get_irn_mode(or_l));
2752   assert(mode == get_irn_mode(and_l));
2753
2754   tv1 = get_Const_tarval(c1);
2755   tv2 = get_Const_tarval(c2);
2756   tv3 = get_Const_tarval(c3);
2757   tv4 = get_Const_tarval(c4);
2758
2759   tv = tarval_or(tv4, tv2);
2760   if (classify_tarval(tv) != TV_CLASSIFY_ALL_ONE) {
2761     /* have at least one 0 at the same bit position */
2762     return or;
2763   }
2764
2765   n_tv4 = tarval_not(tv4);
2766   if (tv3 != tarval_and(tv3, n_tv4)) {
2767     /* bit in the or_mask is outside the and_mask */
2768     return or;
2769   }
2770
2771   n_tv2 = tarval_not(tv2);
2772   if (tv1 != tarval_and(tv1, n_tv2)) {
2773     /* bit in the or_mask is outside the and_mask */
2774     return or;
2775   }
2776
2777   /* ok, all conditions met */
2778   block = get_irn_n(or, -1);
2779
2780   new_and = new_r_And(current_ir_graph, block,
2781       value, new_r_Const(current_ir_graph, block, mode, tarval_and(tv4, tv2)), mode);
2782
2783   new_const = new_r_Const(current_ir_graph, block, mode, tarval_or(tv3, tv1));
2784
2785   set_Or_left(or, new_and);
2786   set_Or_right(or, new_const);
2787
2788   /* check for more */
2789   return transform_node_Or_bf_store(or);
2790 }
2791
2792 /**
2793  * Optimize an Or(shl(x, c), shr(x, bits - c)) into a Rot
2794  */
2795 static ir_node *transform_node_Or_Rot(ir_node *or)
2796 {
2797   ir_mode *mode = get_irn_mode(or);
2798   ir_node *shl, *shr, *block;
2799   ir_node *irn, *x, *c1, *c2, *v, *sub, *n;
2800   tarval *tv1, *tv2;
2801
2802   if (! mode_is_int(mode))
2803     return or;
2804
2805   shl = get_binop_left(or);
2806   shr = get_binop_right(or);
2807
2808   if (get_irn_op(shl) == op_Shr) {
2809     if (get_irn_op(shr) != op_Shl)
2810       return or;
2811
2812     irn = shl;
2813     shl = shr;
2814     shr = irn;
2815   }
2816   else if (get_irn_op(shl) != op_Shl)
2817     return or;
2818   else if (get_irn_op(shr) != op_Shr)
2819     return or;
2820
2821   x = get_Shl_left(shl);
2822   if (x != get_Shr_left(shr))
2823     return or;
2824
2825   c1 = get_Shl_right(shl);
2826   c2 = get_Shr_right(shr);
2827   if (get_irn_op(c1) == op_Const && get_irn_op(c2) == op_Const) {
2828     tv1 = get_Const_tarval(c1);
2829     if (! tarval_is_long(tv1))
2830       return or;
2831
2832     tv2 = get_Const_tarval(c2);
2833     if (! tarval_is_long(tv2))
2834       return or;
2835
2836     if (get_tarval_long(tv1) + get_tarval_long(tv2)
2837         != get_mode_size_bits(mode))
2838       return or;
2839
2840     /* yet, condition met */
2841     block = get_irn_n(or, -1);
2842
2843     n = new_r_Rot(current_ir_graph, block, x, c1, mode);
2844
2845     DBG_OPT_ALGSIM1(or, shl, shr, n, FS_OPT_OR_SHFT_TO_ROT);
2846     return n;
2847   }
2848   else if (get_irn_op(c1) == op_Sub) {
2849     v   = c2;
2850     sub = c1;
2851
2852     if (get_Sub_right(sub) != v)
2853       return or;
2854
2855     c1 = get_Sub_left(sub);
2856     if (get_irn_op(c1) != op_Const)
2857       return or;
2858
2859     tv1 = get_Const_tarval(c1);
2860     if (! tarval_is_long(tv1))
2861       return or;
2862
2863     if (get_tarval_long(tv1) != get_mode_size_bits(mode))
2864       return or;
2865
2866     /* yet, condition met */
2867     block = get_nodes_block(or);
2868
2869     /* a Rot right is not supported, so use a rot left */
2870     n =  new_r_Rot(current_ir_graph, block, x, sub, mode);
2871
2872     DBG_OPT_ALGSIM0(or, n, FS_OPT_OR_SHFT_TO_ROT);
2873     return n;
2874   }
2875   else if (get_irn_op(c2) == op_Sub) {
2876     v   = c1;
2877     sub = c2;
2878
2879     c1 = get_Sub_left(sub);
2880     if (get_irn_op(c1) != op_Const)
2881       return or;
2882
2883     tv1 = get_Const_tarval(c1);
2884     if (! tarval_is_long(tv1))
2885       return or;
2886
2887     if (get_tarval_long(tv1) != get_mode_size_bits(mode))
2888       return or;
2889
2890     /* yet, condition met */
2891     block = get_irn_n(or, -1);
2892
2893     /* a Rot Left */
2894     n = new_r_Rot(current_ir_graph, block, x, v, mode);
2895
2896     DBG_OPT_ALGSIM0(or, n, FS_OPT_OR_SHFT_TO_ROT);
2897     return n;
2898   }
2899
2900   return or;
2901 }
2902
2903 /**
2904  * Optimize an Or
2905  */
2906 static ir_node *transform_node_Or(ir_node *or)
2907 {
2908   or = transform_node_Or_bf_store(or);
2909   or = transform_node_Or_Rot(or);
2910
2911   return or;
2912 }
2913
2914 /* forward */
2915 static ir_node *transform_node(ir_node *n);
2916
2917 /**
2918  * Optimize (a >> c1) >> c2), works for Shr, Shrs, Shl.
2919  *
2920  * Should be moved to reassociation?
2921  */
2922 static ir_node *transform_node_shift(ir_node *n)
2923 {
2924   ir_node *left, *right;
2925   tarval *tv1, *tv2, *res;
2926   ir_mode *mode;
2927   int modulo_shf, flag;
2928
2929   left = get_binop_left(n);
2930
2931   /* different operations */
2932   if (get_irn_op(left) != get_irn_op(n))
2933     return n;
2934
2935   right = get_binop_right(n);
2936   tv1 = value_of(right);
2937   if (tv1 == tarval_bad)
2938     return n;
2939
2940   tv2 = value_of(get_binop_right(left));
2941   if (tv2 == tarval_bad)
2942     return n;
2943
2944   res = tarval_add(tv1, tv2);
2945
2946   /* beware: a simple replacement works only, if res < modulo shift */
2947   mode = get_irn_mode(n);
2948
2949   flag = 0;
2950
2951   modulo_shf = get_mode_modulo_shift(mode);
2952   if (modulo_shf > 0) {
2953     tarval *modulo = new_tarval_from_long(modulo_shf, get_tarval_mode(res));
2954
2955     if (tarval_cmp(res, modulo) & pn_Cmp_Lt)
2956       flag = 1;
2957   }
2958   else
2959     flag = 1;
2960
2961   if (flag) {
2962     /* ok, we can replace it */
2963     ir_node *in[2], *irn, *block = get_irn_n(n, -1);
2964
2965     in[0] = get_binop_left(left);
2966     in[1] = new_r_Const(current_ir_graph, block, get_tarval_mode(res), res);
2967
2968     irn = new_ir_node(NULL, current_ir_graph, block, get_irn_op(n), mode, 2, in);
2969
2970     DBG_OPT_ALGSIM0(n, irn, FS_OPT_REASSOC_SHIFT);
2971
2972     return transform_node(irn);
2973   }
2974   return n;
2975 }
2976
2977 #define transform_node_Shr  transform_node_shift
2978 #define transform_node_Shrs transform_node_shift
2979 #define transform_node_Shl  transform_node_shift
2980
2981 /**
2982  * Remove dead blocks and nodes in dead blocks
2983  * in keep alive list.  We do not generate a new End node.
2984  */
2985 static ir_node *transform_node_End(ir_node *n) {
2986   int i, n_keepalives = get_End_n_keepalives(n);
2987
2988   for (i = 0; i < n_keepalives; ++i) {
2989     ir_node *ka = get_End_keepalive(n, i);
2990     if (is_Block(ka)) {
2991       if (is_Block_dead(ka)) {
2992         set_End_keepalive(n, i, new_Bad());
2993       }
2994     }
2995     else if (is_irn_pinned_in_irg(ka) && is_Block_dead(get_nodes_block(ka)))
2996       set_End_keepalive(n, i, new_Bad());
2997   }
2998   return n;
2999 }
3000
3001 /**
3002  * Optimize a Mux into some simpler cases.
3003  */
3004 static ir_node *transform_node_Mux(ir_node *n)
3005 {
3006   ir_node *oldn = n, *sel = get_Mux_sel(n);
3007   ir_mode *mode = get_irn_mode(n);
3008
3009   if (get_irn_op(sel) == op_Proj && !mode_honor_signed_zeros(mode)) {
3010     ir_node *cmp = get_Proj_pred(sel);
3011     long proj_nr = get_Proj_proj(sel);
3012     ir_node *f   =  get_Mux_false(n);
3013     ir_node *t   = get_Mux_true(n);
3014
3015     if (get_irn_op(cmp) == op_Cmp && classify_Const(get_Cmp_right(cmp)) == CNST_NULL) {
3016       ir_node *block = get_irn_n(n, -1);
3017
3018       /*
3019        * Note: normalization puts the constant on the right site,
3020        * so we check only one case.
3021        *
3022        * Note further that these optimization work even for floating point
3023        * with NaN's because -NaN == NaN.
3024        * However, if +0 and -0 is handled differently, we cannot use the first one.
3025        */
3026       if (get_irn_op(f) == op_Minus &&
3027           get_Minus_op(f)   == t &&
3028           get_Cmp_left(cmp) == t) {
3029
3030         if (proj_nr == pn_Cmp_Ge || proj_nr == pn_Cmp_Gt) {
3031           /* Mux(a >=/> 0, -a, a)  ==>  Abs(a) */
3032           n = new_rd_Abs(get_irn_dbg_info(n),
3033                 current_ir_graph,
3034                 block,
3035                 t, mode);
3036           DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_ABS);
3037           return n;
3038         }
3039         else if (proj_nr == pn_Cmp_Le || proj_nr == pn_Cmp_Lt) {
3040           /* Mux(a <=/< 0, -a, a)  ==>  Minus(Abs(a)) */
3041           n = new_rd_Abs(get_irn_dbg_info(n),
3042                 current_ir_graph,
3043                 block,
3044                 t, mode);
3045           n = new_rd_Minus(get_irn_dbg_info(n),
3046                 current_ir_graph,
3047                 block,
3048                 n, mode);
3049
3050           DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_ABS);
3051           return n;
3052         }
3053       }
3054       else if (get_irn_op(t) == op_Minus &&
3055           get_Minus_op(t)   == f &&
3056           get_Cmp_left(cmp) == f) {
3057
3058         if (proj_nr == pn_Cmp_Le || proj_nr == pn_Cmp_Lt) {
3059           /* Mux(a <=/< 0, a, -a)  ==>  Abs(a) */
3060           n = new_rd_Abs(get_irn_dbg_info(n),
3061                 current_ir_graph,
3062                 block,
3063                 f, mode);
3064           DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_ABS);
3065           return n;
3066         }
3067         else if (proj_nr == pn_Cmp_Ge || proj_nr == pn_Cmp_Gt) {
3068           /* Mux(a >=/> 0, a, -a)  ==>  Minus(Abs(a)) */
3069           n = new_rd_Abs(get_irn_dbg_info(n),
3070                 current_ir_graph,
3071                 block,
3072                 f, mode);
3073           n = new_rd_Minus(get_irn_dbg_info(n),
3074                 current_ir_graph,
3075                 block,
3076                 n, mode);
3077
3078           DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_ABS);
3079           return n;
3080         }
3081       }
3082
3083       if (mode_is_int(mode) && mode_is_signed(mode) &&
3084           get_mode_arithmetic(mode) == irma_twos_complement) {
3085         ir_node *x = get_Cmp_left(cmp);
3086
3087         /* the following optimization works only with signed integer two-complement mode */
3088
3089         if (mode == get_irn_mode(x)) {
3090           /*
3091            * FIXME: this restriction is two rigid, as it would still
3092            * work if mode(x) = Hs and mode == Is, but at least it removes
3093            * all wrong cases.
3094            */
3095           if ((proj_nr == pn_Cmp_Lt || proj_nr == pn_Cmp_Le) &&
3096               classify_Const(t) == CNST_ALL_ONE &&
3097               classify_Const(f) == CNST_NULL) {
3098             /*
3099              * Mux(x:T </<= 0, 0, -1) -> Shrs(x, sizeof_bits(T) - 1)
3100              * Conditions:
3101              * T must be signed.
3102              */
3103             n = new_rd_Shrs(get_irn_dbg_info(n),
3104                   current_ir_graph, block, x,
3105                   new_r_Const_long(current_ir_graph, block, mode_Iu,
3106                     get_mode_size_bits(mode) - 1),
3107                   mode);
3108             DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_SHR);
3109             return n;
3110           }
3111           else if ((proj_nr == pn_Cmp_Gt || proj_nr == pn_Cmp_Ge) &&
3112                    classify_Const(t) == CNST_ONE &&
3113                    classify_Const(f) == CNST_NULL) {
3114             /*
3115              * Mux(x:T >/>= 0, 0, 1) -> Shr(-x, sizeof_bits(T) - 1)
3116              * Conditions:
3117              * T must be signed.
3118              */
3119             n = new_rd_Shr(get_irn_dbg_info(n),
3120                   current_ir_graph, block,
3121                   new_r_Minus(current_ir_graph, block, x, mode),
3122                   new_r_Const_long(current_ir_graph, block, mode_Iu,
3123                     get_mode_size_bits(mode) - 1),
3124                   mode);
3125             DBG_OPT_ALGSIM1(oldn, cmp, sel, n, FS_OPT_MUX_TO_SHR);
3126             return n;
3127           }
3128         }
3129       }
3130     }
3131   }
3132   return arch_transform_node_Mux(n);
3133 }
3134
3135 /**
3136  * Optimize a Psi into some simpler cases.
3137  */
3138 static ir_node *transform_node_Psi(ir_node *n) {
3139   if (is_Mux(n))
3140     return transform_node_Mux(n);
3141
3142   return n;
3143 }
3144
3145 /**
3146  * Tries several [inplace] [optimizing] transformations and returns an
3147  * equivalent node.  The difference to equivalent_node() is that these
3148  * transformations _do_ generate new nodes, and thus the old node must
3149  * not be freed even if the equivalent node isn't the old one.
3150  */
3151 static ir_node *transform_node(ir_node *n)
3152 {
3153   if (n->op->ops.transform_node)
3154     n = n->op->ops.transform_node(n);
3155   return n;
3156 }
3157
3158 /**
3159  * sSets the default transform node operation for an ir_op_ops.
3160  *
3161  * @param code   the opcode for the default operation
3162  * @param ops    the operations initialized
3163  *
3164  * @return
3165  *    The operations.
3166  */
3167 static ir_op_ops *firm_set_default_transform_node(opcode code, ir_op_ops *ops)
3168 {
3169 #define CASE(a)                                 \
3170   case iro_##a:                                 \
3171     ops->transform_node  = transform_node_##a;   \
3172     break
3173
3174   switch (code) {
3175   CASE(Add);
3176   CASE(Sub);
3177   CASE(Mul);
3178   CASE(Div);
3179   CASE(Mod);
3180   CASE(DivMod);
3181   CASE(Abs);
3182   CASE(Cond);
3183   CASE(Eor);
3184   CASE(Not);
3185   CASE(Cast);
3186   CASE(Proj);
3187   CASE(Phi);
3188   CASE(Sel);
3189   CASE(Or);
3190   CASE(Shr);
3191   CASE(Shrs);
3192   CASE(Shl);
3193   CASE(End);
3194   CASE(Mux);
3195   CASE(Psi);
3196   default:
3197     /* leave NULL */;
3198   }
3199
3200   return ops;
3201 #undef CASE
3202 }
3203
3204
3205 /* **************** Common Subexpression Elimination **************** */
3206
3207 /** The size of the hash table used, should estimate the number of nodes
3208     in a graph. */
3209 #define N_IR_NODES 512
3210
3211 /** Compares the attributes of two Const nodes. */
3212 static int node_cmp_attr_Const(ir_node *a, ir_node *b)
3213 {
3214   return (get_Const_tarval(a) != get_Const_tarval(b))
3215       || (get_Const_type(a) != get_Const_type(b));
3216 }
3217
3218 /** Compares the attributes of two Proj nodes. */
3219 static int node_cmp_attr_Proj(ir_node *a, ir_node *b)
3220 {
3221   return get_irn_proj_attr (a) != get_irn_proj_attr (b);
3222 }
3223
3224 /** Compares the attributes of two Filter nodes. */
3225 static int node_cmp_attr_Filter(ir_node *a, ir_node *b)
3226 {
3227   return get_Filter_proj(a) != get_Filter_proj(b);
3228 }
3229
3230 /** Compares the attributes of two Alloc nodes. */
3231 static int node_cmp_attr_Alloc(ir_node *a, ir_node *b)
3232 {
3233   return (get_irn_alloc_attr(a).where != get_irn_alloc_attr(b).where)
3234       || (get_irn_alloc_attr(a).type != get_irn_alloc_attr(b).type);
3235 }
3236
3237 /** Compares the attributes of two Free nodes. */
3238 static int node_cmp_attr_Free(ir_node *a, ir_node *b)
3239 {
3240   return (get_irn_free_attr(a).where != get_irn_free_attr(b).where)
3241       || (get_irn_free_attr(a).type != get_irn_free_attr(b).type);
3242 }
3243
3244 /** Compares the attributes of two SymConst nodes. */
3245 static int node_cmp_attr_SymConst(ir_node *a, ir_node *b)
3246 {
3247   return (get_irn_symconst_attr(a).num != get_irn_symconst_attr(b).num)
3248       || (get_irn_symconst_attr(a).sym.type_p != get_irn_symconst_attr(b).sym.type_p)
3249       || (get_irn_symconst_attr(a).tp != get_irn_symconst_attr(b).tp);
3250 }
3251
3252 /** Compares the attributes of two Call nodes. */
3253 static int node_cmp_attr_Call(ir_node *a, ir_node *b)
3254 {
3255   return (get_irn_call_attr(a) != get_irn_call_attr(b));
3256 }
3257
3258 /** Compares the attributes of two Sel nodes. */
3259 static int node_cmp_attr_Sel(ir_node *a, ir_node *b)
3260 {
3261   return (get_irn_sel_attr(a).ent->kind  != get_irn_sel_attr(b).ent->kind)
3262       || (get_irn_sel_attr(a).ent->name    != get_irn_sel_attr(b).ent->name)
3263       || (get_irn_sel_attr(a).ent->owner   != get_irn_sel_attr(b).ent->owner)
3264       || (get_irn_sel_attr(a).ent->ld_name != get_irn_sel_attr(b).ent->ld_name)
3265       || (get_irn_sel_attr(a).ent->type    != get_irn_sel_attr(b).ent->type);
3266 }
3267
3268 /** Compares the attributes of two Phi nodes. */
3269 static int node_cmp_attr_Phi(ir_node *a, ir_node *b)
3270 {
3271   return get_irn_phi_attr (a) != get_irn_phi_attr (b);
3272 }
3273
3274 /** Compares the attributes of two Cast nodes. */
3275 static int node_cmp_attr_Cast(ir_node *a, ir_node *b)
3276 {
3277   return get_Cast_type(a) != get_Cast_type(b);
3278 }
3279
3280 /** Compares the attributes of two Load nodes. */
3281 static int node_cmp_attr_Load(ir_node *a, ir_node *b)
3282 {
3283   if (get_Load_volatility(a) == volatility_is_volatile ||
3284       get_Load_volatility(b) == volatility_is_volatile)
3285     /* NEVER do CSE on volatile Loads */
3286     return 1;
3287
3288   return get_Load_mode(a) != get_Load_mode(b);
3289 }
3290
3291 /** Compares the attributes of two Store nodes. */
3292 static int node_cmp_attr_Store(ir_node *a, ir_node *b)
3293 {
3294   /* NEVER do CSE on volatile Stores */
3295   return (get_Store_volatility(a) == volatility_is_volatile ||
3296           get_Store_volatility(b) == volatility_is_volatile);
3297 }
3298
3299 /** Compares the attributes of two Confirm nodes. */
3300 static int node_cmp_attr_Confirm(ir_node *a, ir_node *b)
3301 {
3302   return (get_Confirm_cmp(a) != get_Confirm_cmp(b));
3303 }
3304
3305 /**
3306  * Set the default node attribute compare operation for an ir_op_ops.
3307  *
3308  * @param code   the opcode for the default operation
3309  * @param ops    the operations initialized
3310  *
3311  * @return
3312  *    The operations.
3313  */
3314 static ir_op_ops *firm_set_default_node_cmp_attr(opcode code, ir_op_ops *ops)
3315 {
3316 #define CASE(a)                              \
3317   case iro_##a:                              \
3318     ops->node_cmp_attr  = node_cmp_attr_##a; \
3319     break
3320
3321   switch (code) {
3322   CASE(Const);
3323   CASE(Proj);
3324   CASE(Filter);
3325   CASE(Alloc);
3326   CASE(Free);
3327   CASE(SymConst);
3328   CASE(Call);
3329   CASE(Sel);
3330   CASE(Phi);
3331   CASE(Cast);
3332   CASE(Load);
3333   CASE(Store);
3334   CASE(Confirm);
3335   default:
3336     /* leave NULL */;
3337   }
3338
3339   return ops;
3340 #undef CASE
3341 }
3342
3343 /*
3344  * Compare function for two nodes in the hash table. Gets two
3345  * nodes as parameters.  Returns 0 if the nodes are a cse.
3346  */
3347 int identities_cmp(const void *elt, const void *key)
3348 {
3349   ir_node *a, *b;
3350   int i, irn_arity_a;
3351
3352   a = (void *)elt;
3353   b = (void *)key;
3354
3355   if (a == b) return 0;
3356
3357   if ((get_irn_op(a) != get_irn_op(b)) ||
3358       (get_irn_mode(a) != get_irn_mode(b))) return 1;
3359
3360   /* compare if a's in and b's in are of equal length */
3361   irn_arity_a = get_irn_intra_arity (a);
3362   if (irn_arity_a != get_irn_intra_arity(b))
3363     return 1;
3364
3365   /* for block-local cse and op_pin_state_pinned nodes: */
3366   if (!get_opt_global_cse() || (get_irn_pinned(a) == op_pin_state_pinned)) {
3367     if (get_irn_intra_n(a, -1) != get_irn_intra_n(b, -1))
3368       return 1;
3369   }
3370
3371   /* compare a->in[0..ins] with b->in[0..ins] */
3372   for (i = 0; i < irn_arity_a; i++)
3373     if (get_irn_intra_n(a, i) != get_irn_intra_n(b, i))
3374       return 1;
3375
3376   /*
3377    * here, we already now that the nodes are identical except their
3378    * attributes
3379    */
3380   if (a->op->ops.node_cmp_attr)
3381     return a->op->ops.node_cmp_attr(a, b);
3382
3383   return 0;
3384 }
3385
3386 /*
3387  * Calculate a hash value of a node.
3388  */
3389 unsigned
3390 ir_node_hash (ir_node *node)
3391 {
3392   unsigned h;
3393   int i, irn_arity;
3394
3395   if (node->op == op_Const) {
3396     /* special value for const, as they only differ in their tarval. */
3397     h = HASH_PTR(node->attr.con.tv);
3398     h = 9*h + HASH_PTR(get_irn_mode(node));
3399   } else if (node->op == op_SymConst) {
3400     /* special value for const, as they only differ in their symbol. */
3401     h = HASH_PTR(node->attr.i.sym.type_p);
3402     h = 9*h + HASH_PTR(get_irn_mode(node));
3403   } else {
3404
3405     /* hash table value = 9*(9*(9*(9*(9*arity+in[0])+in[1])+ ...)+mode)+code */
3406     h = irn_arity = get_irn_intra_arity(node);
3407
3408     /* consider all in nodes... except the block if not a control flow. */
3409     for (i =  is_cfop(node) ? -1 : 0;  i < irn_arity;  i++) {
3410       h = 9*h + HASH_PTR(get_irn_intra_n(node, i));
3411     }
3412
3413     /* ...mode,... */
3414     h = 9*h + HASH_PTR(get_irn_mode(node));
3415     /* ...and code */
3416     h = 9*h + HASH_PTR(get_irn_op(node));
3417   }
3418
3419   return h;
3420 }
3421
3422 pset *
3423 new_identities(void) {
3424   return new_pset(identities_cmp, N_IR_NODES);
3425 }
3426
3427 void
3428 del_identities(pset *value_table) {
3429   del_pset(value_table);
3430 }
3431
3432 /**
3433  * Return the canonical node computing the same value as n.
3434  * Looks up the node in a hash table.
3435  *
3436  * For Const nodes this is performed in the constructor, too.  Const
3437  * nodes are extremely time critical because of their frequent use in
3438  * constant string arrays.
3439  */
3440 static INLINE ir_node *identify(pset *value_table, ir_node *n)
3441 {
3442   ir_node *o = NULL;
3443
3444   if (!value_table) return n;
3445
3446   if (get_opt_reassociation()) {
3447     if (is_op_commutative(get_irn_op(n))) {
3448       ir_node *l = get_binop_left(n);
3449       ir_node *r = get_binop_right(n);
3450
3451       /* for commutative operators perform  a OP b == b OP a */
3452       if (get_irn_idx(l) > get_irn_idx(r)) {
3453         set_binop_left(n, r);
3454         set_binop_right(n, l);
3455       }
3456     }
3457   }
3458
3459   o = pset_find(value_table, n, ir_node_hash (n));
3460   if (!o) return n;
3461
3462   DBG_OPT_CSE(n, o);
3463
3464   return o;
3465 }
3466
3467 /**
3468  * During construction we set the op_pin_state_pinned flag in the graph right when the
3469  * optimization is performed.  The flag turning on procedure global cse could
3470  * be changed between two allocations.  This way we are safe.
3471  */
3472 static INLINE ir_node *identify_cons(pset *value_table, ir_node *n) {
3473   ir_node *old = n;
3474
3475   n = identify(value_table, n);
3476   if (get_irn_n(old, -1) != get_irn_n(n, -1))
3477     set_irg_pinned(current_ir_graph, op_pin_state_floats);
3478   return n;
3479 }
3480
3481 /*
3482  * Return the canonical node computing the same value as n.
3483  * Looks up the node in a hash table, enters it in the table
3484  * if it isn't there yet.
3485  */
3486 ir_node *identify_remember(pset *value_table, ir_node *n)
3487 {
3488   ir_node *o = NULL;
3489
3490   if (!value_table) return n;
3491
3492   if (get_opt_reassociation()) {
3493     if (is_op_commutative(get_irn_op(n))) {
3494       ir_node *l = get_binop_left(n);
3495       ir_node *r = get_binop_right(n);
3496
3497       /* for commutative operators perform  a OP b == b OP a */
3498       if (l > r) {
3499         set_binop_left(n, r);
3500         set_binop_right(n, l);
3501       }
3502     }
3503   }
3504
3505   /* lookup or insert in hash table with given hash key. */
3506   o = pset_insert (value_table, n, ir_node_hash (n));
3507
3508   if (o != n) {
3509     DBG_OPT_CSE(n, o);
3510   }
3511
3512   return o;
3513 }
3514
3515 /* Add a node to the identities value table. */
3516 void add_identities(pset *value_table, ir_node *node) {
3517   if (get_opt_cse() && is_no_Block(node))
3518     identify_remember(value_table, node);
3519 }
3520
3521 /* Visit each node in the value table of a graph. */
3522 void visit_all_identities(ir_graph *irg, irg_walk_func visit, void *env) {
3523   ir_node *node;
3524   ir_graph *rem = current_ir_graph;
3525
3526   current_ir_graph = irg;
3527   foreach_pset(irg->value_table, node)
3528     visit(node, env);
3529   current_ir_graph = rem;
3530 }
3531
3532 /**
3533  * garbage in, garbage out. If a node has a dead input, i.e., the
3534  * Bad node is input to the node, return the Bad node.
3535  */
3536 static INLINE ir_node *gigo(ir_node *node)
3537 {
3538   int i, irn_arity;
3539   ir_op *op = get_irn_op(node);
3540
3541   /* remove garbage blocks by looking at control flow that leaves the block
3542      and replacing the control flow by Bad. */
3543   if (get_irn_mode(node) == mode_X) {
3544     ir_node *block = get_nodes_block(skip_Proj(node));
3545
3546     /* Don't optimize nodes in immature blocks. */
3547     if (!get_Block_matured(block)) return node;
3548      /* Don't optimize End, may have Bads. */
3549     if (op == op_End) return node;
3550
3551     if (is_Block(block)) {
3552       irn_arity = get_irn_arity(block);
3553       for (i = 0; i < irn_arity; i++) {
3554         if (!is_Bad(get_irn_n(block, i)))
3555           break;
3556       }
3557       if (i == irn_arity) return new_Bad();
3558     }
3559   }
3560
3561   /* Blocks, Phis and Tuples may have dead inputs, e.g., if one of the
3562      blocks predecessors is dead. */
3563   if ( op != op_Block && op != op_Phi && op != op_Tuple) {
3564     irn_arity = get_irn_arity(node);
3565
3566     /*
3567      * Beware: we can only read the block of a non-floating node.
3568      */
3569     if (is_irn_pinned_in_irg(node) &&
3570         is_Block_dead(get_nodes_block(node)))
3571       return new_Bad();
3572
3573     for (i = 0; i < irn_arity; i++) {
3574       ir_node *pred = get_irn_n(node, i);
3575
3576       if (is_Bad(pred))
3577         return new_Bad();
3578 #if 0
3579       /* Propagating Unknowns here seems to be a bad idea, because
3580          sometimes we need a node as a input and did not want that
3581          it kills it's user.
3582          However, i might be useful to move this into a later phase
3583          (it you thing optimizing such code is useful). */
3584       if (is_Unknown(pred) && mode_is_data(get_irn_mode(node)))
3585         return new_Unknown(get_irn_mode(node));
3586 #endif
3587     }
3588   }
3589 #if 0
3590   /* With this code we violate the agreement that local_optimize
3591      only leaves Bads in Block, Phi and Tuple nodes. */
3592   /* If Block has only Bads as predecessors it's garbage. */
3593   /* If Phi has only Bads as predecessors it's garbage. */
3594   if ((op == op_Block && get_Block_matured(node)) || op == op_Phi)  {
3595     irn_arity = get_irn_arity(node);
3596     for (i = 0; i < irn_arity; i++) {
3597       if (!is_Bad(get_irn_n(node, i))) break;
3598     }
3599     if (i == irn_arity) node = new_Bad();
3600   }
3601 #endif
3602   return node;
3603 }
3604
3605 /**
3606  * These optimizations deallocate nodes from the obstack.
3607  * It can only be called if it is guaranteed that no other nodes
3608  * reference this one, i.e., right after construction of a node.
3609  *
3610  * current_ir_graph must be set to the graph of the node!
3611  */
3612 ir_node *optimize_node(ir_node *n)
3613 {
3614   tarval *tv;
3615   ir_node *oldn = n;
3616   opcode iro = get_irn_opcode(n);
3617
3618   /* Always optimize Phi nodes: part of the construction. */
3619   if ((!get_opt_optimize()) && (iro != iro_Phi)) return n;
3620
3621   /* constant expression evaluation / constant folding */
3622   if (get_opt_constant_folding()) {
3623     /* neither constants nor Tuple values can be evaluated */
3624     if (iro != iro_Const && (get_irn_mode(n) != mode_T)) {
3625       /* try to evaluate */
3626       tv = computed_value(n);
3627       if (tv != tarval_bad) {
3628         ir_node *nw;
3629         ir_type *old_tp = get_irn_type(n);
3630         int i, arity = get_irn_arity(n);
3631         int node_size;
3632
3633         /*
3634          * Try to recover the type of the new expression.
3635          */
3636         for (i = 0; i < arity && !old_tp; ++i)
3637           old_tp = get_irn_type(get_irn_n(n, i));
3638
3639         /*
3640          * we MUST copy the node here temporary, because it's still needed
3641          * for DBG_OPT_CSTEVAL
3642          */
3643         node_size = offsetof(ir_node, attr) +  n->op->attr_size;
3644         oldn = alloca(node_size);
3645
3646         memcpy(oldn, n, node_size);
3647         CLONE_ARR_A(ir_node *, oldn->in, n->in);
3648
3649         /* ARG, copy the in array, we need it for statistics */
3650         memcpy(oldn->in, n->in, ARR_LEN(n->in) * sizeof(n->in[0]));
3651
3652         /* note the inplace edges module */
3653         edges_node_deleted(n, current_ir_graph);
3654
3655         /* evaluation was successful -- replace the node. */
3656         irg_kill_node(current_ir_graph, n);
3657         nw = new_Const(get_tarval_mode (tv), tv);
3658
3659         if (old_tp && get_type_mode(old_tp) == get_tarval_mode (tv))
3660           set_Const_type(nw, old_tp);
3661         DBG_OPT_CSTEVAL(oldn, nw);
3662         return nw;
3663       }
3664     }
3665   }
3666
3667   /* remove unnecessary nodes */
3668   if (get_opt_constant_folding() ||
3669     (iro == iro_Phi)  ||   /* always optimize these nodes. */
3670     (iro == iro_Id)   ||
3671     (iro == iro_Proj) ||
3672     (iro == iro_Block)  )  /* Flags tested local. */
3673     n = equivalent_node (n);
3674
3675   optimize_preds(n);                  /* do node specific optimizations of nodes predecessors. */
3676
3677   /* Common Subexpression Elimination.
3678    *
3679    * Checks whether n is already available.
3680    * The block input is used to distinguish different subexpressions. Right
3681    * now all nodes are op_pin_state_pinned to blocks, i.e., the CSE only finds common
3682    * subexpressions within a block.
3683    */
3684   if (get_opt_cse())
3685     n = identify_cons (current_ir_graph->value_table, n);
3686
3687   if (n != oldn) {
3688     edges_node_deleted(oldn, current_ir_graph);
3689
3690     /* We found an existing, better node, so we can deallocate the old node. */
3691     irg_kill_node(current_ir_graph, oldn);
3692     return n;
3693   }
3694
3695   /* Some more constant expression evaluation that does not allow to
3696      free the node. */
3697   iro = get_irn_opcode(n);
3698   if (get_opt_constant_folding() ||
3699     (iro == iro_Cond) ||
3700     (iro == iro_Proj) ||
3701     (iro == iro_Sel))     /* Flags tested local. */
3702     n = transform_node (n);
3703
3704   /* Remove nodes with dead (Bad) input.
3705      Run always for transformation induced Bads. */
3706   n = gigo (n);
3707
3708   /* Now we have a legal, useful node. Enter it in hash table for CSE */
3709   if (get_opt_cse() && (get_irn_opcode(n) != iro_Block)) {
3710     n = identify_remember (current_ir_graph->value_table, n);
3711   }
3712
3713   return n;
3714 }
3715
3716
3717 /**
3718  * These optimizations never deallocate nodes (in place).  This can cause dead
3719  * nodes lying on the obstack.  Remove these by a dead node elimination,
3720  * i.e., a copying garbage collection.
3721  */
3722 ir_node *optimize_in_place_2(ir_node *n)
3723 {
3724   tarval *tv;
3725   ir_node *oldn = n;
3726   opcode iro = get_irn_opcode(n);
3727
3728   if (!get_opt_optimize() && (get_irn_op(n) != op_Phi)) return n;
3729
3730   /* constant expression evaluation / constant folding */
3731   if (get_opt_constant_folding()) {
3732     /* neither constants nor Tuple values can be evaluated */
3733     if (iro != iro_Const && get_irn_mode(n) != mode_T) {
3734       /* try to evaluate */
3735       tv = computed_value(n);
3736       if (tv != tarval_bad) {
3737         /* evaluation was successful -- replace the node. */
3738         ir_type *old_tp = get_irn_type(n);
3739         int i, arity = get_irn_arity(n);
3740
3741         /*
3742          * Try to recover the type of the new expression.
3743          */
3744         for (i = 0; i < arity && !old_tp; ++i)
3745           old_tp = get_irn_type(get_irn_n(n, i));
3746
3747         n = new_Const(get_tarval_mode(tv), tv);
3748
3749         if (old_tp && get_type_mode(old_tp) == get_tarval_mode(tv))
3750           set_Const_type(n, old_tp);
3751
3752         DBG_OPT_CSTEVAL(oldn, n);
3753         return n;
3754       }
3755     }
3756   }
3757
3758   /* remove unnecessary nodes */
3759   if (get_opt_constant_folding() ||
3760       (iro == iro_Phi)  ||   /* always optimize these nodes. */
3761       (iro == iro_Id)   ||   /* ... */
3762       (iro == iro_Proj) ||   /* ... */
3763       (iro == iro_Block)  )  /* Flags tested local. */
3764     n = equivalent_node(n);
3765
3766   optimize_preds(n);                  /* do node specific optimizations of nodes predecessors. */
3767
3768   /** common subexpression elimination **/
3769   /* Checks whether n is already available. */
3770   /* The block input is used to distinguish different subexpressions.  Right
3771      now all nodes are op_pin_state_pinned to blocks, i.e., the cse only finds common
3772      subexpressions within a block. */
3773   if (get_opt_cse()) {
3774     n = identify(current_ir_graph->value_table, n);
3775   }
3776
3777   /* Some more constant expression evaluation. */
3778   iro = get_irn_opcode(n);
3779   if (get_opt_constant_folding() ||
3780       (iro == iro_Cond) ||
3781       (iro == iro_Proj) ||
3782       (iro == iro_Sel))     /* Flags tested local. */
3783     n = transform_node(n);
3784
3785   /* Remove nodes with dead (Bad) input.
3786      Run always for transformation induced Bads.  */
3787   n = gigo(n);
3788
3789   /* Now we can verify the node, as it has no dead inputs any more. */
3790   irn_vrfy(n);
3791
3792   /* Now we have a legal, useful node. Enter it in hash table for cse.
3793      Blocks should be unique anyways.  (Except the successor of start:
3794      is cse with the start block!) */
3795   if (get_opt_cse() && (get_irn_opcode(n) != iro_Block))
3796     n = identify_remember(current_ir_graph->value_table, n);
3797
3798   return n;
3799 }
3800
3801 /**
3802  * Wrapper for external use, set proper status bits after optimization.
3803  */
3804 ir_node *optimize_in_place(ir_node *n)
3805 {
3806   /* Handle graph state */
3807   assert(get_irg_phase_state(current_ir_graph) != phase_building);
3808
3809   if (get_opt_global_cse())
3810     set_irg_pinned(current_ir_graph, op_pin_state_floats);
3811   if (get_irg_outs_state(current_ir_graph) == outs_consistent)
3812     set_irg_outs_inconsistent(current_ir_graph);
3813
3814   /* FIXME: Maybe we could also test whether optimizing the node can
3815      change the control graph. */
3816   set_irg_doms_inconsistent(current_ir_graph);
3817   return optimize_in_place_2 (n);
3818 }
3819
3820 /*
3821  * Sets the default operation for an ir_ops.
3822  */
3823 ir_op_ops *firm_set_default_operations(opcode code, ir_op_ops *ops)
3824 {
3825   ops = firm_set_default_computed_value(code, ops);
3826   ops = firm_set_default_equivalent_node(code, ops);
3827   ops = firm_set_default_transform_node(code, ops);
3828   ops = firm_set_default_node_cmp_attr(code, ops);
3829   ops = firm_set_default_get_type(code, ops);
3830   ops = firm_set_default_get_type_attr(code, ops);
3831   ops = firm_set_default_get_entity_attr(code, ops);
3832
3833   return ops;
3834 }