Use simple assignment instead of memcpy() when possible.
[libfirm] / ir / be / ia32 / ia32_transform.c
index c0696dc..a9acd89 100644 (file)
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
+ * Copyright (C) 1995-2011 University of Karlsruhe.  All right reserved.
  *
  * This file is part of libFirm.
  *
 #include "ia32_nodes_attr.h"
 #include "ia32_transform.h"
 #include "ia32_new_nodes.h"
-#include "ia32_map_regs.h"
 #include "ia32_dbg_stat.h"
 #include "ia32_optimize.h"
-#include "ia32_util.h"
 #include "ia32_address_mode.h"
 #include "ia32_architecture.h"
 
@@ -91,8 +89,9 @@
 
 DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)
 
+static ir_node         *old_initial_fpcw = NULL;
 static ir_node         *initial_fpcw = NULL;
-int                     no_pic_adjust;
+int                     ia32_no_pic_adjust;
 
 typedef ir_node *construct_binop_func(dbg_info *db, ir_node *block,
         ir_node *base, ir_node *index, ir_node *mem, ir_node *op1,
@@ -285,7 +284,7 @@ static ir_node *gen_Const(ir_node *node)
                                        }
                                }
 #endif /* CONSTRUCT_SSE_CONST */
-                               floatent = create_float_const_entity(node);
+                               floatent = ia32_create_float_const_entity(node);
 
                                base     = get_symconst_base();
                                load     = new_bd_ia32_xLoad(dbgi, block, base, noreg_GP, nomem,
@@ -308,7 +307,7 @@ static ir_node *gen_Const(ir_node *node)
                                ir_mode *ls_mode;
                                ir_node *base;
 
-                               floatent = create_float_const_entity(node);
+                               floatent = ia32_create_float_const_entity(node);
                                /* create_float_const_ent is smart and sometimes creates
                                   smaller entities */
                                ls_mode  = get_type_mode(get_entity_type(floatent));
@@ -325,8 +324,6 @@ static ir_node *gen_Const(ir_node *node)
 end:
 #endif /* CONSTRUCT_SSE_CONST */
                SET_IA32_ORIG_NODE(load, node);
-
-               be_dep_on_frame(load);
                return res;
        } else { /* non-float mode */
                ir_node   *cnst;
@@ -344,7 +341,6 @@ end:
                cnst = new_bd_ia32_Const(dbgi, block, NULL, 0, 0, val);
                SET_IA32_ORIG_NODE(cnst, node);
 
-               be_dep_on_frame(cnst);
                return cnst;
        }
 }
@@ -374,12 +370,18 @@ static ir_node *gen_SymConst(ir_node *node)
                        panic("backend only support symconst_addr_ent (at %+F)", node);
                }
                entity = get_SymConst_entity(node);
-               cnst = new_bd_ia32_Const(dbgi, block, entity, 0, 0, 0);
+               if (get_entity_owner(entity) == get_tls_type()) {
+                       ir_node *tls_base = new_bd_ia32_LdTls(NULL, block);
+                       ir_node *lea     = new_bd_ia32_Lea(dbgi, block, tls_base, noreg_GP);
+                       set_ia32_am_sc(lea, entity);
+                       cnst = lea;
+               } else {
+                       cnst = new_bd_ia32_Const(dbgi, block, entity, 0, 0, 0);
+               }
        }
 
        SET_IA32_ORIG_NODE(cnst, node);
 
-       be_dep_on_frame(cnst);
        return cnst;
 }
 
@@ -591,10 +593,10 @@ static int ia32_use_source_address_mode(ir_node *block, ir_node *node,
                return 0;
 
        /* don't do AM if other node inputs depend on the load (via mem-proj) */
-       if (other != NULL && prevents_AM(block, load, other))
+       if (other != NULL && ia32_prevents_AM(block, load, other))
                return 0;
 
-       if (other2 != NULL && prevents_AM(block, load, other2))
+       if (other2 != NULL && ia32_prevents_AM(block, load, other2))
                return 0;
 
        return 1;
@@ -636,11 +638,12 @@ static void build_address(ia32_address_mode_t *am, ir_node *node,
 
        /* floating point immediates */
        if (is_Const(node)) {
-               ir_entity *entity  = create_float_const_entity(node);
+               ir_entity *entity  = ia32_create_float_const_entity(node);
                addr->base         = get_symconst_base();
                addr->index        = noreg_GP;
                addr->mem          = nomem;
                addr->symconst_ent = entity;
+               addr->tls_segment  = false;
                addr->use_frame    = 1;
                am->ls_mode        = get_type_mode(get_entity_type(entity));
                am->pinned         = op_pin_state_floats;
@@ -669,6 +672,7 @@ static void set_address(ir_node *node, const ia32_address_t *addr)
        set_ia32_am_scale(node, addr->scale);
        set_ia32_am_sc(node, addr->symconst_ent);
        set_ia32_am_offs_int(node, addr->offset);
+       set_ia32_am_tls_segment(node, addr->tls_segment);
        if (addr->symconst_sign)
                set_ia32_am_sc_sign(node);
        if (addr->use_frame)
@@ -842,7 +846,7 @@ static void match_arguments(ia32_address_mode_t *am, ir_node *block,
         * op2 input */
        new_op2 = NULL;
        if (!(flags & match_try_am) && use_immediate) {
-               new_op2 = try_create_Immediate(op2, 0);
+               new_op2 = ia32_try_create_Immediate(op2, 0);
        }
 
        if (new_op2 == NULL &&
@@ -872,7 +876,7 @@ static void match_arguments(ia32_address_mode_t *am, ir_node *block,
                } else {
                        new_op1 = be_transform_node(op2);
                        new_op2 = noreg;
-                       am->ins_permuted = 1;
+                       am->ins_permuted = true;
                }
                am->op_type = ia32_AddrModeS;
        } else {
@@ -1034,14 +1038,10 @@ static ir_node *gen_binop_flags(ir_node *node, construct_binop_flags_func *func,
 
 static ir_node *get_fpcw(void)
 {
-       ir_node *fpcw;
        if (initial_fpcw != NULL)
                return initial_fpcw;
 
-       fpcw         = be_abi_get_ignore_irn(be_get_irg_abi(current_ir_graph),
-                                            &ia32_registers[REG_FPCW]);
-       initial_fpcw = be_transform_node(fpcw);
-
+       initial_fpcw = be_transform_node(old_initial_fpcw);
        return initial_fpcw;
 }
 
@@ -1067,8 +1067,12 @@ static ir_node *gen_binop_x87_float(ir_node *node, ir_node *op1, ir_node *op2,
        match_flags_t        flags = match_commutative;
 
        /* happens for div nodes... */
-       if (mode == mode_T)
-               mode = get_divop_resmod(node);
+       if (mode == mode_T) {
+               if (is_Div(node))
+                       mode = get_Div_resmode(node);
+               else
+                       panic("can't determine mode");
+       }
 
        /* cannot use address mode with long double on x87 */
        if (get_mode_size_bits(mode) <= 64)
@@ -1141,8 +1145,12 @@ static ir_node *gen_shift_binop(ir_node *node, ir_node *op1, ir_node *op2,
        /* lowered shift instruction may have a dependency operand, handle it here */
        if (get_irn_arity(node) == 3) {
                /* we have a dependency */
-               ir_node *new_dep = be_transform_node(get_irn_n(node, 2));
-               add_irn_dep(new_node, new_dep);
+               ir_node* dep = get_irn_n(node, 2);
+               if (get_irn_n_edges(dep) > 1) {
+                       /* ... which has at least one user other than 'node' */
+                       ir_node *new_dep = be_transform_node(dep);
+                       add_irn_dep(new_node, new_dep);
+               }
        }
 
        return new_node;
@@ -1197,6 +1205,18 @@ static ir_node *create_lea_from_address(dbg_info *dbgi, ir_node *block,
                index = be_transform_node(index);
        }
 
+       /* segment overrides are ineffective for Leas :-( so we have to patch
+        * around... */
+       if (addr->tls_segment) {
+               ir_node *tls_base = new_bd_ia32_LdTls(NULL, block);
+               assert(addr->symconst_ent != NULL);
+               if (base == noreg_GP)
+                       base = tls_base;
+               else
+                       base = new_bd_ia32_Lea(dbgi, block, tls_base, base);
+               addr->tls_segment = false;
+       }
+
        res = new_bd_ia32_Lea(dbgi, block, base, index);
        set_address(res, addr);
 
@@ -1260,7 +1280,6 @@ static ir_node *gen_Add(ir_node *node)
        if (addr.base == NULL && addr.index == NULL) {
                new_node = new_bd_ia32_Const(dbgi, new_block, addr.symconst_ent,
                                             addr.symconst_sign, 0, addr.offset);
-               be_dep_on_frame(new_node);
                SET_IA32_ORIG_NODE(new_node, node);
                return new_node;
        }
@@ -1495,8 +1514,13 @@ static ir_node *transform_AM_mem(ir_node *const block,
                        ins[n++] = be_transform_node(pred);
                }
 
-               ins[n++] = am_mem;
+               if (n==1 && ins[0] == am_mem) {
+                       return am_mem;
+                       /* creating a new Sync and relying on CSE may fail,
+                        * if am_mem is a ProjM, which does not yet verify. */
+               }
 
+               ins[n++] = am_mem;
                return new_r_Sync(block, n, ins);
        } else {
                ir_node *ins[2];
@@ -1523,7 +1547,6 @@ static ir_node *create_sex_32_64(dbg_info *dbgi, ir_node *block,
        (void)orig;
        if (ia32_cg_config.use_short_sex_eax) {
                ir_node *pval = new_bd_ia32_ProduceVal(dbgi, block);
-               be_dep_on_frame(pval);
                res = new_bd_ia32_Cltd(dbgi, block, val, pval);
        } else {
                ir_node *imm31 = ia32_create_Immediate(NULL, 0, 31);
@@ -1534,7 +1557,7 @@ static ir_node *create_sex_32_64(dbg_info *dbgi, ir_node *block,
 }
 
 /**
- * Generates an ia32 DivMod with additional infrastructure for the
+ * Generates an ia32 Div with additional infrastructure for the
  * register allocator if needed.
  */
 static ir_node *create_Div(ir_node *node)
@@ -1566,12 +1589,6 @@ static ir_node *create_Div(ir_node *node)
                mem     = get_Mod_mem(node);
                mode    = get_Mod_resmode(node);
                break;
-       case iro_DivMod:
-               op1     = get_DivMod_left(node);
-               op2     = get_DivMod_right(node);
-               mem     = get_DivMod_mem(node);
-               mode    = get_DivMod_resmode(node);
-               break;
        default:
                panic("invalid divmod node %+F", node);
        }
@@ -1589,7 +1606,6 @@ static ir_node *create_Div(ir_node *node)
                                addr->index, new_mem, am.new_op2, am.new_op1, sign_extension);
        } else {
                sign_extension = new_bd_ia32_Const(dbgi, new_block, NULL, 0, 0, 0);
-               be_dep_on_frame(sign_extension);
 
                new_node = new_bd_ia32_Div(dbgi, new_block, addr->base,
                                           addr->index, new_mem, am.new_op2,
@@ -1619,36 +1635,20 @@ static ir_node *gen_Mod(ir_node *node)
  */
 static ir_node *gen_Div(ir_node *node)
 {
-       return create_Div(node);
-}
-
-/**
- * Generates an ia32 DivMod.
- */
-static ir_node *gen_DivMod(ir_node *node)
-{
-       return create_Div(node);
-}
-
-
-
-/**
- * Creates an ia32 floating Div.
- *
- * @return The created ia32 xDiv node
- */
-static ir_node *gen_Quot(ir_node *node)
-{
-       ir_node *op1 = get_Quot_left(node);
-       ir_node *op2 = get_Quot_right(node);
+       ir_mode *mode = get_Div_resmode(node);
+       if (mode_is_float(mode)) {
+               ir_node *op1 = get_Div_left(node);
+               ir_node *op2 = get_Div_right(node);
 
-       if (ia32_cg_config.use_sse2) {
-               return gen_binop(node, op1, op2, new_bd_ia32_xDiv, match_am);
-       } else {
-               return gen_binop_x87_float(node, op1, op2, new_bd_ia32_vfdiv);
+               if (ia32_cg_config.use_sse2) {
+                       return gen_binop(node, op1, op2, new_bd_ia32_xDiv, match_am);
+               } else {
+                       return gen_binop_x87_float(node, op1, op2, new_bd_ia32_vfdiv);
+               }
        }
-}
 
+       return create_Div(node);
+}
 
 /**
  * Creates an ia32 Shl.
@@ -1926,85 +1926,160 @@ static ir_node *gen_bt(ir_node *cmp, ir_node *x, ir_node *n)
        return new_bd_ia32_Bt(dbgi, new_block, op1, op2);
 }
 
-/**
- * Transform a node returning a "flag" result.
- *
- * @param node     the node to transform
- * @param pnc_out  the compare mode to use
- */
-static ir_node *get_flags_node(ir_node *node, int *pnc_out)
+static ia32_condition_code_t relation_to_condition_code(ir_relation relation,
+                                                        ir_mode *mode)
 {
-       ir_node  *flags;
-       ir_node  *new_op;
-       ir_node  *new_block;
-       dbg_info *dbgi;
+       if (mode_is_float(mode)) {
+               switch (relation) {
+               case ir_relation_equal:              return ia32_cc_float_equal;
+               case ir_relation_less:               return ia32_cc_float_below;
+               case ir_relation_less_equal:         return ia32_cc_float_below_equal;
+               case ir_relation_greater:            return ia32_cc_float_above;
+               case ir_relation_greater_equal:      return ia32_cc_float_above_equal;
+               case ir_relation_less_greater:       return ia32_cc_not_equal;
+               case ir_relation_less_equal_greater: return ia32_cc_not_parity;
+               case ir_relation_unordered:          return ia32_cc_parity;
+               case ir_relation_unordered_equal:    return ia32_cc_equal;
+               case ir_relation_unordered_less:   return ia32_cc_float_unordered_below;
+               case ir_relation_unordered_less_equal:
+                                            return ia32_cc_float_unordered_below_equal;
+               case ir_relation_unordered_greater:
+                                            return ia32_cc_float_unordered_above;
+               case ir_relation_unordered_greater_equal:
+                                            return ia32_cc_float_unordered_above_equal;
+               case ir_relation_unordered_less_greater:
+                                            return ia32_cc_float_not_equal;
+               case ir_relation_false:
+               case ir_relation_true:
+                       /* should we introduce a jump always/jump never? */
+                       break;
+               }
+               panic("Unexpected float pnc");
+       } else if (mode_is_signed(mode)) {
+               switch (relation) {
+               case ir_relation_unordered_equal:
+               case ir_relation_equal:                return ia32_cc_equal;
+               case ir_relation_unordered_less:
+               case ir_relation_less:                 return ia32_cc_less;
+               case ir_relation_unordered_less_equal:
+               case ir_relation_less_equal:           return ia32_cc_less_equal;
+               case ir_relation_unordered_greater:
+               case ir_relation_greater:              return ia32_cc_greater;
+               case ir_relation_unordered_greater_equal:
+               case ir_relation_greater_equal:        return ia32_cc_greater_equal;
+               case ir_relation_unordered_less_greater:
+               case ir_relation_less_greater:         return ia32_cc_not_equal;
+               case ir_relation_less_equal_greater:
+               case ir_relation_unordered:
+               case ir_relation_false:
+               case ir_relation_true:
+                       /* introduce jump always/jump never? */
+                       break;
+               }
+               panic("Unexpected pnc");
+       } else {
+               switch (relation) {
+               case ir_relation_unordered_equal:
+               case ir_relation_equal:         return ia32_cc_equal;
+               case ir_relation_unordered_less:
+               case ir_relation_less:          return ia32_cc_below;
+               case ir_relation_unordered_less_equal:
+               case ir_relation_less_equal:    return ia32_cc_below_equal;
+               case ir_relation_unordered_greater:
+               case ir_relation_greater:       return ia32_cc_above;
+               case ir_relation_unordered_greater_equal:
+               case ir_relation_greater_equal: return ia32_cc_above_equal;
+               case ir_relation_unordered_less_greater:
+               case ir_relation_less_greater:  return ia32_cc_not_equal;
+               case ir_relation_less_equal_greater:
+               case ir_relation_unordered:
+               case ir_relation_false:
+               case ir_relation_true:
+                       /* introduce jump always/jump never? */
+                       break;
+               }
+               panic("Unexpected pnc");
+       }
+}
 
-       /* we have a Cmp as input */
-       if (is_Proj(node)) {
-               ir_node *pred = get_Proj_pred(node);
-               if (is_Cmp(pred)) {
-                       int pnc = get_Proj_pn_cmp(node);
-                       if (ia32_cg_config.use_bt && (pnc == pn_Cmp_Lg || pnc == pn_Cmp_Eq)) {
-                               ir_node *l = get_Cmp_left(pred);
-                               ir_node *r = get_Cmp_right(pred);
-                               if (is_And(l)) {
-                                       ir_node *la = get_And_left(l);
-                                       ir_node *ra = get_And_right(l);
-                                       if (is_Shl(la)) {
-                                               ir_node *c = get_Shl_left(la);
-                                               if (is_Const_1(c) && (is_Const_0(r) || r == la)) {
-                                                       /* (1 << n) & ra) */
-                                                       ir_node *n = get_Shl_right(la);
-                                                       flags    = gen_bt(pred, ra, n);
-                                                       /* we must generate a Jc/Jnc jump */
-                                                       pnc = pnc == pn_Cmp_Lg ? pn_Cmp_Lt : pn_Cmp_Ge;
-                                                       if (r == la)
-                                                               pnc ^= pn_Cmp_Leg;
-                                                       *pnc_out = ia32_pn_Cmp_unsigned | pnc;
-                                                       return flags;
-                                               }
-                                       }
-                                       if (is_Shl(ra)) {
-                                               ir_node *c = get_Shl_left(ra);
-                                               if (is_Const_1(c) && (is_Const_0(r) || r == ra)) {
-                                                       /* la & (1 << n)) */
-                                                       ir_node *n = get_Shl_right(ra);
-                                                       flags    = gen_bt(pred, la, n);
-                                                       /* we must generate a Jc/Jnc jump */
-                                                       pnc = pnc == pn_Cmp_Lg ? pn_Cmp_Lt : pn_Cmp_Ge;
-                                                       if (r == ra)
-                                                               pnc ^= pn_Cmp_Leg;
-                                                       *pnc_out = ia32_pn_Cmp_unsigned | pnc;
-                                                       return flags;
-                                               }
-                                       }
-                               }
-                       }
-                       /* add ia32 compare flags */
-                       {
-                               ir_node *l    = get_Cmp_left(pred);
-                               ir_mode *mode = get_irn_mode(l);
-                               if (mode_is_float(mode))
-                                       pnc |= ia32_pn_Cmp_float;
-                               else if (! mode_is_signed(mode))
-                                       pnc |= ia32_pn_Cmp_unsigned;
+static ir_node *get_flags_mode_b(ir_node *node, ia32_condition_code_t *cc_out)
+{
+       /* a mode_b value, we have to compare it against 0 */
+       dbg_info *dbgi      = get_irn_dbg_info(node);
+       ir_node  *new_block = be_transform_node(get_nodes_block(node));
+       ir_node  *new_op    = be_transform_node(node);
+       ir_node  *flags     = new_bd_ia32_Test(dbgi, new_block, noreg_GP, noreg_GP, nomem, new_op, new_op, false);
+       *cc_out  = ia32_cc_not_equal;
+       return flags;
+}
+
+static ir_node *get_flags_node_cmp(ir_node *cmp, ia32_condition_code_t *cc_out)
+{
+       /* must have a Cmp as input */
+       ir_relation relation = get_Cmp_relation(cmp);
+       ir_relation possible;
+       ir_node    *l        = get_Cmp_left(cmp);
+       ir_node    *r        = get_Cmp_right(cmp);
+       ir_mode    *mode     = get_irn_mode(l);
+       ir_node    *flags;
+
+       /* check for bit-test */
+       if (ia32_cg_config.use_bt && (relation == ir_relation_equal
+                       || (mode_is_signed(mode) && relation == ir_relation_less_greater)
+                       || (!mode_is_signed(mode) && ((relation & ir_relation_greater_equal) == ir_relation_greater)))
+                   && is_And(l)) {
+               ir_node *la = get_And_left(l);
+               ir_node *ra = get_And_right(l);
+               if (is_Shl(ra)) {
+                       ir_node *tmp = la;
+                       la = ra;
+                       ra = tmp;
+               }
+               if (is_Shl(la)) {
+                       ir_node *c = get_Shl_left(la);
+                       if (is_Const_1(c) && is_Const_0(r)) {
+                               /* (1 << n) & ra) */
+                               ir_node *n = get_Shl_right(la);
+                               flags    = gen_bt(cmp, ra, n);
+                               /* the bit is copied into the CF flag */
+                               if (relation & ir_relation_equal)
+                                       *cc_out = ia32_cc_above_equal; /* test for CF=0 */
+                               else
+                                       *cc_out = ia32_cc_below;       /* test for CF=1 */
+                               return flags;
                        }
-                       *pnc_out = pnc;
-                       flags = be_transform_node(pred);
-                       return flags;
                }
        }
 
-       /* a mode_b value, we have to compare it against 0 */
-       dbgi      = get_irn_dbg_info(node);
-       new_block = be_transform_node(get_nodes_block(node));
-       new_op    = be_transform_node(node);
-       flags     = new_bd_ia32_Test(dbgi, new_block, noreg_GP, noreg_GP, nomem, new_op,
-                                    new_op, /*is_permuted=*/0, /*cmp_unsigned=*/0);
-       *pnc_out  = pn_Cmp_Lg;
+       /* the middle-end tries to eliminate impossible relations, so a ptr != 0
+        * test becomes ptr > 0. But for x86 an equal comparison is preferable to
+        * a >0 (we can sometimes eliminate the cmp in favor of flags produced by
+        * a predecessor node). So add the < bit */
+       possible = ir_get_possible_cmp_relations(l, r);
+       if (((relation & ir_relation_less) && !(possible & ir_relation_greater))
+         || ((relation & ir_relation_greater) && !(possible & ir_relation_less)))
+               relation |= ir_relation_less_greater;
+
+       /* just do a normal transformation of the Cmp */
+       *cc_out = relation_to_condition_code(relation, mode);
+       flags   = be_transform_node(cmp);
        return flags;
 }
 
+/**
+ * Transform a node returning a "flag" result.
+ *
+ * @param node    the node to transform
+ * @param cc_out  the compare mode to use
+ */
+static ir_node *get_flags_node(ir_node *node, ia32_condition_code_t *cc_out)
+{
+       if (is_Cmp(node))
+               return get_flags_node_cmp(node, cc_out);
+       assert(get_irn_mode(node) == mode_b);
+       return get_flags_mode_b(node, cc_out);
+}
+
 /**
  * Transforms a Load.
  *
@@ -2013,14 +2088,14 @@ static ir_node *get_flags_node(ir_node *node, int *pnc_out)
 static ir_node *gen_Load(ir_node *node)
 {
        ir_node  *old_block = get_nodes_block(node);
-       ir_node  *block   = be_transform_node(old_block);
-       ir_node  *ptr     = get_Load_ptr(node);
-       ir_node  *mem     = get_Load_mem(node);
-       ir_node  *new_mem = be_transform_node(mem);
+       ir_node  *block     = be_transform_node(old_block);
+       ir_node  *ptr       = get_Load_ptr(node);
+       ir_node  *mem       = get_Load_mem(node);
+       ir_node  *new_mem   = be_transform_node(mem);
+       dbg_info *dbgi      = get_irn_dbg_info(node);
+       ir_mode  *mode      = get_Load_mode(node);
        ir_node  *base;
        ir_node  *index;
-       dbg_info *dbgi    = get_irn_dbg_info(node);
-       ir_mode  *mode    = get_Load_mode(node);
        ir_node  *new_node;
        ia32_address_t addr;
 
@@ -2076,7 +2151,6 @@ static ir_node *gen_Load(ir_node *node)
 
        SET_IA32_ORIG_NODE(new_node, node);
 
-       be_dep_on_frame(new_node);
        return new_node;
 }
 
@@ -2105,14 +2179,14 @@ static int use_dest_am(ir_node *block, ir_node *node, ir_node *mem,
        /* don't do AM if other node inputs depend on the load (via mem-proj) */
        if (other != NULL                   &&
            get_nodes_block(other) == block &&
-           heights_reachable_in_block(heights, other, load)) {
+           heights_reachable_in_block(ia32_heights, other, load)) {
                return 0;
        }
 
-       if (prevents_AM(block, load, mem))
+       if (ia32_prevents_AM(block, load, mem))
                return 0;
        /* Store should be attached to the load via mem */
-       assert(heights_reachable_in_block(heights, mem, load));
+       assert(heights_reachable_in_block(ia32_heights, mem, load));
 
        return 1;
 }
@@ -2171,7 +2245,8 @@ static ir_node *dest_am_binop(ir_node *node, ir_node *op1, ir_node *op2,
 
        be_set_transformed_node(get_Proj_pred(am.mem_proj), new_node);
        mem_proj = be_transform_node(am.mem_proj);
-       be_set_transformed_node(mem_proj ? mem_proj : am.mem_proj, new_node);
+       be_set_transformed_node(am.mem_proj, new_node);
+       be_set_transformed_node(mem_proj, new_node);
 
        return new_node;
 }
@@ -2206,31 +2281,26 @@ static ir_node *dest_am_unop(ir_node *node, ir_node *op, ir_node *mem,
 
        be_set_transformed_node(get_Proj_pred(am.mem_proj), new_node);
        mem_proj = be_transform_node(am.mem_proj);
-       be_set_transformed_node(mem_proj ? mem_proj : am.mem_proj, new_node);
+       be_set_transformed_node(am.mem_proj, new_node);
+       be_set_transformed_node(mem_proj, new_node);
 
        return new_node;
 }
 
-static int ia32_get_negated_pnc(int pnc)
-{
-       ir_mode *mode = pnc & ia32_pn_Cmp_float ? mode_F : mode_Iu;
-       return get_negated_pnc(pnc, mode);
-}
-
 static ir_node *try_create_SetMem(ir_node *node, ir_node *ptr, ir_node *mem)
 {
-       ir_mode        *mode      = get_irn_mode(node);
-       ir_node        *mux_true  = get_Mux_true(node);
-       ir_node        *mux_false = get_Mux_false(node);
-       ir_node        *cond;
-       dbg_info       *dbgi;
-       ir_node        *block;
-       ir_node        *new_block;
-       ir_node        *flags;
-       ir_node        *new_node;
-       bool            negated;
-       int             pnc;
-       ia32_address_t  addr;
+       ir_mode              *mode      = get_irn_mode(node);
+       ir_node              *mux_true  = get_Mux_true(node);
+       ir_node              *mux_false = get_Mux_false(node);
+       ir_node              *cond;
+       dbg_info             *dbgi;
+       ir_node              *block;
+       ir_node              *new_block;
+       ir_node              *flags;
+       ir_node              *new_node;
+       bool                  negated;
+       ia32_condition_code_t cc;
+       ia32_address_t        addr;
 
        if (get_mode_size_bits(mode) != 8)
                return NULL;
@@ -2244,12 +2314,12 @@ static ir_node *try_create_SetMem(ir_node *node, ir_node *ptr, ir_node *mem)
        }
 
        cond  = get_Mux_sel(node);
-       flags = get_flags_node(cond, &pnc);
+       flags = get_flags_node(cond, &cc);
        /* we can't handle the float special cases with SetM */
-       if (pnc & ia32_pn_Cmp_float)
+       if (cc & ia32_cc_additional_float_cases)
                return NULL;
        if (negated)
-               pnc = ia32_get_negated_pnc(pnc);
+               cc = ia32_negate_condition_code(cc);
 
        build_address_ptr(&addr, ptr, mem);
 
@@ -2257,7 +2327,7 @@ static ir_node *try_create_SetMem(ir_node *node, ir_node *ptr, ir_node *mem)
        block     = get_nodes_block(node);
        new_block = be_transform_node(block);
        new_node  = new_bd_ia32_SetccMem(dbgi, new_block, addr.base,
-                                        addr.index, addr.mem, flags, pnc);
+                                        addr.index, addr.mem, flags, cc);
        set_address(new_node, &addr);
        set_ia32_op_type(new_node, ia32_AddrModeD);
        set_ia32_ls_mode(new_node, mode);
@@ -2457,7 +2527,7 @@ static ir_node *gen_float_const_Store(ir_node *node, ir_node *cns)
        ir_node        *mem       = get_Store_mem(node);
        dbg_info       *dbgi      = get_irn_dbg_info(node);
        int             ofs       = 0;
-       size_t          i         = 0;
+       int             i         = 0;
        ir_node        *ins[4];
        ia32_address_t  addr;
 
@@ -2697,23 +2767,23 @@ static ir_node *create_Switch(ir_node *node)
  */
 static ir_node *gen_Cond(ir_node *node)
 {
-       ir_node  *block     = get_nodes_block(node);
-       ir_node  *new_block = be_transform_node(block);
-       dbg_info *dbgi      = get_irn_dbg_info(node);
-       ir_node  *sel       = get_Cond_selector(node);
-       ir_mode  *sel_mode  = get_irn_mode(sel);
-       ir_node  *flags     = NULL;
-       ir_node  *new_node;
-       int       pnc;
+       ir_node              *block     = get_nodes_block(node);
+       ir_node              *new_block = be_transform_node(block);
+       dbg_info             *dbgi      = get_irn_dbg_info(node);
+       ir_node              *sel       = get_Cond_selector(node);
+       ir_mode              *sel_mode  = get_irn_mode(sel);
+       ir_node              *flags     = NULL;
+       ir_node              *new_node;
+       ia32_condition_code_t cc;
 
        if (sel_mode != mode_b) {
                return create_Switch(node);
        }
 
        /* we get flags from a Cmp */
-       flags = get_flags_node(sel, &pnc);
+       flags = get_flags_node(sel, &cc);
 
-       new_node = new_bd_ia32_Jcc(dbgi, new_block, flags, pnc);
+       new_node = new_bd_ia32_Jcc(dbgi, new_block, flags, cc);
        SET_IA32_ORIG_NODE(new_node, node);
 
        return new_node;
@@ -2796,25 +2866,6 @@ static ir_node *create_Ucomi(ir_node *node)
        return new_node;
 }
 
-/**
- * helper function: checks whether all Cmp projs are Lg or Eq which is needed
- * to fold an and into a test node
- */
-static bool can_fold_test_and(ir_node *node)
-{
-       const ir_edge_t *edge;
-
-       /** we can only have eq and lg projs */
-       foreach_out_edge(node, edge) {
-               ir_node *proj = get_edge_src_irn(edge);
-               pn_Cmp   pnc  = get_Proj_pn_cmp(proj);
-               if (pnc != pn_Cmp_Eq && pnc != pn_Cmp_Lg)
-                       return false;
-       }
-
-       return true;
-}
-
 /**
  * returns true if it is assured, that the upper bits of a node are "clean"
  * which means for a 16 or 8 bit value, that the upper bits in the register
@@ -2909,7 +2960,6 @@ static ir_node *gen_Cmp(ir_node *node)
        ir_node  *new_node;
        ia32_address_mode_t  am;
        ia32_address_t      *addr = &am.addr;
-       int                  cmp_unsigned;
 
        if (mode_is_float(cmp_mode)) {
                if (ia32_cg_config.use_sse2) {
@@ -2922,11 +2972,9 @@ static ir_node *gen_Cmp(ir_node *node)
        assert(ia32_mode_needs_gp_reg(cmp_mode));
 
        /* Prefer the Test instruction, when encountering (x & y) ==/!= 0 */
-       cmp_unsigned = !mode_is_signed(cmp_mode);
        if (is_Const_0(right)          &&
            is_And(left)               &&
-           get_irn_n_edges(left) == 1 &&
-           can_fold_test_and(node)) {
+           get_irn_n_edges(left) == 1) {
                /* Test(and_left, and_right) */
                ir_node *and_left  = get_And_left(left);
                ir_node *and_right = get_And_right(left);
@@ -2950,11 +2998,10 @@ static ir_node *gen_Cmp(ir_node *node)
 
                if (get_mode_size_bits(cmp_mode) == 8) {
                        new_node = new_bd_ia32_Test8Bit(dbgi, new_block, addr->base,
-                                       addr->index, addr->mem, am.new_op1, am.new_op2, am.ins_permuted,
-                                       cmp_unsigned);
+                                       addr->index, addr->mem, am.new_op1, am.new_op2, am.ins_permuted);
                } else {
                        new_node = new_bd_ia32_Test(dbgi, new_block, addr->base, addr->index,
-                                       addr->mem, am.new_op1, am.new_op2, am.ins_permuted, cmp_unsigned);
+                                       addr->mem, am.new_op1, am.new_op2, am.ins_permuted);
                }
        } else {
                /* Cmp(left, right) */
@@ -2971,11 +3018,10 @@ static ir_node *gen_Cmp(ir_node *node)
                if (get_mode_size_bits(cmp_mode) == 8) {
                        new_node = new_bd_ia32_Cmp8Bit(dbgi, new_block, addr->base,
                                                       addr->index, addr->mem, am.new_op1,
-                                                      am.new_op2, am.ins_permuted,
-                                                      cmp_unsigned);
+                                                      am.new_op2, am.ins_permuted);
                } else {
                        new_node = new_bd_ia32_Cmp(dbgi, new_block, addr->base, addr->index,
-                                       addr->mem, am.new_op1, am.new_op2, am.ins_permuted, cmp_unsigned);
+                                       addr->mem, am.new_op1, am.new_op2, am.ins_permuted);
                }
        }
        set_am_attributes(new_node, &am);
@@ -2989,7 +3035,7 @@ static ir_node *gen_Cmp(ir_node *node)
 }
 
 static ir_node *create_CMov(ir_node *node, ir_node *flags, ir_node *new_flags,
-                            int pnc)
+                            ia32_condition_code_t cc)
 {
        dbg_info            *dbgi          = get_irn_dbg_info(node);
        ir_node             *block         = get_nodes_block(node);
@@ -3009,11 +3055,11 @@ static ir_node *create_CMov(ir_node *node, ir_node *flags, ir_node *new_flags,
                        match_commutative | match_am | match_16bit_am | match_mode_neutral);
 
        if (am.ins_permuted)
-               pnc = ia32_get_negated_pnc(pnc);
+               cc = ia32_negate_condition_code(cc);
 
        new_node = new_bd_ia32_CMovcc(dbgi, new_block, addr->base, addr->index,
                                      addr->mem, am.new_op1, am.new_op2, new_flags,
-                                     pnc);
+                                     cc);
        set_am_attributes(new_node, &am);
 
        SET_IA32_ORIG_NODE(new_node, node);
@@ -3027,13 +3073,13 @@ static ir_node *create_CMov(ir_node *node, ir_node *flags, ir_node *new_flags,
  * Creates a ia32 Setcc instruction.
  */
 static ir_node *create_set_32bit(dbg_info *dbgi, ir_node *new_block,
-                                 ir_node *flags, int pnc,
+                                 ir_node *flags, ia32_condition_code_t cc,
                                  ir_node *orig_node)
 {
        ir_mode *mode  = get_irn_mode(orig_node);
        ir_node *new_node;
 
-       new_node = new_bd_ia32_Setcc(dbgi, new_block, flags, pnc);
+       new_node = new_bd_ia32_Setcc(dbgi, new_block, flags, cc);
        SET_IA32_ORIG_NODE(new_node, orig_node);
 
        /* we might need to conv the result up */
@@ -3068,12 +3114,12 @@ static ir_node *create_doz(ir_node *psi, ir_node *a, ir_node *b)
 
        if (is_Proj(new_node)) {
                sub = get_Proj_pred(new_node);
-               assert(is_ia32_Sub(sub));
        } else {
                sub = new_node;
                set_irn_mode(sub, mode_T);
                new_node = new_rd_Proj(NULL, sub, mode, pn_ia32_res);
        }
+       assert(is_ia32_Sub(sub));
        eflags = new_rd_Proj(NULL, sub, mode_Iu, pn_ia32_Sub_flags);
 
        dbgi = get_irn_dbg_info(psi);
@@ -3161,8 +3207,8 @@ enum setcc_transform_insn {
 };
 
 typedef struct setcc_transform {
-       unsigned num_steps;
-       int      pnc;
+       unsigned              num_steps;
+       ia32_condition_code_t cc;
        struct {
                enum setcc_transform_insn  transform;
                long val;
@@ -3175,7 +3221,8 @@ typedef struct setcc_transform {
  * Find a transformation that creates 0 and 1 from
  * tv_t and tv_f.
  */
-static void find_const_transform(int pnc, ir_tarval *t, ir_tarval *f,
+static void find_const_transform(ia32_condition_code_t cc,
+                                 ir_tarval *t, ir_tarval *f,
                                  setcc_transform_t *res)
 {
        unsigned step = 0;
@@ -3186,15 +3233,15 @@ static void find_const_transform(int pnc, ir_tarval *t, ir_tarval *f,
                ir_tarval *tmp = t;
                t = f;
                f = tmp;
-               pnc = ia32_get_negated_pnc(pnc);
-       } else if (tarval_cmp(t, f) == pn_Cmp_Lt) {
+               cc = ia32_negate_condition_code(cc);
+       } else if (tarval_cmp(t, f) == ir_relation_less) {
                // now, t is the bigger one
                ir_tarval *tmp = t;
                t = f;
                f = tmp;
-               pnc = ia32_get_negated_pnc(pnc);
+               cc = ia32_negate_condition_code(cc);
        }
-       res->pnc = pnc;
+       res->cc = cc;
 
        if (! tarval_is_null(f)) {
                ir_tarval *t_sub = tarval_sub(t, f, NULL);
@@ -3299,34 +3346,33 @@ static void find_const_transform(int pnc, ir_tarval *t, ir_tarval *f,
  */
 static ir_node *gen_Mux(ir_node *node)
 {
-       dbg_info *dbgi      = get_irn_dbg_info(node);
-       ir_node  *block     = get_nodes_block(node);
-       ir_node  *new_block = be_transform_node(block);
-       ir_node  *mux_true  = get_Mux_true(node);
-       ir_node  *mux_false = get_Mux_false(node);
-       ir_node  *cond      = get_Mux_sel(node);
-       ir_mode  *mode      = get_irn_mode(node);
-       ir_node  *flags;
-       ir_node  *new_node;
-       int       is_abs;
-       int       pnc;
-
-       assert(get_irn_mode(cond) == mode_b);
-
-       is_abs = be_mux_is_abs(cond, mux_true, mux_false);
+       dbg_info             *dbgi      = get_irn_dbg_info(node);
+       ir_node              *block     = get_nodes_block(node);
+       ir_node              *new_block = be_transform_node(block);
+       ir_node              *mux_true  = get_Mux_true(node);
+       ir_node              *mux_false = get_Mux_false(node);
+       ir_node              *sel       = get_Mux_sel(node);
+       ir_mode              *mode      = get_irn_mode(node);
+       ir_node              *flags;
+       ir_node              *new_node;
+       int                   is_abs;
+       ia32_condition_code_t cc;
+
+       assert(get_irn_mode(sel) == mode_b);
+
+       is_abs = be_mux_is_abs(sel, mux_true, mux_false);
        if (is_abs != 0) {
-               return create_abs(dbgi, block, be_get_abs_op(cond), is_abs < 0, node);
+               return create_abs(dbgi, block, be_get_abs_op(sel), is_abs < 0, node);
        }
 
        /* Note: a Mux node uses a Load two times IFF it's used in the compare AND in the result */
        if (mode_is_float(mode)) {
-               ir_node  *cmp         = get_Proj_pred(cond);
-               ir_node  *cmp_left    = get_Cmp_left(cmp);
-               ir_node  *cmp_right   = get_Cmp_right(cmp);
-               int       pnc         = get_Proj_proj(cond);
+               ir_node    *cmp_left  = get_Cmp_left(sel);
+               ir_node    *cmp_right = get_Cmp_right(sel);
+               ir_relation relation  = get_Cmp_relation(sel);
 
                if (ia32_cg_config.use_sse2) {
-                       if (pnc == pn_Cmp_Lt || pnc == pn_Cmp_Le) {
+                       if (relation == ir_relation_less || relation == ir_relation_less_equal) {
                                if (cmp_left == mux_true && cmp_right == mux_false) {
                                        /* Mux(a <= b, a, b) => MIN */
                                        return gen_binop(node, cmp_left, cmp_right, new_bd_ia32_xMin,
@@ -3336,7 +3382,7 @@ static ir_node *gen_Mux(ir_node *node)
                                        return gen_binop(node, cmp_left, cmp_right, new_bd_ia32_xMax,
                                         match_commutative | match_am | match_two_users);
                                }
-                       } else if (pnc == pn_Cmp_Gt || pnc == pn_Cmp_Ge) {
+                       } else if (relation == ir_relation_greater || relation == ir_relation_greater_equal) {
                                if (cmp_left == mux_true && cmp_right == mux_false) {
                                        /* Mux(a >= b, a, b) => MAX */
                                        return gen_binop(node, cmp_left, cmp_right, new_bd_ia32_xMax,
@@ -3355,8 +3401,8 @@ static ir_node *gen_Mux(ir_node *node)
                        ir_mode             *new_mode;
                        unsigned            scale;
 
-                       flags    = get_flags_node(cond, &pnc);
-                       new_node = create_set_32bit(dbgi, new_block, flags, pnc, node);
+                       flags    = get_flags_node(sel, &cc);
+                       new_node = create_set_32bit(dbgi, new_block, flags, cc, node);
 
                        if (ia32_cg_config.use_sse2) {
                                /* cannot load from different mode on SSE */
@@ -3390,7 +3436,7 @@ static ir_node *gen_Mux(ir_node *node)
                        case 16:
                                /* arg, shift 16 NOT supported */
                                scale = 3;
-                               new_node = new_bd_ia32_Add(dbgi, new_block, noreg_GP, noreg_GP, nomem, new_node, new_node);
+                               new_node = new_bd_ia32_Lea(dbgi, new_block, new_node, new_node);
                                break;
                        default:
                                panic("Unsupported constant size");
@@ -3403,6 +3449,7 @@ static ir_node *gen_Mux(ir_node *node)
                        am.addr.offset        = 0;
                        am.addr.scale         = scale;
                        am.addr.use_frame     = 0;
+                       am.addr.tls_segment   = false;
                        am.addr.frame_entity  = NULL;
                        am.addr.symconst_sign = 0;
                        am.mem_proj           = am.addr.mem;
@@ -3411,7 +3458,7 @@ static ir_node *gen_Mux(ir_node *node)
                        am.new_op2            = NULL;
                        am.pinned             = op_pin_state_floats;
                        am.commutative        = 1;
-                       am.ins_permuted       = 0;
+                       am.ins_permuted       = false;
 
                        if (ia32_cg_config.use_sse2)
                                load = new_bd_ia32_xLoad(dbgi, block, am.addr.base, am.addr.index, am.addr.mem, new_mode);
@@ -3426,37 +3473,34 @@ static ir_node *gen_Mux(ir_node *node)
        } else {
                assert(ia32_mode_needs_gp_reg(mode));
 
-               if (is_Proj(cond)) {
-                       ir_node *cmp = get_Proj_pred(cond);
-                       if (is_Cmp(cmp)) {
-                               ir_node  *cmp_left  = get_Cmp_left(cmp);
-                               ir_node  *cmp_right = get_Cmp_right(cmp);
-                               ir_node  *val_true  = mux_true;
-                               ir_node  *val_false = mux_false;
-                               int       pnc       = get_Proj_proj(cond);
-
-                               if (is_Const(val_true) && is_Const_null(val_true)) {
-                                       ir_node *tmp = val_false;
-                                       val_false = val_true;
-                                       val_true  = tmp;
-                                       pnc       = ia32_get_negated_pnc(pnc);
+               if (is_Cmp(sel)) {
+                       ir_node    *cmp_left  = get_Cmp_left(sel);
+                       ir_node    *cmp_right = get_Cmp_right(sel);
+                       ir_relation relation  = get_Cmp_relation(sel);
+                       ir_node    *val_true  = mux_true;
+                       ir_node    *val_false = mux_false;
+
+                       if (is_Const(val_true) && is_Const_null(val_true)) {
+                               ir_node *tmp = val_false;
+                               val_false = val_true;
+                               val_true  = tmp;
+                               relation  = get_negated_relation(relation);
+                       }
+                       if (is_Const_0(val_false) && is_Sub(val_true)) {
+                               if ((relation & ir_relation_greater)
+                                       && get_Sub_left(val_true) == cmp_left
+                                       && get_Sub_right(val_true) == cmp_right) {
+                                       return create_doz(node, cmp_left, cmp_right);
                                }
-                               if (is_Const_0(val_false) && is_Sub(val_true)) {
-                                       if ((pnc == pn_Cmp_Gt || pnc == pn_Cmp_Ge)
-                                               && get_Sub_left(val_true) == cmp_left
-                                               && get_Sub_right(val_true) == cmp_right) {
-                                               return create_doz(node, cmp_left, cmp_right);
-                                       }
-                                       if ((pnc == pn_Cmp_Lt || pnc == pn_Cmp_Le)
-                                               && get_Sub_left(val_true) == cmp_right
-                                               && get_Sub_right(val_true) == cmp_left) {
-                                               return create_doz(node, cmp_right, cmp_left);
-                                       }
+                               if ((relation & ir_relation_less)
+                                       && get_Sub_left(val_true) == cmp_right
+                                       && get_Sub_right(val_true) == cmp_left) {
+                                       return create_doz(node, cmp_right, cmp_left);
                                }
                        }
                }
 
-               flags = get_flags_node(cond, &pnc);
+               flags = get_flags_node(sel, &cc);
 
                if (is_Const(mux_true) && is_Const(mux_false)) {
                        /* both are const, good */
@@ -3465,15 +3509,15 @@ static ir_node *gen_Mux(ir_node *node)
                        setcc_transform_t res;
                        int step;
 
-                       find_const_transform(pnc, tv_true, tv_false, &res);
+                       find_const_transform(cc, tv_true, tv_false, &res);
                        new_node = node;
                        for (step = (int)res.num_steps - 1; step >= 0; --step) {
                                ir_node *imm;
 
                                switch (res.steps[step].transform) {
                                case SETCC_TR_ADD:
-                                       imm = ia32_immediate_from_long(res.steps[step].val);
-                                       new_node = new_bd_ia32_Add(dbgi, new_block, noreg_GP, noreg_GP, nomem, new_node, imm);
+                                       new_node = new_bd_ia32_Lea(dbgi, new_block, new_node, noreg_GP);
+                                       add_ia32_am_offs_int(new_node, res.steps[step].val);
                                        break;
                                case SETCC_TR_ADDxx:
                                        new_node = new_bd_ia32_Lea(dbgi, new_block, new_node, new_node);
@@ -3503,7 +3547,7 @@ static ir_node *gen_Mux(ir_node *node)
                                        new_node = new_bd_ia32_And(dbgi, new_block, noreg_GP, noreg_GP, nomem, new_node, imm);
                                        break;
                                case SETCC_TR_SET:
-                                       new_node = create_set_32bit(dbgi, new_block, flags, res.pnc, node);
+                                       new_node = create_set_32bit(dbgi, new_block, flags, res.cc, node);
                                        break;
                                case SETCC_TR_SBB:
                                        new_node = new_bd_ia32_Sbb0(dbgi, new_block, flags);
@@ -3513,7 +3557,7 @@ static ir_node *gen_Mux(ir_node *node)
                                }
                        }
                } else {
-                       new_node = create_CMov(node, cond, flags, pnc);
+                       new_node = create_CMov(node, sel, flags, cc);
                }
                return new_node;
        }
@@ -3874,7 +3918,7 @@ static ir_node *gen_Conv(ir_node *node)
 static ir_node *create_immediate_or_transform(ir_node *node,
                                               char immediate_constraint_type)
 {
-       ir_node *new_node = try_create_Immediate(node, immediate_constraint_type);
+       ir_node *new_node = ia32_try_create_Immediate(node, immediate_constraint_type);
        if (new_node == NULL) {
                new_node = be_transform_node(node);
        }
@@ -3906,19 +3950,23 @@ static ir_node *gen_be_FrameAddr(ir_node *node)
  */
 static ir_node *gen_be_Return(ir_node *node)
 {
-       ir_graph  *irg     = current_ir_graph;
-       ir_node   *ret_val = get_irn_n(node, be_pos_Return_val);
-       ir_node   *ret_mem = get_irn_n(node, be_pos_Return_mem);
-       ir_entity *ent     = get_irg_entity(irg);
-       ir_type   *tp      = get_entity_type(ent);
-       dbg_info  *dbgi;
-       ir_node   *block;
+       ir_graph  *irg         = current_ir_graph;
+       ir_node   *ret_val     = get_irn_n(node, n_be_Return_val);
+       ir_node   *ret_mem     = get_irn_n(node, n_be_Return_mem);
+       ir_node   *new_ret_val = be_transform_node(ret_val);
+       ir_node   *new_ret_mem = be_transform_node(ret_mem);
+       ir_entity *ent         = get_irg_entity(irg);
+       ir_type   *tp          = get_entity_type(ent);
+       dbg_info  *dbgi        = get_irn_dbg_info(node);
+       ir_node   *block       = be_transform_node(get_nodes_block(node));
        ir_type   *res_type;
        ir_mode   *mode;
-       ir_node   *frame, *sse_store, *fld, *mproj, *barrier;
-       ir_node   *new_barrier, *new_ret_val, *new_ret_mem;
-       ir_node   **in;
-       int       pn_ret_val, pn_ret_mem, arity, i;
+       ir_node   *frame, *sse_store, *fld, *mproj;
+       int        i;
+       int        arity;
+       unsigned   pop;
+       ir_node  **in;
+       ir_node   *new_node;
 
        assert(ret_val != NULL);
        if (be_Return_get_n_rets(node) < 1 || ! ia32_cg_config.use_sse2) {
@@ -3938,25 +3986,8 @@ static ir_node *gen_be_Return(ir_node *node)
 
        assert(get_method_n_ress(tp) == 1);
 
-       pn_ret_val = get_Proj_proj(ret_val);
-       pn_ret_mem = get_Proj_proj(ret_mem);
-
-       /* get the Barrier */
-       barrier = get_Proj_pred(ret_val);
-
-       /* get result input of the Barrier */
-       ret_val     = get_irn_n(barrier, pn_ret_val);
-       new_ret_val = be_transform_node(ret_val);
-
-       /* get memory input of the Barrier */
-       ret_mem     = get_irn_n(barrier, pn_ret_mem);
-       new_ret_mem = be_transform_node(ret_mem);
-
        frame = get_irg_frame(irg);
 
-       dbgi  = get_irn_dbg_info(barrier);
-       block = be_transform_node(get_nodes_block(barrier));
-
        /* store xmm0 onto stack */
        sse_store = new_bd_ia32_xStoreSimple(dbgi, block, frame, noreg_GP,
                                             new_ret_mem, new_ret_val);
@@ -3972,32 +4003,24 @@ static ir_node *gen_be_Return(ir_node *node)
        mproj = new_r_Proj(fld, mode_M, pn_ia32_vfld_M);
        fld   = new_r_Proj(fld, mode_vfp, pn_ia32_vfld_res);
 
-       /* create a new barrier */
-       arity = get_irn_arity(barrier);
+       /* create a new return */
+       arity = get_irn_arity(node);
        in    = ALLOCAN(ir_node*, arity);
+       pop   = be_Return_get_pop(node);
        for (i = 0; i < arity; ++i) {
-               ir_node *new_in;
-
-               if (i == pn_ret_val) {
-                       new_in = fld;
-               } else if (i == pn_ret_mem) {
-                       new_in = mproj;
+               ir_node *op = get_irn_n(node, i);
+               if (op == ret_val) {
+                       in[i] = fld;
+               } else if (op == ret_mem) {
+                       in[i] = mproj;
                } else {
-                       ir_node *in = get_irn_n(barrier, i);
-                       new_in = be_transform_node(in);
+                       in[i] = be_transform_node(op);
                }
-               in[i] = new_in;
        }
+       new_node = be_new_Return(dbgi, irg, block, arity, pop, arity, in);
+       copy_node_attr(irg, node, new_node);
 
-       new_barrier = new_ir_node(dbgi, irg, block,
-                                 get_irn_op(barrier), get_irn_mode(barrier),
-                                 arity, in);
-       copy_node_attr(irg, barrier, new_barrier);
-       be_duplicate_deps(barrier, new_barrier);
-       be_set_transformed_node(barrier, new_barrier);
-
-       /* transform normally */
-       return be_duplicate_node(node);
+       return new_node;
 }
 
 /**
@@ -4005,11 +4028,15 @@ static ir_node *gen_be_Return(ir_node *node)
  */
 static ir_node *gen_be_AddSP(ir_node *node)
 {
-       ir_node  *sz = get_irn_n(node, be_pos_AddSP_size);
-       ir_node  *sp = get_irn_n(node, be_pos_AddSP_old_sp);
+       ir_node *sz = get_irn_n(node, n_be_AddSP_size);
+       ir_node *sp = get_irn_n(node, n_be_AddSP_old_sp);
 
-       return gen_binop(node, sp, sz, new_bd_ia32_SubSP,
-                        match_am | match_immediate);
+       ir_node *new_node = gen_binop(node, sp, sz, new_bd_ia32_SubSP,
+                                     match_am | match_immediate);
+       assert(is_ia32_SubSP(new_node));
+       arch_irn_set_register(new_node, pn_ia32_SubSP_stack,
+                             &ia32_registers[REG_ESP]);
+       return new_node;
 }
 
 /**
@@ -4017,11 +4044,15 @@ static ir_node *gen_be_AddSP(ir_node *node)
  */
 static ir_node *gen_be_SubSP(ir_node *node)
 {
-       ir_node  *sz = get_irn_n(node, be_pos_SubSP_size);
-       ir_node  *sp = get_irn_n(node, be_pos_SubSP_old_sp);
+       ir_node *sz = get_irn_n(node, n_be_SubSP_size);
+       ir_node *sp = get_irn_n(node, n_be_SubSP_old_sp);
 
-       return gen_binop(node, sp, sz, new_bd_ia32_AddSP,
-                        match_am | match_immediate);
+       ir_node *new_node = gen_binop(node, sp, sz, new_bd_ia32_AddSP,
+                                     match_am | match_immediate);
+       assert(is_ia32_AddSP(new_node));
+       arch_irn_set_register(new_node, pn_ia32_AddSP_stack,
+                             &ia32_registers[REG_ESP]);
+       return new_node;
 }
 
 /**
@@ -4108,41 +4139,6 @@ static ir_node *gen_IJmp(ir_node *node)
        return new_node;
 }
 
-/**
- * Transform a Bound node.
- */
-static ir_node *gen_Bound(ir_node *node)
-{
-       ir_node  *new_node;
-       ir_node  *lower = get_Bound_lower(node);
-       dbg_info *dbgi  = get_irn_dbg_info(node);
-
-       if (is_Const_0(lower)) {
-               /* typical case for Java */
-               ir_node  *sub, *res, *flags, *block;
-
-               res = gen_binop(node, get_Bound_index(node), get_Bound_upper(node),
-                               new_bd_ia32_Sub,
-                               match_mode_neutral | match_am | match_immediate);
-
-               block = get_nodes_block(res);
-               if (! is_Proj(res)) {
-                       sub = res;
-                       set_irn_mode(sub, mode_T);
-                       res = new_rd_Proj(NULL, sub, mode_Iu, pn_ia32_res);
-               } else {
-                       sub = get_Proj_pred(res);
-               }
-               flags = new_rd_Proj(NULL, sub, mode_Iu, pn_ia32_Sub_flags);
-               new_node = new_bd_ia32_Jcc(dbgi, block, flags, pn_Cmp_Lt | ia32_pn_Cmp_unsigned);
-               SET_IA32_ORIG_NODE(new_node, node);
-       } else {
-               panic("generic Bound not supported in ia32 Backend");
-       }
-       return new_node;
-}
-
-
 static ir_node *gen_ia32_l_ShlDep(ir_node *node)
 {
        ir_node *left  = get_irn_n(node, n_ia32_l_ShlDep_val);
@@ -4362,6 +4358,7 @@ static ir_node *gen_ia32_l_LLtoFloat(ir_node *node)
                am.addr.offset        = 0;
                am.addr.scale         = 2;
                am.addr.symconst_ent  = ia32_gen_fp_known_const(ia32_ULLBIAS);
+               am.addr.tls_segment   = false;
                am.addr.use_frame     = 0;
                am.addr.frame_entity  = NULL;
                am.addr.symconst_sign = 0;
@@ -4372,7 +4369,7 @@ static ir_node *gen_ia32_l_LLtoFloat(ir_node *node)
                am.new_op2            = ia32_new_NoReg_vfp(current_ir_graph);
                am.pinned             = op_pin_state_floats;
                am.commutative        = 1;
-               am.ins_permuted       = 0;
+               am.ins_permuted       = false;
 
                fadd  = new_bd_ia32_vfadd(dbgi, block, am.addr.base, am.addr.index, am.addr.mem,
                        am.new_op1, am.new_op2, get_fpcw());
@@ -4584,9 +4581,9 @@ static ir_node *gen_Proj_Load(ir_node *node)
 }
 
 /**
- * Transform and renumber the Projs from a DivMod like instruction.
+ * Transform and renumber the Projs from a Div or Mod instruction.
  */
-static ir_node *gen_Proj_DivMod(ir_node *node)
+static ir_node *gen_Proj_Div(ir_node *node)
 {
        ir_node  *block    = be_transform_node(get_nodes_block(node));
        ir_node  *pred     = get_Proj_pred(node);
@@ -4594,90 +4591,74 @@ static ir_node *gen_Proj_DivMod(ir_node *node)
        dbg_info *dbgi     = get_irn_dbg_info(node);
        long     proj      = get_Proj_proj(node);
 
-       assert(is_ia32_Div(new_pred) || is_ia32_IDiv(new_pred));
+       assert(pn_ia32_Div_M == pn_ia32_IDiv_M);
+       assert(pn_ia32_Div_div_res == pn_ia32_IDiv_div_res);
 
-       switch (get_irn_opcode(pred)) {
-       case iro_Div:
-               switch (proj) {
-               case pn_Div_M:
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_Div_M);
-               case pn_Div_res:
-                       return new_rd_Proj(dbgi, new_pred, mode_Iu, pn_ia32_Div_div_res);
-               case pn_Div_X_regular:
-                       return new_rd_Jmp(dbgi, block);
-               case pn_Div_X_except:
-                       set_ia32_exc_label(new_pred, 1);
-                       return new_rd_Proj(dbgi, new_pred, mode_X, pn_ia32_Div_X_exc);
-               default:
-                       break;
-               }
-               break;
-       case iro_Mod:
-               switch (proj) {
-               case pn_Mod_M:
+       switch (proj) {
+       case pn_Div_M:
+               if (is_ia32_Div(new_pred) || is_ia32_IDiv(new_pred)) {
                        return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_Div_M);
-               case pn_Mod_res:
-                       return new_rd_Proj(dbgi, new_pred, mode_Iu, pn_ia32_Div_mod_res);
-               case pn_Mod_X_except:
-                       set_ia32_exc_label(new_pred, 1);
-                       return new_rd_Proj(dbgi, new_pred, mode_X, pn_ia32_Div_X_exc);
-               default:
-                       break;
+               } else if (is_ia32_xDiv(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_xDiv_M);
+               } else if (is_ia32_vfdiv(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_vfdiv_M);
+               } else {
+                       panic("Div transformed to unexpected thing %+F", new_pred);
                }
-               break;
-       case iro_DivMod:
-               switch (proj) {
-               case pn_DivMod_M:
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_Div_M);
-               case pn_DivMod_res_div:
+       case pn_Div_res:
+               if (is_ia32_Div(new_pred) || is_ia32_IDiv(new_pred)) {
                        return new_rd_Proj(dbgi, new_pred, mode_Iu, pn_ia32_Div_div_res);
-               case pn_DivMod_res_mod:
-                       return new_rd_Proj(dbgi, new_pred, mode_Iu, pn_ia32_Div_mod_res);
-               case pn_DivMod_X_regular:
-                       return new_rd_Jmp(dbgi, block);
-               case pn_DivMod_X_except:
-                       set_ia32_exc_label(new_pred, 1);
-                       return new_rd_Proj(dbgi, new_pred, mode_X, pn_ia32_Div_X_exc);
-               default:
-                       break;
+               } else if (is_ia32_xDiv(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_xmm, pn_ia32_xDiv_res);
+               } else if (is_ia32_vfdiv(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_vfp, pn_ia32_vfdiv_res);
+               } else {
+                       panic("Div transformed to unexpected thing %+F", new_pred);
                }
-               break;
+       case pn_Div_X_regular:
+               return new_rd_Jmp(dbgi, block);
+       case pn_Div_X_except:
+               set_ia32_exc_label(new_pred, 1);
+               return new_rd_Proj(dbgi, new_pred, mode_X, pn_ia32_Div_X_exc);
        default:
                break;
        }
 
-       panic("No idea how to transform proj->DivMod");
+       panic("No idea how to transform proj->Div");
 }
 
 /**
- * Transform and renumber the Projs from a CopyB.
+ * Transform and renumber the Projs from a Div or Mod instruction.
  */
-static ir_node *gen_Proj_CopyB(ir_node *node)
+static ir_node *gen_Proj_Mod(ir_node *node)
 {
        ir_node  *pred     = get_Proj_pred(node);
        ir_node  *new_pred = be_transform_node(pred);
        dbg_info *dbgi     = get_irn_dbg_info(node);
        long     proj      = get_Proj_proj(node);
 
+       assert(is_ia32_Div(new_pred) || is_ia32_IDiv(new_pred));
+       assert(pn_ia32_Div_M == pn_ia32_IDiv_M);
+       assert(pn_ia32_Div_mod_res == pn_ia32_IDiv_mod_res);
+
        switch (proj) {
-       case pn_CopyB_M:
-               if (is_ia32_CopyB_i(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_CopyB_i_M);
-               } else if (is_ia32_CopyB(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_CopyB_M);
-               }
-               break;
+       case pn_Mod_M:
+               return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_Div_M);
+       case pn_Mod_res:
+               return new_rd_Proj(dbgi, new_pred, mode_Iu, pn_ia32_Div_mod_res);
+       case pn_Mod_X_except:
+               set_ia32_exc_label(new_pred, 1);
+               return new_rd_Proj(dbgi, new_pred, mode_X, pn_ia32_Div_X_exc);
        default:
                break;
        }
-
-       panic("No idea how to transform proj->CopyB");
+       panic("No idea how to transform proj->Mod");
 }
 
 /**
- * Transform and renumber the Projs from a Quot.
+ * Transform and renumber the Projs from a CopyB.
  */
-static ir_node *gen_Proj_Quot(ir_node *node)
+static ir_node *gen_Proj_CopyB(ir_node *node)
 {
        ir_node  *pred     = get_Proj_pred(node);
        ir_node  *new_pred = be_transform_node(pred);
@@ -4685,27 +4666,18 @@ static ir_node *gen_Proj_Quot(ir_node *node)
        long     proj      = get_Proj_proj(node);
 
        switch (proj) {
-       case pn_Quot_M:
-               if (is_ia32_xDiv(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_xDiv_M);
-               } else if (is_ia32_vfdiv(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_vfdiv_M);
-               }
-               break;
-       case pn_Quot_res:
-               if (is_ia32_xDiv(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_xmm, pn_ia32_xDiv_res);
-               } else if (is_ia32_vfdiv(new_pred)) {
-                       return new_rd_Proj(dbgi, new_pred, mode_vfp, pn_ia32_vfdiv_res);
+       case pn_CopyB_M:
+               if (is_ia32_CopyB_i(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_CopyB_i_M);
+               } else if (is_ia32_CopyB(new_pred)) {
+                       return new_rd_Proj(dbgi, new_pred, mode_M, pn_ia32_CopyB_M);
                }
                break;
-       case pn_Quot_X_regular:
-       case pn_Quot_X_except:
        default:
                break;
        }
 
-       panic("No idea how to transform proj->Quot");
+       panic("No idea how to transform proj->CopyB");
 }
 
 static ir_node *gen_be_Call(ir_node *node)
@@ -4713,10 +4685,10 @@ static ir_node *gen_be_Call(ir_node *node)
        dbg_info       *const dbgi      = get_irn_dbg_info(node);
        ir_node        *const src_block = get_nodes_block(node);
        ir_node        *const block     = be_transform_node(src_block);
-       ir_node        *const src_mem   = get_irn_n(node, be_pos_Call_mem);
-       ir_node        *const src_sp    = get_irn_n(node, be_pos_Call_sp);
+       ir_node        *const src_mem   = get_irn_n(node, n_be_Call_mem);
+       ir_node        *const src_sp    = get_irn_n(node, n_be_Call_sp);
        ir_node        *const sp        = be_transform_node(src_sp);
-       ir_node        *const src_ptr   = get_irn_n(node, be_pos_Call_ptr);
+       ir_node        *const src_ptr   = get_irn_n(node, n_be_Call_ptr);
        ia32_address_mode_t   am;
        ia32_address_t *const addr      = &am.addr;
        ir_node        *      mem;
@@ -4746,17 +4718,17 @@ static ir_node *gen_be_Call(ir_node *node)
        assert(be_Call_get_entity(node) == NULL);
 
        /* special case for PIC trampoline calls */
-       old_no_pic_adjust no_pic_adjust;
-       no_pic_adjust     = be_get_irg_options(current_ir_graph)->pic;
+       old_no_pic_adjust  = ia32_no_pic_adjust;
+       ia32_no_pic_adjust = be_get_irg_options(current_ir_graph)->pic;
 
        match_arguments(&am, src_block, NULL, src_ptr, src_mem,
                        match_am | match_immediate);
 
-       no_pic_adjust = old_no_pic_adjust;
+       ia32_no_pic_adjust = old_no_pic_adjust;
 
        i    = get_irn_arity(node) - 1;
        fpcw = be_transform_node(get_irn_n(node, i--));
-       for (; i >= be_pos_Call_first_arg; --i) {
+       for (; i >= n_be_Call_first_arg; --i) {
                arch_register_req_t const *const req = arch_get_register_req(node, i);
                ir_node *const reg_parm = be_transform_node(get_irn_n(node, i));
 
@@ -4824,6 +4796,7 @@ static ir_node *gen_return_address(ir_node *node)
        ir_node   *frame    = get_Builtin_param(node, 1);
        dbg_info  *dbgi     = get_irn_dbg_info(node);
        ir_tarval *tv       = get_Const_tarval(param);
+       ir_graph  *irg      = get_irn_irg(node);
        unsigned long value = get_tarval_long(tv);
 
        ir_node *block  = be_transform_node(get_nodes_block(node));
@@ -4845,7 +4818,7 @@ static ir_node *gen_return_address(ir_node *node)
 
        set_ia32_am_offs_int(load, 0);
        set_ia32_use_frame(load);
-       set_ia32_frame_ent(load, ia32_get_return_address_entity());
+       set_ia32_frame_ent(load, ia32_get_return_address_entity(irg));
 
        if (get_irn_pinned(node) == op_pin_state_floats) {
                assert((int)pn_ia32_xLoad_res == (int)pn_ia32_vfld_res
@@ -4867,6 +4840,7 @@ static ir_node *gen_frame_address(ir_node *node)
        ir_node   *frame    = get_Builtin_param(node, 1);
        dbg_info  *dbgi     = get_irn_dbg_info(node);
        ir_tarval *tv       = get_Const_tarval(param);
+       ir_graph  *irg      = get_irn_irg(node);
        unsigned long value = get_tarval_long(tv);
 
        ir_node *block  = be_transform_node(get_nodes_block(node));
@@ -4887,7 +4861,7 @@ static ir_node *gen_frame_address(ir_node *node)
        set_ia32_op_type(load, ia32_AddrModeS);
        set_ia32_ls_mode(load, mode_Iu);
 
-       ent = ia32_get_frame_address_entity();
+       ent = ia32_get_frame_address_entity(irg);
        if (ent != NULL) {
                set_ia32_am_offs_int(load, 0);
                set_ia32_use_frame(load);
@@ -4989,7 +4963,6 @@ static ir_node *gen_prefetch(ir_node *node)
 
        SET_IA32_ORIG_NODE(new_node, node);
 
-       be_dep_on_frame(new_node);
        return new_r_Proj(new_node, mode_M, pn_ia32_Prefetch_M);
 }
 
@@ -5027,7 +5000,7 @@ static ir_node *gen_ffs(ir_node *node)
        ir_node  *real  = skip_Proj(bsf);
        dbg_info *dbgi  = get_irn_dbg_info(real);
        ir_node  *block = get_nodes_block(real);
-       ir_node  *flag, *set, *conv, *neg, *orn;
+       ir_node  *flag, *set, *conv, *neg, *orn, *add;
 
        /* bsf x */
        if (get_irn_mode(real) != mode_T) {
@@ -5038,7 +5011,7 @@ static ir_node *gen_ffs(ir_node *node)
        flag = new_r_Proj(real, mode_b, pn_ia32_flags);
 
        /* sete */
-       set = new_bd_ia32_Setcc(dbgi, block, flag, pn_Cmp_Eq);
+       set = new_bd_ia32_Setcc(dbgi, block, flag, ia32_cc_equal);
        SET_IA32_ORIG_NODE(set, node);
 
        /* conv to 32bit */
@@ -5053,7 +5026,9 @@ static ir_node *gen_ffs(ir_node *node)
        set_ia32_commutative(orn);
 
        /* add 1 */
-       return new_bd_ia32_Add(dbgi, block, noreg_GP, noreg_GP, nomem, orn, ia32_create_Immediate(NULL, 0, 1));
+       add = new_bd_ia32_Lea(dbgi, block, orn, noreg_GP);
+       add_ia32_am_offs_int(add, 1);
+       return add;
 }
 
 /**
@@ -5083,32 +5058,31 @@ static ir_node *gen_ctz(ir_node *node)
  */
 static ir_node *gen_parity(ir_node *node)
 {
-       ir_node *param      = get_Builtin_param(node, 0);
        dbg_info *dbgi      = get_irn_dbg_info(node);
+       ir_node  *block     = get_nodes_block(node);
+       ir_node  *new_block = be_transform_node(block);
+       ir_node  *param     = get_Builtin_param(node, 0);
+       ir_node  *new_param = be_transform_node(param);
+       ir_node  *new_node;
 
-       ir_node *block      = get_nodes_block(node);
-
-       ir_node *new_block  = be_transform_node(block);
-       ir_node *imm, *cmp, *new_node;
-
-       ia32_address_mode_t am;
-       ia32_address_t      *addr = &am.addr;
-
-
-       /* cmp param, 0 */
-       match_arguments(&am, block, NULL, param, NULL, match_am);
-       imm = ia32_create_Immediate(NULL, 0, 0);
-       cmp = new_bd_ia32_Cmp(dbgi, new_block, addr->base, addr->index,
-                             addr->mem, imm, am.new_op2, am.ins_permuted, 0);
-       set_am_attributes(cmp, &am);
-       set_ia32_ls_mode(cmp, mode_Iu);
-
-       SET_IA32_ORIG_NODE(cmp, node);
+       /* the x86 parity bit is stupid: it only looks at the lowest byte,
+        * so we have to do complicated xoring first.
+        * (we should also better lower this before the backend so we still have a
+        * chance for CSE, constant folding and other goodies for some of these
+        * operations)
+        */
+       ir_node *count = ia32_create_Immediate(NULL, 0, 16);
+       ir_node *shr = new_bd_ia32_Shr(dbgi, new_block, new_param, count);
+       ir_node *xor = new_bd_ia32_Xor(dbgi, new_block, noreg_GP, noreg_GP, nomem,
+                                      shr, new_param);
+       ir_node *xor2 = new_bd_ia32_XorHighLow(dbgi, new_block, xor);
+       ir_node *flags;
 
-       cmp = fix_mem_proj(cmp, &am);
+       set_irn_mode(xor2, mode_T);
+       flags = new_r_Proj(xor2, mode_Iu, pn_ia32_XorHighLow_flags);
 
        /* setp */
-       new_node = new_bd_ia32_Setcc(dbgi, new_block, cmp, ia32_pn_Cmp_parity);
+       new_node = new_bd_ia32_Setcc(dbgi, new_block, flags, ia32_cc_not_parity);
        SET_IA32_ORIG_NODE(new_node, node);
 
        /* conv to 32bit */
@@ -5151,6 +5125,13 @@ static ir_node *gen_popcount(ir_node *node)
        new_param = be_transform_node(param);
 
        /* do the standard popcount algo */
+       /* TODO: This is stupid, we should transform this before the backend,
+        * to get CSE, localopts, etc. for the operations
+        * TODO: This is also not the optimal algorithm (it is just the starting
+        * example in hackers delight, they optimize it more on the following page)
+        * But I'm too lazy to fix this now, as the code should get lowered before
+        * the backend anyway.
+        */
 
        /* m1 = x & 0x55555555 */
        imm = ia32_create_Immediate(NULL, 0, 0x55555555);
@@ -5158,7 +5139,7 @@ static ir_node *gen_popcount(ir_node *node)
 
        /* s1 = x >> 1 */
        simm = ia32_create_Immediate(NULL, 0, 1);
-       s1 = new_bd_ia32_Shl(dbgi, new_block, new_param, simm);
+       s1 = new_bd_ia32_Shr(dbgi, new_block, new_param, simm);
 
        /* m2 = s1 & 0x55555555 */
        m2 = new_bd_ia32_And(dbgi, new_block, noreg_GP, noreg_GP, nomem, s1, imm);
@@ -5172,7 +5153,7 @@ static ir_node *gen_popcount(ir_node *node)
 
        /* s2 = m3 >> 2 */
        simm = ia32_create_Immediate(NULL, 0, 2);
-       s2 = new_bd_ia32_Shl(dbgi, new_block, m3, simm);
+       s2 = new_bd_ia32_Shr(dbgi, new_block, m3, simm);
 
        /* m5 = s2 & 0x33333333 */
        m5 = new_bd_ia32_And(dbgi, new_block, noreg_GP, noreg_GP, nomem, s2, imm);
@@ -5186,7 +5167,7 @@ static ir_node *gen_popcount(ir_node *node)
 
        /* s3 = m6 >> 4 */
        simm = ia32_create_Immediate(NULL, 0, 4);
-       s3 = new_bd_ia32_Shl(dbgi, new_block, m6, simm);
+       s3 = new_bd_ia32_Shr(dbgi, new_block, m6, simm);
 
        /* m8 = s3 & 0x0F0F0F0F */
        m8 = new_bd_ia32_And(dbgi, new_block, noreg_GP, noreg_GP, nomem, s3, imm);
@@ -5200,7 +5181,7 @@ static ir_node *gen_popcount(ir_node *node)
 
        /* s4 = m9 >> 8 */
        simm = ia32_create_Immediate(NULL, 0, 8);
-       s4 = new_bd_ia32_Shl(dbgi, new_block, m9, simm);
+       s4 = new_bd_ia32_Shr(dbgi, new_block, m9, simm);
 
        /* m11 = s4 & 0x00FF00FF */
        m11 = new_bd_ia32_And(dbgi, new_block, noreg_GP, noreg_GP, nomem, s4, imm);
@@ -5214,7 +5195,7 @@ static ir_node *gen_popcount(ir_node *node)
 
        /* s5 = m12 >> 16 */
        simm = ia32_create_Immediate(NULL, 0, 16);
-       s5 = new_bd_ia32_Shl(dbgi, new_block, m12, simm);
+       s5 = new_bd_ia32_Shr(dbgi, new_block, m12, simm);
 
        /* res = m13 + s5 */
        return new_bd_ia32_Lea(dbgi, new_block, m13, s5);
@@ -5374,7 +5355,8 @@ static ir_node *gen_inner_trampoline(ir_node *node)
        if (is_SymConst(callee)) {
                rel = new_bd_ia32_Const(dbgi, new_block, get_SymConst_entity(callee), 0, 0, -10);
        } else {
-               rel = new_bd_ia32_Lea(dbgi, new_block, be_transform_node(callee), ia32_create_Immediate(NULL, 0, -10));
+               rel = new_bd_ia32_Lea(dbgi, new_block, be_transform_node(callee), noreg_GP);
+               add_ia32_am_offs_int(rel, -10);
        }
        rel = new_bd_ia32_Sub(dbgi, new_block, noreg_GP, noreg_GP, nomem, rel, trampoline);
 
@@ -5558,30 +5540,6 @@ static ir_node *gen_Proj_Cmp(ir_node *node)
              node);
 }
 
-/**
- * Transform the Projs from a Bound.
- */
-static ir_node *gen_Proj_Bound(ir_node *node)
-{
-       ir_node *new_node;
-       ir_node *pred = get_Proj_pred(node);
-
-       switch (get_Proj_proj(node)) {
-       case pn_Bound_M:
-               return be_transform_node(get_Bound_mem(pred));
-       case pn_Bound_X_regular:
-               new_node = be_transform_node(pred);
-               return new_r_Proj(new_node, mode_X, pn_ia32_Jcc_true);
-       case pn_Bound_X_except:
-               new_node = be_transform_node(pred);
-               return new_r_Proj(new_node, mode_X, pn_ia32_Jcc_false);
-       case pn_Bound_res:
-               return be_transform_node(get_Bound_index(pred));
-       default:
-               panic("unsupported Proj from Bound");
-       }
-}
-
 static ir_node *gen_Proj_ASM(ir_node *node)
 {
        ir_mode *mode     = get_irn_mode(node);
@@ -5625,13 +5583,11 @@ static ir_node *gen_Proj(ir_node *node)
        case iro_Builtin:
                return gen_Proj_Builtin(node);
        case iro_Div:
+               return gen_Proj_Div(node);
        case iro_Mod:
-       case iro_DivMod:
-               return gen_Proj_DivMod(node);
+               return gen_Proj_Mod(node);
        case iro_CopyB:
                return gen_Proj_CopyB(node);
-       case iro_Quot:
-               return gen_Proj_Quot(node);
        case beo_SubSP:
                return gen_Proj_be_SubSP(node);
        case beo_AddSP:
@@ -5640,8 +5596,6 @@ static ir_node *gen_Proj(ir_node *node)
                return gen_Proj_be_Call(node);
        case iro_Cmp:
                return gen_Proj_Cmp(node);
-       case iro_Bound:
-               return gen_Proj_Bound(node);
        case iro_Start:
                proj = get_Proj_proj(node);
                switch (proj) {
@@ -5654,9 +5608,6 @@ static ir_node *gen_Proj(ir_node *node)
 
                                return jump;
                        }
-
-                       case pn_Start_P_tls:
-                               return gen_Proj_tls(node);
                }
                break;
 
@@ -5691,7 +5642,7 @@ static void register_transformers(void)
 
        be_set_transform_function(op_Add,              gen_Add);
        be_set_transform_function(op_And,              gen_And);
-       be_set_transform_function(op_ASM,              gen_ASM);
+       be_set_transform_function(op_ASM,              ia32_gen_ASM);
        be_set_transform_function(op_be_AddSP,         gen_be_AddSP);
        be_set_transform_function(op_be_Call,          gen_be_Call);
        be_set_transform_function(op_be_Copy,          gen_be_Copy);
@@ -5699,15 +5650,13 @@ static void register_transformers(void)
        be_set_transform_function(op_be_IncSP,         gen_be_IncSP);
        be_set_transform_function(op_be_Return,        gen_be_Return);
        be_set_transform_function(op_be_SubSP,         gen_be_SubSP);
-       be_set_transform_function(op_Bound,            gen_Bound);
        be_set_transform_function(op_Builtin,          gen_Builtin);
        be_set_transform_function(op_Cmp,              gen_Cmp);
        be_set_transform_function(op_Cond,             gen_Cond);
        be_set_transform_function(op_Const,            gen_Const);
        be_set_transform_function(op_Conv,             gen_Conv);
-       be_set_transform_function(op_CopyB,            gen_CopyB);
+       be_set_transform_function(op_CopyB,            ia32_gen_CopyB);
        be_set_transform_function(op_Div,              gen_Div);
-       be_set_transform_function(op_DivMod,           gen_DivMod);
        be_set_transform_function(op_Eor,              gen_Eor);
        be_set_transform_function(op_ia32_l_Adc,       gen_ia32_l_Adc);
        be_set_transform_function(op_ia32_l_Add,       gen_ia32_l_Add);
@@ -5742,7 +5691,6 @@ static void register_transformers(void)
        be_set_transform_function(op_Or,               gen_Or);
        be_set_transform_function(op_Phi,              gen_Phi);
        be_set_transform_function(op_Proj,             gen_Proj);
-       be_set_transform_function(op_Quot,             gen_Quot);
        be_set_transform_function(op_Rotl,             gen_Rotl);
        be_set_transform_function(op_Shl,              gen_Shl);
        be_set_transform_function(op_Shr,              gen_Shr);
@@ -5750,7 +5698,7 @@ static void register_transformers(void)
        be_set_transform_function(op_Store,            gen_Store);
        be_set_transform_function(op_Sub,              gen_Sub);
        be_set_transform_function(op_SymConst,         gen_SymConst);
-       be_set_transform_function(op_Unknown,          gen_Unknown);
+       be_set_transform_function(op_Unknown,          ia32_gen_Unknown);
 }
 
 /**
@@ -5761,14 +5709,14 @@ static void ia32_pretransform_node(void)
        ir_graph        *irg      = current_ir_graph;
        ia32_irg_data_t *irg_data = ia32_get_irg_data(current_ir_graph);
 
-       irg_data->noreg_gp  = be_pre_transform_node(irg_data->noreg_gp);
-       irg_data->noreg_vfp = be_pre_transform_node(irg_data->noreg_vfp);
-       irg_data->noreg_xmm = be_pre_transform_node(irg_data->noreg_xmm);
+       irg_data->noreg_gp       = be_pre_transform_node(irg_data->noreg_gp);
+       irg_data->noreg_vfp      = be_pre_transform_node(irg_data->noreg_vfp);
+       irg_data->noreg_xmm      = be_pre_transform_node(irg_data->noreg_xmm);
+       irg_data->get_eip        = be_pre_transform_node(irg_data->get_eip);
+       irg_data->fpu_trunc_mode = be_pre_transform_node(irg_data->fpu_trunc_mode);
 
        nomem    = get_irg_no_mem(irg);
        noreg_GP = ia32_new_NoReg_gp(irg);
-
-       get_fpcw();
 }
 
 /**
@@ -5778,9 +5726,9 @@ static void ia32_pretransform_node(void)
  */
 static void postprocess_fp_call_results(void)
 {
-       int i;
+       size_t i, n;
 
-       for (i = ARR_LEN(call_list) - 1; i >= 0; --i) {
+       for (i = 0, n = ARR_LEN(call_list); i < n; ++i) {
                ir_node *call = call_list[i];
                ir_type *mtp  = call_types[i];
                int     j;
@@ -5854,7 +5802,7 @@ static void postprocess_fp_call_results(void)
                                                new_mem = new_r_Proj(xld, mode_M, pn_ia32_xLoad_M);
 
                                                if (old_mem != NULL) {
-                                                       edges_reroute(old_mem, new_mem, current_ir_graph);
+                                                       edges_reroute(old_mem, new_mem);
                                                        kill_node(old_mem);
                                                }
                                        }
@@ -5871,11 +5819,13 @@ void ia32_transform_graph(ir_graph *irg)
        int cse_last;
 
        register_transformers();
-       initial_fpcw  = NULL;
-       no_pic_adjust = 0;
+       initial_fpcw       = NULL;
+       ia32_no_pic_adjust = 0;
+
+       old_initial_fpcw = be_get_initial_reg_value(irg, &ia32_registers[REG_FPCW]);
 
        be_timer_push(T_HEIGHTS);
-       heights      = heights_new(irg);
+       ia32_heights = heights_new(irg);
        be_timer_pop(T_HEIGHTS);
        ia32_calculate_non_address_mode_nodes(irg);
 
@@ -5896,8 +5846,8 @@ void ia32_transform_graph(ir_graph *irg)
        set_opt_cse(cse_last);
 
        ia32_free_non_address_mode_nodes();
-       heights_free(heights);
-       heights = NULL;
+       heights_free(ia32_heights);
+       ia32_heights = NULL;
 }
 
 void ia32_init_transform(void)