make if-conversion and archdep optimisations get their information directly from...
[libfirm] / ir / be / arm / arm_emitter.c
index 8fb8fef..de458a0 100644 (file)
-/* arm emitter */
-/* $Id$ */
+/*
+ * Copyright (C) 1995-2008 University of Karlsruhe.  All rights reserved.
+ *
+ * This file is part of libFirm.
+ *
+ * This file may be distributed and/or modified under the terms of the
+ * GNU General Public License version 2 as published by the Free Software
+ * Foundation and appearing in the file LICENSE.GPL included in the
+ * packaging of this file.
+ *
+ * Licensees holding valid libFirm Professional Edition licenses may use
+ * this file in accordance with the libFirm Commercial License.
+ * Agreement provided with the Software.
+ *
+ * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
+ * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE.
+ */
 
-#ifdef HAVE_CONFIG_H
+/**
+ * @file
+ * @brief   arm emitter
+ * @author  Oliver Richter, Tobias Gneist, Michael Beck
+ * @version $Id$
+ */
 #include "config.h"
-#endif
 
 #include <limits.h>
+#include <stdbool.h>
 
 #include "xmalloc.h"
 #include "tv.h"
 #include "iredges.h"
 #include "debug.h"
 #include "irgwalk.h"
+#include "irtools.h"
 #include "irprintf.h"
 #include "irop_t.h"
 #include "irprog_t.h"
 #include "irargs_t.h"
+#include "error.h"
+#include "raw_bitset.h"
+#include "dbginfo.h"
 
 #include "../besched.h"
+#include "../beblocksched.h"
+#include "../beirg.h"
+#include "../begnuas.h"
+#include "../be_dbgout.h"
 
 #include "arm_emitter.h"
+#include "arm_optimize.h"
 #include "gen_arm_emitter.h"
 #include "arm_nodes_attr.h"
 #include "arm_new_nodes.h"
 #include "arm_map_regs.h"
 #include "gen_arm_regalloc_if.h"
 
-#include "../benode_t.h"
+#include "../benode.h"
 
 #define SNPRINTF_BUF_LEN 128
 
-static const arch_env_t *arch_env = NULL;
-
-
-/*************************************************************
- *             _       _    __   _          _
- *            (_)     | |  / _| | |        | |
- *  _ __  _ __ _ _ __ | |_| |_  | |__   ___| |_ __   ___ _ __
- * | '_ \| '__| | '_ \| __|  _| | '_ \ / _ \ | '_ \ / _ \ '__|
- * | |_) | |  | | | | | |_| |   | | | |  __/ | |_) |  __/ |
- * | .__/|_|  |_|_| |_|\__|_|   |_| |_|\___|_| .__/ \___|_|
- * | |                                       | |
- * |_|                                       |_|
- *************************************************************/
-
-int is_immediate_node(ir_node *irn) {
-       if (is_arm_Add_i(irn) || is_arm_Sub_i(irn))
-               return 1;
-       if (is_arm_Shr_i(irn) || is_arm_Shr_i(irn) || is_arm_Shl_i(irn))
-               return 1;
-       if (is_arm_And_i(irn) || is_arm_Or_i(irn) || is_arm_Eor_i(irn))
-               return 1;
-       if (is_arm_Or_Shl_i(irn))
-               return 1;
-       return 0;
-}
-
-/**
- * Return a const or symconst as string.
- */
-static const char *node_const_to_str(ir_node *n) {
-       char buffer[SNPRINTF_BUF_LEN];
-
-       if ( is_immediate_node(n) ) {
-               long longvalue = get_tarval_long(get_arm_value(n));
-               char *str;
-               assert(longvalue < 0x1000 && "constant doesn't fit in shifter_operand");
-               snprintf(buffer, SNPRINTF_BUF_LEN - 1, "#%ld << %ld", longvalue & 0xff, (longvalue >> 8) << 1 );
-               str = xmalloc(strlen(buffer) * sizeof(char));
-               strcpy(str, buffer);
-               return str;
-       }
-       if ( is_arm_Const(n) || is_arm_Const_Neg(n) ) {
-               tarval *tv = get_arm_value(n);
-               if ( mode_is_int(get_tarval_mode(tv)) ) {
-                       long longvalue = get_tarval_long(get_arm_value(n));
-                       char *str;
-                       assert(longvalue < 0x1000 && "constant doesn't fit in shifter_operand");
-                       snprintf(buffer, SNPRINTF_BUF_LEN - 1, "#%ld << %ld", longvalue & 0xff, (longvalue >> 8) << 1 );
-                       str = xmalloc(strlen(buffer) * sizeof(char));
-                       strcpy(str, buffer);
-                       return str;
-               } else {
-                       return "found something else in arm_const";
-               }
-       } else if ( is_arm_SymConst(n) ) {
-               return get_arm_symconst_label(n);
-       } else {
-               assert( 0 && "das ist gar keine Konstante");
-               return NULL;
-       }
-
-}
-
-/**
- * Returns node's offset as string.
- */
-static char *node_offset_to_str(ir_node *n) {
-       char buffer[SNPRINTF_BUF_LEN];
-       char *result;
-       int offset = 0;
-       ir_op *irn_op = get_irn_op(n);
-       if (irn_op == op_be_StackParam) {
-               entity *ent = be_get_frame_entity(n);
-               offset = get_entity_offset_bytes(ent);
-       } else if (irn_op==op_be_Reload || irn_op==op_be_Spill) {
-               entity * ent = be_get_spill_entity(n);
-               offset = get_entity_offset_bytes(ent);
-       } else if (irn_op==op_be_IncSP) {
-               int offs = be_get_IncSP_offset(n);
-               be_stack_dir_t dir  = be_get_IncSP_direction(n);
-               offset = (dir == be_stack_dir_expand) ? -offs : offs;
-       } else {
-               return "node_offset_to_str will fuer diesen Knotentyp noch implementiert werden";
-       }
-       snprintf(buffer, SNPRINTF_BUF_LEN, "%d", offset);
-       result = xmalloc(sizeof(char)*(strlen(buffer) + 1));
-       strcpy(result, buffer);
-       return result;
-}
-
-/* We always pass the ir_node which is a pointer. */
-static int arm_get_arg_type(const lc_arg_occ_t *occ) {
-       return lc_arg_type_ptr;
-}
+DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)
 
+static const arm_code_gen_t *cg;
+static set                  *sym_or_tv;
 
 /**
  * Returns the register at in position pos.
  */
-static const arch_register_t *get_in_reg(const ir_node *irn, int pos) {
+static const arch_register_t *get_in_reg(const ir_node *irn, int pos)
+{
        ir_node                *op;
        const arch_register_t  *reg = NULL;
 
@@ -139,677 +79,948 @@ static const arch_register_t *get_in_reg(const ir_node *irn, int pos) {
           in register we need. */
        op = get_irn_n(irn, pos);
 
-       reg = arch_get_irn_register(arch_env, op);
-
-       /* ONLY TEMPORARY WORK-AROUND */
-//     if (!reg) {
-//             printf("FIXME\n");
-//             reg = &arm_general_purpose_regs[REG_MURX];
-//     }
+       reg = arch_get_irn_register(op);
 
        assert(reg && "no in register found");
+
+       /* in case of a joker register: just return a valid register */
+       if (arch_register_type_is(reg, joker)) {
+               const arch_register_req_t *req = arch_get_register_req(irn, pos);
+
+               if (arch_register_req_is(req, limited)) {
+                       /* in case of limited requirements: get the first allowed register */
+                       unsigned idx = rbitset_next(req->limited, 0, 1);
+                       reg = arch_register_for_index(req->cls, idx);
+               } else {
+                       /* otherwise get first register in class */
+                       reg = arch_register_for_index(req->cls, 0);
+               }
+       }
        return reg;
 }
 
+
 /**
  * Returns the register at out position pos.
  */
-static const arch_register_t *get_out_reg(const ir_node *irn, int pos) {
-       ir_node                *proj;
-       const arch_register_t  *reg = NULL;
-
-       assert(get_irn_n_edges(irn) > pos && "Invalid OUT position");
+static const arch_register_t *get_out_reg(const ir_node *node, int pos)
+{
+    const arch_register_t *result = NULL;
+
+    if (get_irn_mode(node) == mode_T) {
+        if (is_arm_irn(node)) {
+            /* arm tuple node: ask the node itself for output pos */
+            result = arch_irn_get_register(node, pos);
+        } else {
+            /* other tuple node: use the register of the Proj numbered pos */
+            const ir_edge_t *edge;
+
+            foreach_out_edge(node, edge) {
+                ir_node *user = get_edge_src_irn(edge);
+
+                assert(is_Proj(user) && "non-Proj from mode_T node");
+                if (get_Proj_proj(user) != pos)
+                    continue;
+                result = arch_get_irn_register(user);
+                break;
+            }
+        }
+    } else {
+        /* not of mode_T: the node has exactly one OUT register */
+        result = arch_get_irn_register(node);
+    }
+
+    assert(result && "no out register found");
+    return result;
+}
 
-       /* 1st case: irn is not of mode_T, so it has only                 */
-       /*           one OUT register -> good                             */
-       /* 2nd case: irn is of mode_T -> collect all Projs and ask the    */
-       /*           Proj with the corresponding projnum for the register */
+void arm_emit_source_register(const ir_node *node, int pos)
+{
+       /* emit the name of the register found at input position pos */
+       const char *name = arch_register_get_name(get_in_reg(node, pos));
+
+       be_emit_string(name);
+}
 
-       if (get_irn_mode(irn) != mode_T) {
-               reg = arch_get_irn_register(arch_env, irn);
-       }
-       else if (is_arm_irn(irn)) {
-               reg = get_arm_out_reg(irn, pos);
-       }
-       else {
-               const ir_edge_t *edge;
+void arm_emit_dest_register(const ir_node *node, int pos)
+{
+       /* emit the name of the register found at output position pos */
+       const char *name = arch_register_get_name(get_out_reg(node, pos));
+
+       be_emit_string(name);
+}
 
-               foreach_out_edge(irn, edge) {
-                       proj = get_edge_src_irn(edge);
-                       assert(is_Proj(proj) && "non-Proj from mode_T node");
-                       if (get_Proj_proj(proj) == pos) {
-                               reg = arch_get_irn_register(arch_env, proj);
-                               break;
-                       }
-               }
-       }
+/**
+ * Emit the offset stored in the load/store attribute of node as an
+ * upper-case hexadecimal number prefixed with "0x".
+ * Asserts that the attribute is flagged as a load/store attribute.
+ */
+void arm_emit_offset(const ir_node *node)
+{
+       const arm_load_store_attr_t *attr = get_arm_load_store_attr_const(node);
+       assert(attr->base.is_load_store);
 
-       assert(reg && "no out register found");
-       return reg;
+       be_emit_irprintf("0x%X", attr->offset);
 }
 
 /**
- * Returns the number of the in register at position pos.
+ * Emit the arm fpa instruction suffix depending on the mode.
  */
-int get_arm_reg_nr(ir_node *irn, int pos, int in_out) {
-       const arch_register_t *reg;
+static void arm_emit_fpa_postfix(const ir_mode *mode)
+{
+       char suffix;
+
+       /* 's' for 32 bit modes, 'd' for 64 bit modes, 'e' for any other size */
+       switch (get_mode_size_bits(mode)) {
+       case 32:
+               suffix = 's';
+               break;
+       case 64:
+               suffix = 'd';
+               break;
+       default:
+               suffix = 'e';
+               break;
+       }
+       be_emit_char(suffix);
+}
 
-       if (in_out == 1) {
-               reg = get_in_reg(irn, pos);
-       }
-       else {
-               reg = get_out_reg(irn, pos);
-       }
+void arm_emit_float_load_store_mode(const ir_node *node)
+{
+       /* the fpa postfix follows the mode recorded in the load/store attribute */
+       arm_emit_fpa_postfix(get_arm_load_store_attr_const(node)->load_store_mode);
+}
 
-       return arch_register_get_index(reg);
+void arm_emit_float_arithmetic_mode(const ir_node *node)
+{
+       /* the fpa postfix follows the mode recorded in the farith attribute */
+       arm_emit_fpa_postfix(get_arm_farith_attr_const(node)->mode);
 }
 
-/**
- * Returns the name of the in register at position pos.
- */
-const char *get_arm_reg_name(ir_node *irn, int pos, int in_out) {
-       const arch_register_t *reg;
+/**
+ * Emit the entity referenced by the SymConst attribute of node,
+ * using the GNU assembler entity emitter.
+ */
+void arm_emit_symconst(const ir_node *node)
+{
+       const arm_SymConst_attr_t *symconst = get_arm_SymConst_attr_const(node);
+       ir_entity                 *entity   = symconst->entity;
 
-       if (in_out == 1) {
-               reg = get_in_reg(irn, pos);
-       }
-       else {
-               reg = get_out_reg(irn, pos);
-       }
+       be_gas_emit_entity(entity);
 
-       return arch_register_get_name(reg);
+       /* TODO do something with offset */
 }
 
-/**
- * Get the register name for a node.
- */
-static int arm_get_reg_name(lc_appendable_t *app,
-    const lc_arg_occ_t *occ, const lc_arg_value_t *arg)
+/**
+ * Emit the load instruction suffix for the mode stored in the load/store
+ * attribute of node: "h"/"sh" for 16 bit, "b"/"sb" for 8 bit (the "s"
+ * variant for signed modes) and nothing for 32 bit.
+ */
+void arm_emit_load_mode(const ir_node *node)
 {
-       const char *buf;
-       ir_node    *X  = arg->v_ptr;
-       int         nr = occ->width - 1;
-
-       if (!X)
-               return lc_appendable_snadd(app, "(null)", 6);
-
-       if (occ->conversion == 'S') {
-               buf = get_arm_reg_name(X, nr, 1);
-       }
-       else { /* 'D' */
-               buf = get_arm_reg_name(X, nr, 0);
+       const arm_load_store_attr_t *attr = get_arm_load_store_attr_const(node);
+       ir_mode *mode      = attr->load_store_mode;
+       int      bits      = get_mode_size_bits(mode);
+       bool     is_signed = mode_is_signed(mode);
+       if (bits == 16) {
+               be_emit_string(is_signed ? "sh" : "h");
+       } else if (bits == 8) {
+               be_emit_string(is_signed ? "sb" : "b");
+       } else {
+               /* any other size than 32 bit is not expected here */
+               assert(bits == 32);
         }
+}
 
-       lc_appendable_chadd(app, '%');
-       return lc_appendable_snadd(app, buf, strlen(buf));
+void arm_emit_store_mode(const ir_node *node)
+{
+       const arm_load_store_attr_t *ls_attr = get_arm_load_store_attr_const(node);
+       int bits = get_mode_size_bits(ls_attr->load_store_mode);
+
+       /* only the access width selects the suffix: "h", "b" or none */
+       switch (bits) {
+       case 16:
+               be_emit_cstring("h");
+               break;
+       case 8:
+               be_emit_cstring("b");
+               break;
+       default:
+               assert(bits == 32);
+               break;
+       }
 }
 
-/**
- * Returns the tarval or offset of an arm node as a string.
- */
-static int arm_const_to_str(lc_appendable_t *app,
-    const lc_arg_occ_t *occ, const lc_arg_value_t *arg)
+/**
+ * Emit the mnemonic ("asr", "lsl", "lsr" or "ror") of a shift modifier.
+ * The register and immediate variants of a shift share one mnemonic.
+ * Panics for every modifier that has no mnemonic here.
+ */
+static void emit_shf_mod_name(arm_shift_modifier_t mod)
 {
-       const char *buf;
-       ir_node    *X = arg->v_ptr;
+       switch (mod) {
+       case ARM_SHF_ASR_REG:
+       case ARM_SHF_ASR_IMM:
+               be_emit_cstring("asr");
+               return;
+       case ARM_SHF_LSL_REG:
+       case ARM_SHF_LSL_IMM:
+               be_emit_cstring("lsl");
+               return;
+       case ARM_SHF_LSR_REG:
+       case ARM_SHF_LSR_IMM:
+               be_emit_cstring("lsr");
+               return;
+       case ARM_SHF_ROR_REG:
+       case ARM_SHF_ROR_IMM:
+               be_emit_cstring("ror");
+               return;
+       default:
+               break;
+       }
+       /* only reached for modifiers without a mnemonic */
+       panic("can't emit this shf_mod_name %d", (int) mod);
+}
 
-       if (!X)
-               return lc_appendable_snadd(app, "(null)", 6);
+/**
+ * Emit the shifter operand of node as described by its
+ * arm_shifter_operand_t attribute: a plain register, a rotated immediate,
+ * or a register shifted by an immediate or by another register.
+ * The registers involved are the last input(s) of the node.
+ * Panics for the RRX modifier (not implemented) and for invalid modifiers.
+ */
+void arm_emit_shifter_operand(const ir_node *node)
+{
+       const arm_shifter_operand_t *attr = get_irn_generic_attr_const(node);
 
-       if (occ->conversion == 'C') {
-               buf = node_const_to_str(X);
-       }
-       else { /* 'O' */
-               buf = node_offset_to_str(X);
+       switch (attr->shift_modifier) {
+       case ARM_SHF_REG:
+               arm_emit_source_register(node, get_irn_arity(node) - 1);
+               return;
+       case ARM_SHF_IMM: {
+               /* rotate the immediate right within 32 bit; both shift counts are
+                * masked to stay below the operand width, so a rotation of 0 is
+                * well defined and leaves the value unchanged */
+               unsigned rot = attr->shift_immediate & 31;
+               unsigned val = attr->immediate_value & 0xFFFFFFFF;
+               val = (val >> rot) | (val << ((32 - rot) & 31));
+               val &= 0xFFFFFFFF;
+               be_emit_irprintf("#0x%X", val);
+               return;
         }
+       case ARM_SHF_ASR_IMM:
+       case ARM_SHF_LSL_IMM:
+       case ARM_SHF_LSR_IMM:
+       case ARM_SHF_ROR_IMM:
+               /* <reg>, <shift> #<amount>: the register is the last input */
+               arm_emit_source_register(node, get_irn_arity(node) - 1);
+               be_emit_cstring(", ");
+               emit_shf_mod_name(attr->shift_modifier);
+               be_emit_irprintf(" #0x%X", attr->shift_immediate);
+               return;
+
+       case ARM_SHF_ASR_REG:
+       case ARM_SHF_LSL_REG:
+       case ARM_SHF_LSR_REG:
+       case ARM_SHF_ROR_REG:
+               /* <reg>, <shift> <reg>: value is the second to last input,
+                * the shift amount the last one */
+               arm_emit_source_register(node, get_irn_arity(node) - 2);
+               be_emit_cstring(", ");
+               emit_shf_mod_name(attr->shift_modifier);
+               be_emit_cstring(" ");
+               arm_emit_source_register(node, get_irn_arity(node) - 1);
+               return;
 
-       return lc_appendable_snadd(app, buf, strlen(buf));
+       case ARM_SHF_RRX:
+               arm_emit_source_register(node, get_irn_arity(node) - 1);
+               panic("RRX shifter emitter TODO");
+
+       case ARM_SHF_INVALID:
+               break;
+       }
+       panic("Invalid shift_modifier while emitting %+F", node);
 }
 
+/**
+ * An entry in the sym_or_tv set: either an entity or a tarval, together
+ * with the label number assigned to it. A label of 0 means that no label
+ * has been allocated for the entry yet.
+ */
+typedef struct sym_or_tv_t {
+       union {
+               ir_entity  *entity;  /**< An entity (valid if is_entity is true). */
+               tarval     *tv;      /**< A tarval (valid if is_entity is false). */
+               const void *generic; /**< For generic compare and hashing. */
+       } u;
+       unsigned label;      /**< the associated label, 0 if none was allocated. */
+       bool     is_entity;  /**< true if an entity is stored. */
+} sym_or_tv_t;
+
 /**
- * Determines the SSE suffix depending on the mode.
+ * Returns a unique label. This number will not be used a second time.
  */
-static int arm_get_mode_suffix(lc_appendable_t *app,
-    const lc_arg_occ_t *occ, const lc_arg_value_t *arg)
+/* The counter persists across calls and is incremented before it is
+ * returned, so the first label handed out is 1. */
+static unsigned get_unique_label(void)
 {
-       ir_node *X = arg->v_ptr;
-
-       if (!X)
-               return lc_appendable_snadd(app, "(null)", 6);
+       static unsigned id = 0;
+       return ++id;
+}
 
-       if (get_mode_size_bits(get_irn_mode(X)) == 32)
-               return lc_appendable_chadd(app, 's');
-       else
-               return lc_appendable_chadd(app, 'd');
+static void emit_constant_name(const sym_or_tv_t *entry)
+{
+       /* the name is <private prefix>C<label number> */
+       const char *prefix = be_gas_get_private_prefix();
+
+       be_emit_irprintf("%sC%u", prefix, entry->label);
 }
 
 /**
- * Return the arm printf arg environment.
- * We use the firm environment with some additional handlers.
+ * Emit a SymConst.
  */
-const lc_arg_env_t *arm_get_arg_env(void) {
-       static lc_arg_env_t *env = NULL;
-
-       static const lc_arg_handler_t arm_reg_handler   = { arm_get_arg_type, arm_get_reg_name };
-       static const lc_arg_handler_t arm_const_handler = { arm_get_arg_type, arm_const_to_str };
-       static const lc_arg_handler_t arm_mode_handler  = { arm_get_arg_type, arm_get_mode_suffix };
+static void emit_arm_SymConst(const ir_node *irn)
+{
+       const arm_SymConst_attr_t *attr = get_arm_SymConst_attr_const(irn);
+       sym_or_tv_t key, *entry;
+
+       /* find or create the sym_or_tv entry of the entity; a freshly
+        * inserted entry still carries the label 0 of the key */
+       key.u.entity  = attr->entity;
+       key.is_entity = true;
+       key.label     = 0;
+       entry = (sym_or_tv_t *)set_insert(sym_or_tv, &key, sizeof(key), HASH_PTR(key.u.generic));
+       if (entry->label == 0) {
+               /* allocate a label */
+               entry->label = get_unique_label();
+       }
+
+       /* load the symbol indirect: ldr <dest>, <constant name> */
+       be_emit_cstring("\tldr ");
+       arm_emit_dest_register(irn, 0);
+       be_emit_cstring(", ");
+       emit_constant_name(entry);
+       be_emit_finish_line_gas(irn);
+}
 
-       if(env == NULL) {
-               /* extend the firm printer */
-               env = firm_get_arg_env();
-                       //lc_arg_new_env();
+static void emit_arm_FrameAddr(const ir_node *irn)
+{
+       const arm_SymConst_attr_t *sym_attr = get_irn_generic_attr_const(irn);
+
+       /* add <dest>, <source 0>, #<fp_offset as hex> */
+       be_emit_cstring("\tadd ");
+       arm_emit_dest_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 0);
+       be_emit_irprintf(", #0x%X", sym_attr->fp_offset);
+       be_emit_finish_line_gas(irn);
+}
 
-               lc_arg_register(env, "arm:sreg", 'S', &arm_reg_handler);
-               lc_arg_register(env, "arm:dreg", 'D', &arm_reg_handler);
-               lc_arg_register(env, "arm:cnst", 'C', &arm_const_handler);
-               lc_arg_register(env, "arm:offs", 'O', &arm_const_handler);
-               lc_arg_register(env, "arm:mode", 'M', &arm_mode_handler);
+/**
+ * Emit a floating point fpa constant.
+ */
+static void emit_arm_fConst(const ir_node *irn)
+{
+       sym_or_tv_t key, *entry;
+       ir_mode *mode;
+
+       /* find or create the sym_or_tv entry of the tarval; a freshly
+        * inserted entry still carries the label 0 of the key */
+       key.u.tv      = get_fConst_value(irn);
+       key.is_entity = false;
+       key.label     = 0;
+       entry = (sym_or_tv_t *)set_insert(sym_or_tv, &key, sizeof(key), HASH_PTR(key.u.generic));
+       if (entry->label == 0) {
+               /* allocate a label */
+               entry->label = get_unique_label();
         }
-
-       return env;
+
+       /* load the tarval indirect: ldf<postfix> <dest>, <constant name> */
+       mode = get_irn_mode(irn);
+       be_emit_cstring("\tldf");
+       arm_emit_fpa_postfix(mode);
+       be_emit_char(' ');
+
+       arm_emit_dest_register(irn, 0);
+       be_emit_cstring(", ");
+       emit_constant_name(entry);
+       be_emit_finish_line_gas(irn);
 }
 
 /**
- * Formated print of commands and comments.
+ * Returns the next block in a block schedule.
  */
-static void arm_fprintf_format(FILE *F, char *cmd_buf, char *cmnt_buf, ir_node *irn) {
-       lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+static ir_node *sched_next_block(const ir_node *block)
+{
+    /* the following block is read from the link field of the block */
+    ir_node *successor = get_irn_link(block);
+
+    return successor;
 }
 
-/*
- * Add a number to a prefix. This number will not be used a second time.
+/**
+ * Returns the target block for a control flow node.
  */
-static char *get_unique_label(char *buf, size_t buflen, const char *prefix) {
-       static unsigned long id = 0;
-       snprintf(buf, buflen, "%s%lu", prefix, ++id);
-       return buf;
+static ir_node *get_cfop_target_block(const ir_node *irn)
+{
+       /* the target block is read from the link field of the node */
+       ir_node *target = get_irn_link(irn);
+
+       return target;
 }
 
+/**
+ * Emit the target label for a control flow node.
+ */
+static void arm_emit_cfop_target(const ir_node *irn)
+{
+       /* the label is the block name of the target block of irn */
+       be_gas_emit_block_name(get_cfop_target_block(irn));
+}
 
 /**
- * Returns the target label for a control flow node.
+ * Emit a Compare with conditional branch.
  */
-static char *get_cfop_target(const ir_node *irn, char *buf) {
-       ir_node *bl = get_irn_link(irn);
-
-       snprintf(buf, SNPRINTF_BUF_LEN, "BLOCK_%ld", get_irn_node_nr(bl));
-       return buf;
-}
-
-/************************************************************************/
-/* emit_arm                                                             */
-/************************************************************************/
-
-static void emit_arm_SymConst(ir_node *irn, void *env) {
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
-       char buffer1[SNPRINTF_BUF_LEN];
-       char *skip_label = get_unique_label(buffer1, SNPRINTF_BUF_LEN, ".L");
-       char buffer2[SNPRINTF_BUF_LEN];
-       char *indi_label = get_unique_label(buffer2, SNPRINTF_BUF_LEN, ".L");
-       fprintf( out, "\tB %s\t\t\t\t\t/* start of indirect SymConst */\n", skip_label );
-       fprintf( out, "\t.align 2\n" );
-       fprintf( out, "%s:\n", indi_label );
-       lc_efprintf(arm_get_arg_env(), out, "\t.word\t%C\n", irn);
-       fprintf( out, "\t.align 2\n" );
-       fprintf( out, "%s:\n", skip_label );
-       lc_efprintf(arm_get_arg_env(), out, "\tLDR %1D, %s\t\t\t/* end of indirect SymConst */\n", irn, indi_label);
-}
-
-static void emit_arm_CondJmp(ir_node *irn, void *env) {
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
+static void emit_arm_B(const ir_node *irn)
+{
+       /* Emits "b<cond> <target of true Proj>", followed by either a
+        * fallthrough comment or an unconditional "b" to the target of the
+        * false Proj. */
         const ir_edge_t *edge;
-       ir_node *true_block = NULL;
-       ir_node *false_block = NULL;
+       const ir_node *proj_true  = NULL;
+       const ir_node *proj_false = NULL;
+       const ir_node *block;
+       const ir_node *next_block;
         ir_node *op1 = get_irn_n(irn, 0);
-       ir_mode *opmode = get_irn_mode(op1);
-       char *suffix;
-       int proj_num = get_arm_proj_num(irn);
-       char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
-
-
-       foreach_out_edge(irn, edge) {
-               ir_node* proj = get_edge_src_irn(edge);
-               long nr = get_Proj_proj(proj);
-               ir_node *block = get_irn_link(proj);
-               if ( nr == pn_Cond_true) {
-                       true_block = block;
-               } else if (nr == pn_Cond_false) {
-                       false_block = block;
+       const char *suffix;
+       pn_Cmp pnc = get_arm_CondJmp_pnc(irn);
+       const arm_cmp_attr_t *cmp_attr = get_irn_generic_attr_const(op1);
+       bool is_signed = !cmp_attr->is_unsigned;
+
+       assert(is_arm_Cmp(op1) || is_arm_Tst(op1));
+
+       /* every Proj that is not the true Proj is taken as the false Proj */
+       foreach_out_edge(irn, edge) {
+               ir_node *proj = get_edge_src_irn(edge);
+               long nr = get_Proj_proj(proj);
+               if (nr == pn_Cond_true) {
+                       proj_true = proj;
                 } else {
-                       assert(0 && "tertium non datur! (CondJmp)");
+                       proj_false = proj;
                 }
-       }
+       }
 
-       if (proj_num == pn_Cmp_False) {
-               fprintf(out, "\tB BLOCK_%ld\t\t\t/* false case */\n", get_irn_node_nr(false_block));
-       } else if (proj_num == pn_Cmp_True) {
-               fprintf(out, "\tB BLOCK_%ld\t\t\t/* true case */\n", get_irn_node_nr(true_block));
-       } else {
-               if (mode_is_float(opmode)) {
-                       suffix = "ICHWILLIMPLEMENTIERTWERDEN";
+       /* ins_permuted: use the mirrored relation (presumably the compare
+        * operands were swapped -- TODO confirm) */
+       if (cmp_attr->ins_permuted) {
+               pnc = get_mirrored_pnc(pnc);
+       }
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "FCMP %1S, %2S", irn, irn);
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* Compare(%1S, %2S) -> FCPSR */", irn, irn );
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+       /* for now, the code works for scheduled and non-scheduled blocks */
+       block = get_nodes_block(irn);
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "FMSTAT", irn, irn);
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* FCSPR -> CPSR */");
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+       /* we have a block schedule */
+       next_block = sched_next_block(block);
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "B%s BLOCK_%d", suffix, get_irn_node_nr(true_block));
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* true case */");
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+       assert(pnc != pn_Cmp_False);
+       assert(pnc != pn_Cmp_True);
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "B BLOCK_%d", get_irn_node_nr(false_block));
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* false case */");
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               } else {
-                       switch(proj_num) {
-                               case pn_Cmp_Eq:  suffix = "EQ"; break;
-                               case pn_Cmp_Lt:  suffix = "LT"; break;
-                               case pn_Cmp_Le:  suffix = "LE"; break;
-                               case pn_Cmp_Gt:  suffix = "GT"; break;
-                               case pn_Cmp_Ge:  suffix = "GE"; break;
-                               case pn_Cmp_Lg:  suffix = "NE"; break;
-                               case pn_Cmp_Leg: suffix = "AL"; break;
-                       default: assert(0 && "komische Dinge geschehen");
-                       }
+       if (get_cfop_target_block(proj_true) == next_block) {
+               /* exchange both proj's so the second one can be omitted */
+               const ir_node *t = proj_true;
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "CMP %1S, %2S", irn, irn);
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* Compare(%1S, %2S) -> CPSR */", irn, irn );
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+               proj_true  = proj_false;
+               proj_false = t;
+               pnc        = get_negated_pnc(pnc, mode_Iu);
+       }
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "B%s BLOCK_%d", suffix, get_irn_node_nr(true_block));
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* true case */");
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+       /* the ordered relations use lo/ls/hi/hs for unsigned compares */
+       switch (pnc) {
+               case pn_Cmp_Eq:  suffix = "eq"; break;
+               case pn_Cmp_Lt:  suffix = is_signed ? "lt" : "lo"; break;
+               case pn_Cmp_Le:  suffix = is_signed ? "le" : "ls"; break;
+               case pn_Cmp_Gt:  suffix = is_signed ? "gt" : "hi"; break;
+               case pn_Cmp_Ge:  suffix = is_signed ? "ge" : "hs"; break;
+               case pn_Cmp_Lg:  suffix = "ne"; break;
+               case pn_Cmp_Leg: suffix = "al"; break;
+               default: panic("Cmp has unsupported pnc");
+       }
 
-                       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "B BLOCK_%d", get_irn_node_nr(false_block));
-                       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* false case */");
-                       arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               }
+       /* emit the true proj */
+       be_emit_irprintf("\tb%s ", suffix);
+       arm_emit_cfop_target(proj_true);
+       be_emit_finish_line_gas(proj_true);
+
+       /* the false proj needs a branch only if its target does not follow
+        * directly in the block schedule */
+       if (get_cfop_target_block(proj_false) == next_block) {
+               be_emit_cstring("\t/* fallthrough to ");
+               arm_emit_cfop_target(proj_false);
+               be_emit_cstring(" */");
+               be_emit_finish_line_gas(proj_false);
+       } else {
+               be_emit_cstring("\tb ");
+               arm_emit_cfop_target(proj_false);
+               be_emit_finish_line_gas(proj_false);
         }
 }
 
-static void emit_arm_CopyB(ir_node *irn, void *env) {
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
-       char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
-       unsigned int size = get_tarval_long(get_arm_value(irn));
-       const lc_arg_env_t *arg_env = arm_get_arg_env();
+/**
+ * Comparison callback (qsort() style) for arrays of arch_register_t
+ * pointers: orders the entries by ascending pointer value.
+ *
+ * @return -1 if *a is below *b, 0 if both are equal, 1 otherwise
+ */
+static int reg_cmp(const void *a, const void *b)
+{
+       const arch_register_t * const *ra = a;
+       const arch_register_t * const *rb = b;
 
-       lc_esnprintf(arg_env, cmnt_buf, SNPRINTF_BUF_LEN, "/* MemCopy (%2S)->(%1S) [%d bytes], Use %3S, %4S, %5S and %%r12 */", irn, irn, size, irn, irn, irn);
+       return *ra < *rb ? -1 : (*ra != *rb);
+}
 
-       assert ( size > 0 && "CopyB needs size > 0" );
-       if (size & 3)
+/**
+ * Create the CopyB instruction sequence.
+ */
+static void emit_arm_CopyB(const ir_node *irn)
+{
+       const arm_CopyB_attr_t *attr = get_irn_generic_attr_const(irn);
+       unsigned size = attr->size;
+
+       const char *tgt = arch_register_get_name(get_in_reg(irn, 0));
+       const char *src = arch_register_get_name(get_in_reg(irn, 1));
+       const char *t0, *t1, *t2, *t3;
+
+       const arch_register_t *tmpregs[4];
+
+       /* collect the temporary registers and sort them, we need ascending order */
+       tmpregs[0] = get_in_reg(irn, 2);
+       tmpregs[1] = get_in_reg(irn, 3);
+       tmpregs[2] = get_in_reg(irn, 4);
+       tmpregs[3] = &arm_gp_regs[REG_R12];
+
+       /* Note: R12 is always the last register because the RA did not assign higher ones */
+       qsort((void *)tmpregs, 3, sizeof(tmpregs[0]), reg_cmp);
+
+       /* need ascending order */
+       t0 = arch_register_get_name(tmpregs[0]);
+       t1 = arch_register_get_name(tmpregs[1]);
+       t2 = arch_register_get_name(tmpregs[2]);
+       t3 = arch_register_get_name(tmpregs[3]);
+
+       be_emit_cstring("/* MemCopy (");
+       be_emit_string(src);
+       be_emit_cstring(")->(");
+       arm_emit_source_register(irn, 0);
+       be_emit_irprintf(" [%u bytes], Uses ", size);
+       be_emit_string(t0);
+       be_emit_cstring(", ");
+       be_emit_string(t1);
+       be_emit_cstring(", ");
+       be_emit_string(t2);
+       be_emit_cstring(", and ");
+       be_emit_string(t3);
+       be_emit_cstring("*/");
+       be_emit_finish_line_gas(NULL);
+
+       assert(size > 0 && "CopyB needs size > 0" );
+
+       if (size & 3) {
+               fprintf(stderr, "strange hack enabled: copy more bytes than needed!");
                size += 4;
+       }
+
        size >>= 2;
-       switch(size & 3) {
+       switch (size & 3) {
        case 0:
                break;
        case 1:
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "LDR %%r12, [%2S, #0]!", irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "STR  %%r12, [%1S, #0]!", irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+               be_emit_cstring("\tldr ");
+               be_emit_string(t3);
+               be_emit_cstring(", [");
+               be_emit_string(src);
+               be_emit_cstring(", #0]");
+               be_emit_finish_line_gas(NULL);
+
+               be_emit_cstring("\tstr ");
+               be_emit_string(t3);
+               be_emit_cstring(", [");
+               be_emit_string(tgt);
+               be_emit_cstring(", #0]");
+               be_emit_finish_line_gas(irn);
                break;
        case 2:
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "LDMIA %2S!, {%%r12, %3S}", irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "STMIA %1S!, {%%r12, %3S}", irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+               be_emit_cstring("\tldmia ");
+               be_emit_string(src);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_char('}');
+               be_emit_finish_line_gas(NULL);
+
+               be_emit_cstring("\tstmia ");
+               be_emit_string(tgt);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_char('}');
+               be_emit_finish_line_gas(irn);
                break;
        case 3:
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "LDMIA %2S!, {%%r12, %3S, %4S}", irn, irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "STMIA %1S!, {%%r12, %3S, %4S}", irn, irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+               be_emit_cstring("\tldmia ");
+               be_emit_string(src);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_cstring(", ");
+               be_emit_string(t2);
+               be_emit_char('}');
+               be_emit_finish_line_gas(NULL);
+
+               be_emit_cstring("\tstmia ");
+               be_emit_string(tgt);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_cstring(", ");
+               be_emit_string(t2);
+               be_emit_char('}');
+               be_emit_finish_line_gas(irn);
                break;
        }
        size >>= 2;
        while (size) {
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "LDMIA %2S!, {%%r12, %3S, %4S, %5S}", irn, irn, irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
-               lc_esnprintf(arg_env, cmd_buf, SNPRINTF_BUF_LEN, "STMIA %1S!, {%%r12, %3S, %4S, %5S}", irn, irn, irn, irn);
-               arm_fprintf_format(out, cmd_buf, cmnt_buf, irn);
+               be_emit_cstring("\tldmia ");
+               be_emit_string(src);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_cstring(", ");
+               be_emit_string(t2);
+               be_emit_cstring(", ");
+               be_emit_string(t3);
+               be_emit_char('}');
+               be_emit_finish_line_gas(NULL);
+
+               be_emit_cstring("\tstmia ");
+               be_emit_string(tgt);
+               be_emit_cstring("!, {");
+               be_emit_string(t0);
+               be_emit_cstring(", ");
+               be_emit_string(t1);
+               be_emit_cstring(", ");
+               be_emit_string(t2);
+               be_emit_cstring(", ");
+               be_emit_string(t3);
+               be_emit_char('}');
+               be_emit_finish_line_gas(irn);
                --size;
        }
 }
 
-static void emit_arm_SwitchJmp(ir_node *irn, void *env) {
-       char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
+static void emit_arm_SwitchJmp(const ir_node *irn)
+{
        const ir_edge_t    *edge;
        ir_node            *proj;
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
        int i;
        ir_node **projs;
        int n_projs;
        int block_nr;
-       int default_block_num;
+       ir_node *default_proj = NULL;
 
        block_nr = get_irn_node_nr(irn);
-       n_projs = get_arm_n_projs(irn);
+       n_projs = get_arm_SwitchJmp_n_projs(irn);
 
-       projs = xcalloc(n_projs , sizeof(ir_node*));
+       projs = XMALLOCNZ(ir_node*, n_projs);
 
        foreach_out_edge(irn, edge) {
                proj = get_edge_src_irn(edge);
                assert(is_Proj(proj) && "Only proj allowed at SwitchJmp");
 
-               if (get_Proj_proj(proj) == get_arm_default_proj_num(irn))
-                       default_block_num = get_irn_node_nr(get_irn_link(proj));
+               if (get_Proj_proj(proj) == get_arm_SwitchJmp_default_proj_num(irn))
+                       default_proj = proj;
 
                projs[get_Proj_proj(proj)] = proj;
        }
-
-       // CMP %1S, n_projs - 1
-       // BHI default
-
-
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "CMP %1S, #%u", irn, n_projs - 1);
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "", irn);
-       lc_efprintf(arm_get_arg_env(), out, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "BHI BLOCK_%d", default_block_num);
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "", irn);
-       lc_efprintf(arm_get_arg_env(), out, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "LDR %%r12, TABLE_%d_START", block_nr);
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "", irn);
-       lc_efprintf(arm_get_arg_env(), out, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "ADD %%r12, %%r12, %1S, LSL #2", irn);
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "", irn);
-       lc_efprintf(arm_get_arg_env(), out, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "LDR %%r15, [%%r12, #0]");
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "", irn);
-       lc_efprintf(arm_get_arg_env(), out, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-
-       // LDR %r12, .TABLE_X_START
-       // ADD %r12, %r12, [%1S, LSL #2]
-       // LDR %r15, %r12
-
-       fprintf(out, "TABLE_%d_START:\n\t.word\tTABLE_%d\n", block_nr, block_nr);
-       fprintf(out, "\t.align 2\n");
-       fprintf(out, "TABLE_%d:\n", block_nr);
-
-
-       for ( i=0; i<n_projs; i++) {
-               ir_node *block;
+       assert(default_proj != NULL && "SwitchJmp should have a Default Proj");
+
+       /*
+          CMP %1S, n_projs - 1
+          BHI default
+       */
+
+       be_emit_cstring("\tcmp ");
+       arm_emit_source_register(irn, 0);
+       be_emit_irprintf(", #%u", n_projs - 1);
+       be_emit_finish_line_gas(irn);
+
+       be_emit_cstring("\tbhi ");
+       arm_emit_cfop_target(default_proj);
+       be_emit_finish_line_gas(default_proj);
+
+       /*
+          LDR %r12, TABLE_X_START
+          ADD %r12, %r12, %1S, LSL #2
+          LDR %r15, [%r12, #0]
+        */
+
+       be_emit_irprintf("\tldr %%r12, TABLE_%d_START", block_nr);
+       be_emit_finish_line_gas(NULL);
+
+       be_emit_irprintf("\tadd %%r12, %%r12, ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", LSL #2");
+       be_emit_finish_line_gas(NULL);
+
+       be_emit_cstring("\tldr %r15, [%r12, #0]");
+       be_emit_finish_line_gas(NULL);
+
+       be_emit_irprintf("TABLE_%d_START:\n\t.word\tTABLE_%d", block_nr, block_nr);
+       be_emit_finish_line_gas(NULL);
+       be_emit_irprintf("\t.align 2");
+       be_emit_finish_line_gas(NULL);
+       be_emit_irprintf("TABLE_%d:", block_nr);
+       be_emit_finish_line_gas(NULL);
+
+       for (i = 0; i < n_projs; ++i) {
                proj = projs[i];
-               if ( proj ) {
-                       block = get_irn_link(proj);
-               } else {
-                       block = get_irn_link(projs[get_arm_default_proj_num(irn)]);
+               if (proj == NULL) {
+                       proj = projs[get_arm_SwitchJmp_default_proj_num(irn)];
                }
-               fprintf(out, "\t.word\tBLOCK_%ld\n",get_irn_node_nr(block));
+               be_emit_cstring("\t.word\t");
+               arm_emit_cfop_target(proj);
+               be_emit_finish_line_gas(proj);
        }
-       fprintf(out, "\t.align 2\n");
-
+       be_emit_irprintf("\t.align 2\n");
+       be_emit_finish_line_gas(NULL);
        xfree(projs);
 }
 
-/************************************************************************/
-/* emit_be                                                              */
-/************************************************************************/
-
-static void emit_be_Call(ir_node *irn, void *env) {
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
-       entity *target_entity = be_Call_get_entity(irn);
-       const char *target_name = get_entity_name(target_entity);
-       fprintf(out, "\tBL %s\t\t\t\t/* Call */\n", target_name);
-}
+/** Emit an IncSP node */
+static void emit_be_IncSP(const ir_node *irn)
+{
+       int offs = -be_get_IncSP_offset(irn);
 
-static void emit_be_IncSP(const ir_node *irn, arm_emit_env_t *emit_env) {
-       FILE *F = emit_env->out;
-       unsigned offs = be_get_IncSP_offset(irn);
-       if (offs) {
-               char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "ADD %1D, %1S, #%O", irn, irn, irn );
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* IncSP(%O) */", irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+       if (offs != 0) {
+               if (offs < 0) {
+                       be_emit_cstring("\tsub ");
+                       offs = -offs;
+               } else {
+                       be_emit_cstring("\tadd ");
+               }
+               arm_emit_dest_register(irn, 0);
+               be_emit_cstring(", ");
+               arm_emit_source_register(irn, 0);
+               be_emit_irprintf(", #0x%X", offs);
        } else {
-               char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "");
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* omitted IncSP(%O) */", irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+               /* omitted IncSP(0) */
+               return;
        }
+       be_emit_finish_line_gas(irn);
 }
 
-// void emit_be_AddSP(const ir_node *irn, arm_emit_env_t *emit_env) {
-//     FILE *F = emit_env->out;
-//     char cmd_buf[SNPRINTF_BUF_LEN], cmnt_buf[SNPRINTF_BUF_LEN];
-//     lc_esnprintf(arm_get_arg_env(), cmd_buf, SNPRINTF_BUF_LEN, "ADD %1D, %1S, %2S", irn, irn, irn );
-//     lc_esnprintf(arm_get_arg_env(), cmnt_buf, SNPRINTF_BUF_LEN, "/* AddSP(%2S) */", irn);
-//     lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-// }
-
-static void emit_be_Copy(const ir_node *irn, arm_emit_env_t *emit_env) {
-       FILE *F    = emit_env->out;
+static void emit_be_Copy(const ir_node *irn)
+{
        ir_mode *mode = get_irn_mode(irn);
-       assert( (mode != mode_E) && "IEEE Extended FP not supported");
 
        if (get_in_reg(irn, 0) == get_out_reg(irn, 0)) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "");
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* omitted Copy: %1S -> %1D */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+               /* omitted Copy */
                return;
        }
 
-       if (mode == mode_F) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "FCPYS %1D, %1S", irn, irn);
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* Copy: %1S -> %1D */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-       } else if (mode == mode_D) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "FCPYD %1D, %1S", irn, irn);
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* Copy: %1S -> %1D */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-       } else if (mode_is_numP(mode)) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "MOV %1D, %1S", irn, irn);
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* Copy: %1S -> %1D */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+       if (mode_is_float(mode)) {
+               if (USE_FPA(cg->isa)) {
+                       be_emit_cstring("\tmvf");
+                       be_emit_char(' ');
+                       arm_emit_dest_register(irn, 0);
+                       be_emit_cstring(", ");
+                       arm_emit_source_register(irn, 0);
+                       be_emit_finish_line_gas(irn);
+               } else {
+                       panic("emit_be_Copy: move not supported for this mode");
+               }
+       } else if (mode_is_data(mode)) {
+               be_emit_cstring("\tmov ");
+               arm_emit_dest_register(irn, 0);
+               be_emit_cstring(", ");
+               arm_emit_source_register(irn, 0);
+               be_emit_finish_line_gas(irn);
        } else {
-               assert(0 && "move not supported for this mode");
+               panic("emit_be_Copy: move not supported for this mode");
        }
-//     emit_arm_Copy(irn, emit_env);
 }
 
-static void emit_be_Spill(const ir_node *irn, arm_emit_env_t *emit_env) {
-       FILE *F = emit_env->out;
-       ir_mode *mode = get_irn_mode(irn);
-       assert( (mode != mode_E) && "IEEE Extended FP not supported");
-       if (mode_is_dataM(mode)) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "STR %2S, [%1S, #%O]", irn, irn, irn );
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* Spill(%2S) -> (%1S) */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-       } else {
-               assert(0 && "spill not supported for this mode");
-       }
+static void emit_be_Perm(const ir_node *irn)
+{
+       be_emit_cstring("\teor ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 1);
+       be_emit_finish_line_gas(NULL);
+
+       be_emit_cstring("\teor ");
+       arm_emit_source_register(irn, 1);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 1);
+       be_emit_finish_line_gas(NULL);
+
+       be_emit_cstring("\teor ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 0);
+       be_emit_cstring(", ");
+       arm_emit_source_register(irn, 1);
+       be_emit_finish_line_gas(irn);
 }
 
-static void emit_be_Reload(const ir_node* irn, arm_emit_env_t *emit_env) {
-       FILE *F = emit_env->out;
-       ir_mode *mode = get_irn_mode(irn);
-       assert( (mode != mode_E) && "IEEE Extended FP not supported");
-       if (mode_is_dataM(mode)) {
-               char cmd_buf[256], cmnt_buf[256];
-               lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "LDR %1D, [%1S, #%O]", irn, irn, irn );
-               lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* Reload(%1S) -> (%1D) */", irn, irn);
-               lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
-       } else {
-               assert(0 && "reload not supported for this mode");
+static void emit_be_MemPerm(const ir_node *node)
+{
+       int i;
+       int memperm_arity;
+       int sp_change = 0;
+
+       /* TODO: this implementation is slower than necessary.
+          The long-term goal, however, is to avoid the MemPerm node completely. */
+
+       memperm_arity = be_get_MemPerm_entity_arity(node);
+       if (memperm_arity > 12)
+               panic("memperm with more than 12 inputs not supported yet");
+
+       for (i = 0; i < memperm_arity; ++i) {
+               int offset;
+               ir_entity *entity = be_get_MemPerm_in_entity(node, i);
+
+               /* spill register */
+               be_emit_irprintf("\tstr r%d, [sp, #-4]!", i);
+               be_emit_finish_line_gas(node);
+               sp_change += 4;
+               /* load from entity */
+               offset = get_entity_offset(entity) + sp_change;
+               be_emit_irprintf("\tldr r%d, [sp, #%d]", i, offset);
+               be_emit_finish_line_gas(node);
        }
-}
 
-static void emit_be_Perm(const ir_node* irn, arm_emit_env_t *emit_env) {
-       FILE *F = emit_env->out;
-       ir_mode *mode = get_irn_mode(irn);
-       assert( (mode != mode_E) && "IEEE Extended FP not supported");
-       lc_efprintf(arm_get_arg_env(), F, "\tEOR %1S, %1S, %2S\t\t\t/* begin Perm(%1S, %2S) */\n", irn, irn, irn, irn, irn);
-       lc_efprintf(arm_get_arg_env(), F, "\tEOR %2S, %1S, %2S\n", irn, irn, irn);
-       lc_efprintf(arm_get_arg_env(), F, "\tEOR %1S, %1S, %2S\t\t\t/* end Perm(%1S, %2S) */\n", irn, irn, irn, irn, irn);
+       for (i = memperm_arity-1; i >= 0; --i) {
+               int        offset;
+               ir_entity *entity = be_get_MemPerm_out_entity(node, i);
+
+               /* store to new entity */
+               offset = get_entity_offset(entity) + sp_change;
+               be_emit_irprintf("\tstr r%d, [sp, #%d]", i, offset);
+               be_emit_finish_line_gas(node);
+               /* restore register */
+               be_emit_irprintf("\tldr r%d, [sp], #4", i);
+               sp_change -= 4;
+               be_emit_finish_line_gas(node);
+       }
+       assert(sp_change == 0);
 }
 
-static void emit_be_StackParam(const ir_node *irn, arm_emit_env_t *emit_env) {
-       FILE *F = emit_env->out;
-       ir_mode *mode = get_irn_mode(irn);
-       char cmd_buf[256], cmnt_buf[256];
-       assert( (mode != mode_E) && "IEEE Extended FP not supported");
-
-       lc_esnprintf(arm_get_arg_env(), cmd_buf, 256, "LDR %1D, [%1S, #%O]", irn, irn, irn );
-       lc_esnprintf(arm_get_arg_env(), cmnt_buf, 256, "/* StackParam: (%1S + %O) -> %1D */",irn , irn, irn, get_irn_n(irn, 0));
-       lc_efprintf(arm_get_arg_env(), F, "\t%-35s %-60s /* %+F */\n", cmd_buf, cmnt_buf, irn);
+static void emit_be_Return(const ir_node *node)
+{
+       be_emit_cstring("\tmov pc, lr");
+       be_emit_finish_line_gas(node);
 }
 
-/************************************************************************/
-/* emit                                                                 */
-/************************************************************************/
 
-static void emit_Jmp(ir_node *irn, void *env) {
-       arm_emit_env_t *emit_env = env;
-       FILE *out = emit_env->out;
-       const ir_edge_t *edge = get_irn_out_edge_first(irn);
-       ir_node *target_block = get_edge_src_irn(edge);
-       fprintf(out, "\tB BLOCK_%ld\t\t\t/* unconditional Jump */\n", get_irn_node_nr(target_block));
-}
+static void emit_arm_Jmp(const ir_node *node)
+{
+       ir_node *block, *next_block;
 
-static void emit_Proj(ir_node *irn, void *env) {
+       /* for now, the code works for scheduled and non-scheduled blocks */
+       block = get_nodes_block(node);
 
+       /* we have a block schedule */
+       next_block = sched_next_block(block);
+       if (get_cfop_target_block(node) != next_block) {
+               be_emit_cstring("\tb ");
+               arm_emit_cfop_target(node);
+       } else {
+               be_emit_cstring("\t/* fallthrough to ");
+               arm_emit_cfop_target(node);
+               be_emit_cstring(" */");
+       }
+       be_emit_finish_line_gas(node);
 }
 
+static void emit_nothing(const ir_node *irn)
+{
+       (void) irn;
+}
 
+/**
+ * The type of an emitter function.
+ */
+typedef void (emit_func)(const ir_node *irn);
 
-/***********************************************************************************
- *                  _          __                                             _
- *                 (_)        / _|                                           | |
- *  _ __ ___   __ _ _ _ __   | |_ _ __ __ _ _ __ ___   _____      _____  _ __| | __
- * | '_ ` _ \ / _` | | '_ \  |  _| '__/ _` | '_ ` _ \ / _ \ \ /\ / / _ \| '__| |/ /
- * | | | | | | (_| | | | | | | | | | | (_| | | | | | |  __/\ V  V / (_) | |  |   <
- * |_| |_| |_|\__,_|_|_| |_| |_| |_|  \__,_|_| |_| |_|\___| \_/\_/ \___/|_|  |_|\_\
- *
- ***********************************************************************************/
+/**
+ * Set a node emitter. Make it a bit more type safe.
+ */
+static inline void set_emitter(ir_op *op, emit_func arm_emit_node)
+{
+       op->ops.generic = (op_func)arm_emit_node;
+}
 
 /**
  * Enters the emitter functions for handled nodes into the generic
  * pointer of an opcode.
  */
-static void arm_register_emitters(void) {
-
-#define ARM_EMIT(a) op_arm_##a->ops.generic = (op_func)emit_arm_##a
-#define EMIT(a)      op_##a->ops.generic = (op_func)emit_##a
-#define BE_EMIT(a)   op_be_##a->ops.generic = (op_func)emit_be_##a
-
+static void arm_register_emitters(void)
+{
        /* first clear the generic function pointer for all ops */
        clear_irp_opcodes_generic_func();
 
        /* register all emitter functions defined in spec */
        arm_register_spec_emitters();
 
-       /* other emitter functions */
-       ARM_EMIT(CondJmp);
-//     ARM_EMIT(SwitchJmp);
-       ARM_EMIT(CopyB);
-//     ARM_EMIT(CopyB_i);
-//     ARM_EMIT(Const);
-       ARM_EMIT(SymConst);
-       ARM_EMIT(SwitchJmp);
-
-       /* benode emitter */
-       BE_EMIT(Call);
-       BE_EMIT(IncSP);
-//     BE_EMIT(AddSP);
-       BE_EMIT(Copy);
-       BE_EMIT(Spill);
-       BE_EMIT(Reload);
-       BE_EMIT(Perm);
-       BE_EMIT(StackParam);
-
-       /* firm emitter */
-       EMIT(Jmp);
-
-
-       /* noisy stuff */
-#ifdef SILENCER
-       EMIT(Proj);
-#endif
-
-#undef ARM_EMIT
-#undef BE_EMIT
-#undef EMIT
+       /* custom emitter */
+       set_emitter(op_arm_B,         emit_arm_B);
+       set_emitter(op_arm_CopyB,     emit_arm_CopyB);
+       set_emitter(op_arm_fConst,    emit_arm_fConst);
+       set_emitter(op_arm_FrameAddr, emit_arm_FrameAddr);
+       set_emitter(op_arm_Jmp,       emit_arm_Jmp);
+       set_emitter(op_arm_SwitchJmp, emit_arm_SwitchJmp);
+       set_emitter(op_arm_SymConst,  emit_arm_SymConst);
+       set_emitter(op_be_Copy,       emit_be_Copy);
+       set_emitter(op_be_CopyKeep,   emit_be_Copy);
+       set_emitter(op_be_IncSP,      emit_be_IncSP);
+       set_emitter(op_be_MemPerm,    emit_be_MemPerm);
+       set_emitter(op_be_Perm,       emit_be_Perm);
+       set_emitter(op_be_Return,     emit_be_Return);
+
+       /* no need to emit anything for the following nodes */
+       set_emitter(op_Phi,           emit_nothing);
+       set_emitter(op_be_Keep,       emit_nothing);
+       set_emitter(op_be_Start,      emit_nothing);
+       set_emitter(op_be_Barrier,    emit_nothing);
 }
 
 /**
  * Emits code for a node.
  */
-static void arm_emit_node(const ir_node *irn, void *env) {
-       arm_emit_env_t        *emit_env = env;
-       FILE              *F        = emit_env->out;
-       ir_op             *op       = get_irn_op(irn);
-       DEBUG_ONLY(firm_dbg_module_t *mod      = emit_env->mod;)
-
-       DBG((mod, LEVEL_1, "emitting code for %+F\n", irn));
+static void arm_emit_node(const ir_node *irn)
+{
+       ir_op *op = get_irn_op(irn);
 
        if (op->ops.generic) {
-               void (*emit)(const ir_node *, void *) = (void (*)(const ir_node *, void *))op->ops.generic;
-               (*emit)(irn, env);
-       }
-       else {
-               ir_fprintf(F, "\t\t\t\t\t/* %+F */\n", irn);
+               emit_func *emit = (emit_func *)op->ops.generic;
+               be_dbg_set_dbg_info(get_irn_dbg_info(irn));
+               (*emit)(irn);
+       } else {
+               panic("Error: No emit handler for node %+F (graph %+F)\n",
+                     irn, current_ir_graph);
        }
 }
 
 /**
- * Walks over the nodes in a block connected by scheduling edges
- * and emits code for each node.
+ * Emit the block label if needed.
  */
-void arm_gen_block(ir_node *block, void *env) {
-       ir_node *irn;
+static void arm_emit_block_header(ir_node *block, ir_node *prev)
+{
+       int           n_cfgpreds;
+       int           need_label;
+       int           i, arity;
+       ir_exec_freq  *exec_freq = be_get_irg_exec_freq(cg->irg);
+
+       need_label = 0;
+       n_cfgpreds = get_Block_n_cfgpreds(block);
+       if (n_cfgpreds == 1) {
+               ir_node *pred       = get_Block_cfgpred(block, 0);
+               ir_node *pred_block = get_nodes_block(pred);
+
+               /* we don't need labels for fallthrough blocks; however, switch-jmps
+                * are never fallthroughs */
+               if (pred_block == prev &&
+                               !(is_Proj(pred) && is_arm_SwitchJmp(get_Proj_pred(pred)))) {
+                       need_label = 0;
+               } else {
+                       need_label = 1;
+               }
+       } else {
+               need_label = 1;
+       }
 
-       if (! is_Block(block))
-               return;
+       if (need_label) {
+               be_gas_emit_block_name(block);
+               be_emit_char(':');
 
-       fprintf(((arm_emit_env_t *)env)->out, "BLOCK_%ld:\n", get_irn_node_nr(block));
-       sched_foreach(block, irn) {
-               arm_emit_node(irn, env);
+               be_emit_pad_comment();
+               be_emit_cstring("   /* preds:");
+
+               /* emit list of pred blocks in comment */
+               arity = get_irn_arity(block);
+               for (i = 0; i < arity; ++i) {
+                       ir_node *predblock = get_Block_cfgpred_block(block, i);
+                       be_emit_irprintf(" %d", get_irn_node_nr(predblock));
+               }
+       } else {
+               be_emit_cstring("\t/* ");
+               be_gas_emit_block_name(block);
+               be_emit_cstring(": ");
+       }
+       if (exec_freq != NULL) {
+               be_emit_irprintf(" freq: %f",
+                                get_block_execfreq(exec_freq, block));
        }
+       be_emit_cstring(" */\n");
+       be_emit_write_line();
 }
 
-
 /**
- * Emits code for function start.
+ * Walks over the nodes in a block connected by scheduling edges
+ * and emits code for each node.
  */
-void arm_emit_start(FILE *F, ir_graph *irg) {
-       const char *irg_name = get_entity_name(get_irg_entity(irg));
-       fprintf(F, "\t.text\n");
-       fprintf(F, "\t.align  2\n");
-       fprintf(F, "\t.global %s\n", irg_name);
-       fprintf(F, "%s:\n", irg_name);
-}
+static void arm_gen_block(ir_node *block, ir_node *prev_block)
+{
+       ir_node *irn;
 
-/**
- * Emits code for function end
- */
-void arm_emit_end(FILE *F, ir_graph *irg) {
+       arm_emit_block_header(block, prev_block);
+       be_dbg_set_dbg_info(get_irn_dbg_info(block));
+       sched_foreach(block, irn) {
+               arm_emit_node(irn);
+       }
 }
 
 /**
+ * Block-walker:
  * Sets labels for control flow nodes (jump target)
- * TODO: Jump optimization
+ *
+ * @param block  the block whose control-flow predecessors are visited
+ * @param env    walker environment, unused
  */
-void arm_gen_labels(ir_node *block, void *env) {
+static void arm_gen_labels(ir_node *block, void *env)
+{
        ir_node *pred;
        int n = get_Block_n_cfgpreds(block);
+       (void)env;
 
        for (n--; n >= 0; n--) { /* visit the predecessors from last to first */
                pred = get_Block_cfgpred(block, n);
@@ -817,25 +1028,100 @@ void arm_gen_labels(ir_node *block, void *env) {
        }
 }
 
-
 /**
- * Main driver
+ * Compare two entries of the symbol or tarval set.
+ *
+ * Used as the compare callback of the sym_or_tv set (see new_set() in
+ * arm_gen_routine()).
+ *
+ * @param elt   first entry, interpreted as a sym_or_tv_t
+ * @param key   second entry, interpreted as a sym_or_tv_t
+ * @param size  unused
+ * @return 0 if both entries hold the same u.generic pointer,
+ *         non-zero otherwise
  */
-void arm_gen_routine(FILE *F, ir_graph *irg, const arm_code_gen_t *cg) {
-       arm_emit_env_t emit_env;
+static int cmp_sym_or_tv(const void *elt, const void *key, size_t size)
+{
+       const sym_or_tv_t *p1 = elt;
+       const sym_or_tv_t *p2 = key;
+       (void) size;
+
+       /* An identifier can never point to a tarval, so comparing the
+          generic pointer member is enough to tell two entries apart. */
+       return p1->u.generic != p2->u.generic;
+}
+
+/**
+ * Main driver: emits the assembler output for one graph.
+ *
+ * Emits the function prolog, all blocks in block-schedule order, the
+ * constants collected in the sym_or_tv set (one label plus .word data
+ * per entry) and finally the function epilog.
+ *
+ * @param arm_cg  the code generator; stored in `cg`, which is not declared
+ *                in this function (presumably file-scope state read by the
+ *                node emitters -- confirm)
+ * @param irg     the graph to emit
+ */
+void arm_gen_routine(const arm_code_gen_t *arm_cg, ir_graph *irg)
+{
+       ir_node   **blk_sched;
+       int       i, n;
+       ir_node   *last_block = NULL;
+       ir_entity *entity     = get_irg_entity(irg);
 
-       emit_env.out      = F;
-       emit_env.arch_env = cg->arch_env;
-       emit_env.cg       = cg;
-       FIRM_DBG_REGISTER(emit_env.mod, "firm.be.arm.emit");
+       cg        = arm_cg;
+       /* fresh set per routine; it is destroyed again before the epilog.
+          NOTE(review): presumably filled by the node emitters -- confirm */
+       sym_or_tv = new_set(cmp_sym_or_tv, 8);
 
-       /* set the global arch_env (needed by print hooks) */
-       arch_env = cg->arch_env;
+       /* NOTE(review): presumably '%' is needed because '@' starts a comment
+          in ARM gas syntax -- confirm */
+       be_gas_elf_type_char = '%';
 
        arm_register_emitters();
 
-       arm_emit_start(F, irg);
-       irg_block_walk_graph(irg, arm_gen_labels, NULL, &emit_env);
-       irg_walk_blkwise_graph(irg, NULL, arm_gen_block, &emit_env);
-       arm_emit_end(F, irg);
+       be_dbg_method_begin(entity);
+
+       /* create the block schedule */
+       blk_sched = be_create_block_schedule(irg);
+
+       be_gas_emit_function_prolog(entity, 4);
+
+       irg_block_walk_graph(irg, arm_gen_labels, NULL, NULL);
+
+       /* emit the blocks in schedule order; `i` is advanced inside the body
+          so that it already indexes the successor when next_bl is read */
+       n = ARR_LEN(blk_sched);
+       for (i = 0; i < n;) {
+               ir_node *block, *next_bl;
+
+               block   = blk_sched[i];
+               ++i;
+               next_bl = i < n ? blk_sched[i] : NULL;
+
+               /* Store the next scheduled block (NULL for the last one) in the
+                  link field: the emitter expects to find it there. */
+               set_irn_link(block, next_bl);
+               arm_gen_block(block, last_block);
+               last_block = block;
+       }
+
+       /* emit SymConst values */
+       if (set_count(sym_or_tv) > 0) {
+               sym_or_tv_t *entry;
+
+               be_emit_cstring("\t.align 2\n");
+
+               foreach_set(sym_or_tv, entry) {
+                       emit_constant_name(entry);
+                       be_emit_cstring(":\n");
+                       be_emit_write_line();
+
+                       if (entry->is_entity) {
+                               /* entity entry: a single word holding the entity */
+                               be_emit_cstring("\t.word\t");
+                               be_gas_emit_entity(entry->u.entity);
+                               be_emit_char('\n');
+                               be_emit_write_line();
+                       } else {
+                               /* tarval entry: emitted as a sequence of 32 bit words */
+                               tarval *tv = entry->u.tv;
+                               /* NOTE(review): this inner `i` shadows the function-level `i` */
+                               int i, size = get_mode_size_bytes(get_tarval_mode(tv));
+                               unsigned v;
+
+                               /* beware: ARM fpa uses big endian format */
+                               /* size is rounded up to a multiple of 4; the words are
+                                  emitted starting with the one at the highest byte offset */
+                               for (i = ((size + 3) & ~3) - 4; i >= 0; i -= 4) {
+                                       /* get 32 bits */
+                                       v =            get_tarval_sub_bits(tv, i+3);
+                                       v = (v << 8) | get_tarval_sub_bits(tv, i+2);
+                                       v = (v << 8) | get_tarval_sub_bits(tv, i+1);
+                                       v = (v << 8) | get_tarval_sub_bits(tv, i+0);
+                                       be_emit_irprintf("\t.word\t%u\n", v);
+                                       be_emit_write_line();
+                               }
+                       }
+               }
+               be_emit_char('\n');
+               be_emit_write_line();
+       }
+       del_set(sym_or_tv);
+
+       be_gas_emit_function_epilog(entity);
+       be_dbg_method_end();
+}
+
+/**
+ * Initializes the emitter: passes `dbg` and the module name
+ * "firm.be.arm.emit" to FIRM_DBG_REGISTER (presumably registering the
+ * emitter's debug module -- confirm).
+ */
+void arm_init_emitter(void)
+{
+       FIRM_DBG_REGISTER(dbg, "firm.be.arm.emit");
 }