X-Git-Url: http://nsz.repo.hu/git/?a=blobdiff_plain;f=ir%2Fbe%2Fia32%2Fia32_emitter.c;h=a55008299ddd94193c01ff6a004d9388d35578e0;hb=ebdaa596d904a0651c8d794481288d2d629bdb3a;hp=d377143b0af700954862016768d01af9254fa5f0;hpb=5cb14f12bacb0c7d1c646112b4660d57e14236a2;p=libfirm diff --git a/ir/be/ia32/ia32_emitter.c b/ir/be/ia32/ia32_emitter.c index d377143b0..4716f55f4 100644 --- a/ir/be/ia32/ia32_emitter.c +++ b/ir/be/ia32/ia32_emitter.c @@ -23,9 +23,7 @@ * @author Christian Wuerdig, Matthias Braun * @version $Id$ */ -#ifdef HAVE_CONFIG_H #include "config.h" -#endif #include @@ -39,18 +37,20 @@ #include "irargs_t.h" #include "irprog_t.h" #include "iredges_t.h" +#include "irtools.h" #include "execfreq.h" #include "error.h" #include "raw_bitset.h" #include "dbginfo.h" +#include "lc_opts.h" -#include "../besched_t.h" -#include "../benode_t.h" +#include "../besched.h" +#include "../benode.h" #include "../beabi.h" #include "../be_dbgout.h" #include "../beemitter.h" #include "../begnuas.h" -#include "../beirg_t.h" +#include "../beirg.h" #include "../be_dbgout.h" #include "ia32_emitter.h" @@ -68,12 +68,12 @@ DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;) #define SNPRINTF_BUF_LEN 128 -static const arch_env_t *arch_env; static const ia32_isa_t *isa; static ia32_code_gen_t *cg; -static int do_pic; static char pic_base_label[128]; static ir_label_t exc_label_id; +static int mark_spill_reload = 0; +static int do_pic; /** Return the next block in Block schedule */ static ir_node *get_prev_block_sched(const ir_node *block) @@ -81,6 +81,7 @@ static ir_node *get_prev_block_sched(const ir_node *block) return get_irn_link(block); } +/** Checks if the current block is a fall-through target. 
*/ static int is_fallthrough(const ir_node *cfgpred) { ir_node *pred; @@ -94,11 +95,18 @@ static int is_fallthrough(const ir_node *cfgpred) return 1; } +/** + * returns non-zero if the given block needs a label + * because of being a jump-target (and not a fall-through) + */ static int block_needs_label(const ir_node *block) { int need_label = 1; int n_cfgpreds = get_Block_n_cfgpreds(block); + if (has_Block_entity(block)) + return 1; + if (n_cfgpreds == 0) { need_label = 0; } else if (n_cfgpreds == 1) { @@ -128,7 +136,7 @@ static const arch_register_t *get_in_reg(const ir_node *irn, int pos) in register we need. */ op = get_irn_n(irn, pos); - reg = arch_get_irn_register(arch_env, op); + reg = arch_get_irn_register(op); assert(reg && "no in register found"); @@ -137,10 +145,7 @@ static const arch_register_t *get_in_reg(const ir_node *irn, int pos) /* in case of unknown register: just return a valid register */ if (reg == &ia32_gp_regs[REG_GP_UKNWN]) { - const arch_register_req_t *req; - - /* ask for the requirements */ - req = arch_get_register_req(arch_env, irn, pos); + const arch_register_req_t *req = arch_get_register_req(irn, pos); if (arch_register_req_is(req, limited)) { /* in case of limited requirements: get the first allowed register */ @@ -170,9 +175,9 @@ static const arch_register_t *get_out_reg(const ir_node *irn, int pos) if (get_irn_mode(irn) != mode_T) { assert(pos == 0); - reg = arch_get_irn_register(arch_env, irn); + reg = arch_get_irn_register(irn); } else if (is_ia32_irn(irn)) { - reg = get_ia32_out_reg(irn, pos); + reg = arch_irn_get_register(irn, pos); } else { const ir_edge_t *edge; @@ -180,7 +185,7 @@ static const arch_register_t *get_out_reg(const ir_node *irn, int pos) proj = get_edge_src_irn(edge); assert(is_Proj(proj) && "non-Proj from mode_T node"); if (get_Proj_proj(proj) == pos) { - reg = arch_get_irn_register(arch_env, proj); + reg = arch_get_irn_register(proj); break; } } @@ -211,6 +216,9 @@ static char *get_unique_label(char *buf, 
size_t buflen, const char *prefix) * |_| |_| *************************************************************/ +/** + * Emit the name of the 8bit low register + */ static void emit_8bit_register(const arch_register_t *reg) { const char *reg_name = arch_register_get_name(reg); @@ -220,6 +228,18 @@ static void emit_8bit_register(const arch_register_t *reg) be_emit_char('l'); } +/** + * Emit the name of the 8bit high register + */ +static void emit_8bit_register_high(const arch_register_t *reg) +{ + const char *reg_name = arch_register_get_name(reg); + + be_emit_char('%'); + be_emit_char(reg_name[1]); + be_emit_char('h'); +} + static void emit_16bit_register(const arch_register_t *reg) { const char *reg_name = ia32_get_mapped_reg_name(isa->regs_16bit, reg); @@ -228,6 +248,12 @@ static void emit_16bit_register(const arch_register_t *reg) be_emit_string(reg_name); } +/** + * emit a register, possible shortened by a mode + * + * @param reg the register + * @param mode the mode of the register or NULL for full register + */ static void emit_register(const arch_register_t *reg, const ir_mode *mode) { const char *reg_name; @@ -254,12 +280,52 @@ void ia32_emit_source_register(const ir_node *node, int pos) emit_register(reg, NULL); } -static void emit_ia32_Immediate(const ir_node *node); +static void ia32_emit_entity(ir_entity *entity, int no_pic_adjust) +{ + be_gas_emit_entity(entity); + + if (get_entity_owner(entity) == get_tls_type()) { + if (get_entity_linkage(entity) & IR_LINKAGE_EXTERN) { + be_emit_cstring("@INDNTPOFF"); + } else { + be_emit_cstring("@NTPOFF"); + } + } + + if (do_pic && !no_pic_adjust) { + be_emit_char('-'); + be_emit_string(pic_base_label); + } +} + +static void emit_ia32_Immediate_no_prefix(const ir_node *node) +{ + const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(node); + + if (attr->symconst != NULL) { + if (attr->sc_sign) + be_emit_char('-'); + ia32_emit_entity(attr->symconst, attr->no_pic_adjust); + } + if (attr->symconst == NULL || 
attr->offset != 0) { + if (attr->symconst != NULL) { + be_emit_irprintf("%+d", attr->offset); + } else { + be_emit_irprintf("0x%X", attr->offset); + } + } +} + +static void emit_ia32_Immediate(const ir_node *node) +{ + be_emit_char('$'); + emit_ia32_Immediate_no_prefix(node); +} void ia32_emit_8bit_source_register_or_immediate(const ir_node *node, int pos) { const arch_register_t *reg; - ir_node *in = get_irn_n(node, pos); + const ir_node *in = get_irn_n(node, pos); if (is_ia32_Immediate(in)) { emit_ia32_Immediate(in); return; @@ -269,6 +335,25 @@ void ia32_emit_8bit_source_register_or_immediate(const ir_node *node, int pos) emit_8bit_register(reg); } +void ia32_emit_8bit_high_source_register(const ir_node *node, int pos) +{ + const arch_register_t *reg = get_in_reg(node, pos); + emit_8bit_register_high(reg); +} + +void ia32_emit_16bit_source_register_or_immediate(const ir_node *node, int pos) +{ + const arch_register_t *reg; + const ir_node *in = get_irn_n(node, pos); + if (is_ia32_Immediate(in)) { + emit_ia32_Immediate(in); + return; + } + + reg = get_in_reg(node, pos); + emit_16bit_register(reg); +} + void ia32_emit_dest_register(const ir_node *node, int pos) { const arch_register_t *reg = get_out_reg(node, pos); @@ -276,6 +361,13 @@ void ia32_emit_dest_register(const ir_node *node, int pos) emit_register(reg, NULL); } +void ia32_emit_dest_register_size(const ir_node *node, int pos) +{ + const arch_register_t *reg = get_out_reg(node, pos); + + emit_register(reg, get_ia32_ls_mode(node)); +} + void ia32_emit_8bit_dest_register(const ir_node *node, int pos) { const arch_register_t *reg = get_out_reg(node, pos); @@ -294,23 +386,14 @@ void ia32_emit_x87_register(const ir_node *node, int pos) static void ia32_emit_mode_suffix_mode(const ir_mode *mode) { - if (mode_is_float(mode)) { - switch(get_mode_size_bits(mode)) { - case 32: be_emit_char('s'); return; - case 64: be_emit_char('l'); return; - case 80: - case 96: be_emit_char('t'); return; - } - } else { - 
assert(mode_is_int(mode) || mode_is_reference(mode)); - switch(get_mode_size_bits(mode)) { + assert(mode_is_int(mode) || mode_is_reference(mode)); + switch (get_mode_size_bits(mode)) { + case 8: be_emit_char('b'); return; + case 16: be_emit_char('w'); return; + case 32: be_emit_char('l'); return; /* gas docu says q is the suffix but gcc, objdump and icc use ll * apparently */ case 64: be_emit_cstring("ll"); return; - case 32: be_emit_char('l'); return; - case 16: be_emit_char('w'); return; - case 8: be_emit_char('b'); return; - } } panic("Can't output mode_suffix for %+F", mode); } @@ -326,12 +409,33 @@ void ia32_emit_mode_suffix(const ir_node *node) void ia32_emit_x87_mode_suffix(const ir_node *node) { + ir_mode *mode; + /* we only need to emit the mode on address mode */ - if (get_ia32_op_type(node) != ia32_Normal) { - ir_mode *mode = get_ia32_ls_mode(node); - assert(mode != NULL); - ia32_emit_mode_suffix_mode(mode); + if (get_ia32_op_type(node) == ia32_Normal) + return; + + mode = get_ia32_ls_mode(node); + assert(mode != NULL); + + if (mode_is_float(mode)) { + switch (get_mode_size_bits(mode)) { + case 32: be_emit_char('s'); return; + case 64: be_emit_char('l'); return; + case 80: + case 96: be_emit_char('t'); return; + } + } else { + assert(mode_is_int(mode)); + switch (get_mode_size_bits(mode)) { + case 16: be_emit_char('s'); return; + case 32: be_emit_char('l'); return; + /* gas docu says q is the suffix but gcc, objdump and icc use ll + * apparently */ + case 64: be_emit_cstring("ll"); return; + } } + panic("Can't output mode_suffix for %+F", mode); } static char get_xmm_mode_suffix(ir_mode *mode) @@ -359,11 +463,13 @@ void ia32_emit_xmm_mode_suffix_s(const ir_node *node) be_emit_char(get_xmm_mode_suffix(mode)); } -void ia32_emit_extend_suffix(const ir_mode *mode) +void ia32_emit_extend_suffix(const ir_node *node) { + ir_mode *mode = get_ia32_ls_mode(node); if (get_mode_size_bits(mode) == 32) return; be_emit_char(mode_is_signed(mode) ? 
's' : 'z'); + ia32_emit_mode_suffix_mode(mode); } void ia32_emit_source_register_or_immediate(const ir_node *node, int pos) @@ -379,130 +485,94 @@ void ia32_emit_source_register_or_immediate(const ir_node *node, int pos) } /** - * Emits registers and/or address mode of a binary operation. + * Returns the target block for a control flow node. */ -void ia32_emit_binop(const ir_node *node) +static ir_node *get_cfop_target_block(const ir_node *irn) { - const ir_node *right_op = get_irn_n(node, n_ia32_binary_right); - const ir_mode *mode = get_ia32_ls_mode(node); - const arch_register_t *reg_left; - - switch(get_ia32_op_type(node)) { - case ia32_Normal: - reg_left = get_in_reg(node, n_ia32_binary_left); - if (is_ia32_Immediate(right_op)) { - emit_ia32_Immediate(right_op); - be_emit_cstring(", "); - emit_register(reg_left, mode); - break; - } else { - const arch_register_t *reg_right - = get_in_reg(node, n_ia32_binary_right); - emit_register(reg_right, mode); - be_emit_cstring(", "); - emit_register(reg_left, mode); - } - break; - case ia32_AddrModeS: - if (is_ia32_Immediate(right_op)) { - emit_ia32_Immediate(right_op); - be_emit_cstring(", "); - ia32_emit_am(node); - } else { - reg_left = get_in_reg(node, n_ia32_binary_left); - ia32_emit_am(node); - be_emit_cstring(", "); - emit_register(reg_left, mode); - } - break; - case ia32_AddrModeD: - panic("DestMode can't be output by %%binop anymore"); - break; - default: - assert(0 && "unsupported op type"); - } + assert(get_irn_mode(irn) == mode_X); + return get_irn_link(irn); } /** - * Emits registers and/or address mode of a binary operation. + * Emits a block label for the given block. 
*/ -void ia32_emit_x87_binop(const ir_node *node) +static void ia32_emit_block_name(const ir_node *block) { - switch(get_ia32_op_type(node)) { - case ia32_Normal: - { - const ia32_x87_attr_t *x87_attr = get_ia32_x87_attr_const(node); - const arch_register_t *in1 = x87_attr->x87[0]; - const arch_register_t *in2 = x87_attr->x87[1]; - const arch_register_t *out = x87_attr->x87[2]; - const arch_register_t *in; - - in = out ? ((out == in2) ? in1 : in2) : in2; - out = out ? out : in1; - - be_emit_char('%'); - be_emit_string(arch_register_get_name(in)); - be_emit_cstring(", %"); - be_emit_string(arch_register_get_name(out)); - } - break; - case ia32_AddrModeS: - ia32_emit_am(node); - break; - case ia32_AddrModeD: - default: - assert(0 && "unsupported op type"); + if (has_Block_entity(block)) { + ir_entity *entity = get_Block_entity(block); + be_gas_emit_entity(entity); + } else { + be_emit_cstring(BLOCK_PREFIX); + be_emit_irprintf("%ld", get_irn_node_nr(block)); } } /** - * Emits registers and/or address mode of a unary operation. + * Emits the target label for a control flow node. 
*/ -void ia32_emit_unop(const ir_node *node, int pos) +static void ia32_emit_cfop_target(const ir_node *node) { - const ir_node *op; - - switch(get_ia32_op_type(node)) { - case ia32_Normal: - op = get_irn_n(node, pos); - if (is_ia32_Immediate(op)) { - emit_ia32_Immediate(op); - } else { - ia32_emit_source_register(node, pos); - } - break; - case ia32_AddrModeS: - case ia32_AddrModeD: - ia32_emit_am(node); - break; - default: - assert(0 && "unsupported op type"); - } + ir_node *block = get_cfop_target_block(node); + ia32_emit_block_name(block); } -static void ia32_emit_entity(ir_entity *entity, int no_pic_adjust) -{ - ident *id; +/* + * positive conditions for signed compares + */ +static const char *const cmp2condition_s[] = { + NULL, /* always false */ + "e", /* == */ + "l", /* < */ + "le", /* <= */ + "g", /* > */ + "ge", /* >= */ + "ne", /* != */ + NULL /* always true */ +}; - set_entity_backend_marked(entity, 1); - id = get_entity_ld_ident(entity); - be_emit_ident(id); +/* + * positive conditions for unsigned compares + */ +static const char *const cmp2condition_u[] = { + NULL, /* always false */ + "e", /* == */ + "b", /* < */ + "be", /* <= */ + "a", /* > */ + "ae", /* >= */ + "ne", /* != */ + NULL /* always true */ +}; - if (get_entity_owner(entity) == get_tls_type()) { - if (get_entity_visibility(entity) == visibility_external_allocated) { - be_emit_cstring("@INDNTPOFF"); - } else { - be_emit_cstring("@NTPOFF"); - } +/** + * Emit the suffix for a compare instruction. 
+ */ +static void ia32_emit_cmp_suffix(int pnc) +{ + const char *str; + + if (pnc == ia32_pn_Cmp_parity) { + be_emit_char('p'); + return; } - if (!no_pic_adjust && do_pic) { - /* TODO: only do this when necessary */ - be_emit_char('-'); - be_emit_string(pic_base_label); + if (pnc & ia32_pn_Cmp_float || pnc & ia32_pn_Cmp_unsigned) { + str = cmp2condition_u[pnc & 7]; + } else { + str = cmp2condition_s[pnc & 7]; } + + be_emit_string(str); } +typedef enum ia32_emit_mod_t { + EMIT_RESPECT_LS = 1U << 0, + EMIT_ALTERNATE_AM = 1U << 1, + EMIT_LONG = 1U << 2, + EMIT_HIGH_REG = 1U << 3, + EMIT_LOW_REG = 1U << 4 +} ia32_emit_mod_t; + /** * Emits address mode. */ @@ -520,9 +590,10 @@ void ia32_emit_am(const ir_node *node) /* emit offset */ if (ent != NULL) { + const ia32_attr_t *attr = get_ia32_attr_const(node); if (is_ia32_am_sc_sign(node)) be_emit_char('-'); - ia32_emit_entity(ent, 0); + ia32_emit_entity(ent, attr->data.am_sc_no_pic_adjust); } /* also handle special case if nothing is set */ @@ -559,108 +630,322 @@ void ia32_emit_am(const ir_node *node) } } -static void emit_ia32_IMul(const ir_node *node) +/** + * fmt parameter output + * ---- ---------------------- --------------------------------------------- + * %% % + * %AM address mode of the node + * %AR const arch_register_t* address mode of the node or register + * %ASx address mode of the node or source register x + * %Dx destination register x + * %I immediate of the node + * %L control flow target of the node + * %M mode suffix of the node + * %P int condition code + * %R const arch_register_t* register + * %Sx source register x + * %s const char* string + * %u unsigned int unsigned int + * %d signed int signed int + * + * x starts at 0 + * # modifier for %ASx, %D, %R, and %S uses ls mode of node to alter register width + * * modifier does not prefix immediates with $, but AM with * + * l modifier for %lu and %ld + * > modifier to output high 8bit register (ah, bh) + * < modifier to output low 8bit register (al, 
bl) + */ +static void ia32_emitf(const ir_node *node, const char *fmt, ...) { - ir_node *left = get_irn_n(node, n_ia32_IMul_left); - const arch_register_t *out_reg = get_out_reg(node, pn_ia32_IMul_res); + va_list ap; + va_start(ap, fmt); - be_emit_cstring("\timul"); - ia32_emit_mode_suffix(node); - be_emit_char(' '); + for (;;) { + const char *start = fmt; + ia32_emit_mod_t mod = 0; - ia32_emit_binop(node); + while (*fmt != '%' && *fmt != '\n' && *fmt != '\0') + ++fmt; + if (fmt != start) { + be_emit_string_len(start, fmt - start); + } - /* do we need the 3-address form? */ - if (is_ia32_NoReg_GP(left) || - get_in_reg(node, n_ia32_IMul_left) != out_reg) { - be_emit_cstring(", "); - emit_register(out_reg, get_ia32_ls_mode(node)); - } - be_emit_finish_line_gas(node); -} + if (*fmt == '\n') { + be_emit_finish_line_gas(node); + ++fmt; + if (*fmt == '\0') + break; + continue; + } -/************************************************* - * _ _ _ - * (_) | | | - * ___ _ __ ___ _| |_ ___ ___ _ __ __| | - * / _ \ '_ ` _ \| | __| / __/ _ \| '_ \ / _` | - * | __/ | | | | | | |_ | (_| (_) | | | | (_| | - * \___|_| |_| |_|_|\__| \___\___/|_| |_|\__,_| - * - *************************************************/ + if (*fmt == '\0') + break; -#undef IA32_DO_EMIT -#define IA32_DO_EMIT(irn) ia32_fprintf_format(F, irn, cmd_buf, cmnt_buf) + ++fmt; + while (1) { + switch(*fmt) { + case '*': mod |= EMIT_ALTERNATE_AM; break; + case '#': mod |= EMIT_RESPECT_LS; break; + case 'l': mod |= EMIT_LONG; break; + case '>': mod |= EMIT_HIGH_REG; break; + case '<': mod |= EMIT_LOW_REG; break; + default: + goto end_of_mods; + } + ++fmt; + } +end_of_mods: -/* - * coding of conditions - */ -struct cmp2conditon_t { - const char *name; - int num; -}; + switch (*fmt++) { + case '%': + be_emit_char('%'); + break; -/* - * positive conditions for signed compares - */ -static const struct cmp2conditon_t cmp2condition_s[] = { - { NULL, pn_Cmp_False }, /* always false */ - { "e", pn_Cmp_Eq }, /* == */ - { "l", 
pn_Cmp_Lt }, /* < */ - { "le", pn_Cmp_Le }, /* <= */ - { "g", pn_Cmp_Gt }, /* > */ - { "ge", pn_Cmp_Ge }, /* >= */ - { "ne", pn_Cmp_Lg }, /* != */ - { NULL, pn_Cmp_Leg}, /* always true */ -}; + case 'A': { + switch (*fmt++) { +emit_AM: + case 'M': + if (mod & EMIT_ALTERNATE_AM) + be_emit_char('*'); + ia32_emit_am(node); + break; + + case 'R': { + const arch_register_t *reg = va_arg(ap, const arch_register_t*); + if (get_ia32_op_type(node) == ia32_AddrModeS) { + goto emit_AM; + } else { + if (mod & EMIT_ALTERNATE_AM) + be_emit_char('*'); + emit_register(reg, NULL); + } + break; + } + + case 'S': + if (get_ia32_op_type(node) == ia32_AddrModeS) { + ++fmt; + goto emit_AM; + } else { + assert(get_ia32_op_type(node) == ia32_Normal); + goto emit_S; + } + break; + + default: goto unknown; + } + break; + } -/* - * positive conditions for unsigned compares - */ -static const struct cmp2conditon_t cmp2condition_u[] = { - { NULL, pn_Cmp_False }, /* always false */ - { "e", pn_Cmp_Eq }, /* == */ - { "b", pn_Cmp_Lt }, /* < */ - { "be", pn_Cmp_Le }, /* <= */ - { "a", pn_Cmp_Gt }, /* > */ - { "ae", pn_Cmp_Ge }, /* >= */ - { "ne", pn_Cmp_Lg }, /* != */ - { NULL, pn_Cmp_Leg }, /* always true */ -}; + case 'D': { + unsigned pos; + const arch_register_t *reg; -/** - * walks up a tree of copies/perms/spills/reloads to find the original value - * that is moved around - */ -static ir_node *find_original_value(ir_node *node) -{ - if (irn_visited(node)) - return NULL; + if (*fmt < '0' || '9' <= *fmt) + goto unknown; - mark_irn_visited(node); - if (be_is_Copy(node)) { - return find_original_value(be_get_Copy_op(node)); - } else if (be_is_CopyKeep(node)) { - return find_original_value(be_get_CopyKeep_op(node)); - } else if (is_Proj(node)) { - ir_node *pred = get_Proj_pred(node); - if (be_is_Perm(pred)) { - return find_original_value(get_irn_n(pred, get_Proj_proj(node))); - } else if (be_is_MemPerm(pred)) { - return find_original_value(get_irn_n(pred, get_Proj_proj(node) + 1)); - } else if 
(is_ia32_Load(pred)) { - return find_original_value(get_irn_n(pred, n_ia32_Load_mem)); - } else { - return node; - } - } else if (is_ia32_Store(node)) { - return find_original_value(get_irn_n(node, n_ia32_Store_val)); - } else if (is_Phi(node)) { - int i, arity; - arity = get_irn_arity(node); - for (i = 0; i < arity; ++i) { - ir_node *in = get_irn_n(node, i); - ir_node *res = find_original_value(in); + pos = *fmt++ - '0'; + reg = get_out_reg(node, pos); + emit_register(reg, mod & EMIT_RESPECT_LS ? get_ia32_ls_mode(node) : NULL); + break; + } + + case 'I': + if (!(mod & EMIT_ALTERNATE_AM)) + be_emit_char('$'); + emit_ia32_Immediate_no_prefix(node); + break; + + case 'L': + ia32_emit_cfop_target(node); + break; + + case 'M': { + ia32_emit_mode_suffix_mode(get_ia32_ls_mode(node)); + break; + } + + case 'P': { + int pnc = va_arg(ap, int); + ia32_emit_cmp_suffix(pnc); + break; + } + + case 'R': { + const arch_register_t *reg = va_arg(ap, const arch_register_t*); + if (mod & EMIT_HIGH_REG) { + emit_8bit_register_high(reg); + } else if (mod & EMIT_LOW_REG) { + emit_8bit_register(reg); + } else { + emit_register(reg, mod & EMIT_RESPECT_LS ? get_ia32_ls_mode(node) : NULL); + } + break; + } + +emit_S: + case 'S': { + unsigned pos; + const ir_node *in; + + if (*fmt < '0' || '9' <= *fmt) + goto unknown; + + pos = *fmt++ - '0'; + in = get_irn_n(node, pos); + if (is_ia32_Immediate(in)) { + if (!(mod & EMIT_ALTERNATE_AM)) + be_emit_char('$'); + emit_ia32_Immediate_no_prefix(in); + } else { + const arch_register_t *reg; + + if (mod & EMIT_ALTERNATE_AM) + be_emit_char('*'); + reg = get_in_reg(node, pos); + emit_register(reg, mod & EMIT_RESPECT_LS ? 
get_ia32_ls_mode(node) : NULL); + } + break; + } + + case 's': { + const char *str = va_arg(ap, const char*); + be_emit_string(str); + break; + } + + case 'u': + if (mod & EMIT_LONG) { + unsigned long num = va_arg(ap, unsigned long); + be_emit_irprintf("%lu", num); + } else { + unsigned num = va_arg(ap, unsigned); + be_emit_irprintf("%u", num); + } + break; + + case 'd': + if (mod & EMIT_LONG) { + long num = va_arg(ap, long); + be_emit_irprintf("%ld", num); + } else { + int num = va_arg(ap, int); + be_emit_irprintf("%d", num); + } + break; + + default: +unknown: + panic("unknown format conversion in ia32_emitf()"); + } + } + + va_end(ap); +} + +/** + * Emits registers and/or address mode of a binary operation. + */ +void ia32_emit_binop(const ir_node *node) +{ + if (is_ia32_Immediate(get_irn_n(node, n_ia32_binary_right))) { + ia32_emitf(node, "%#S4, %#AS3"); + } else { + ia32_emitf(node, "%#AS4, %#S3"); + } +} + +/** + * Emits registers and/or address mode of a binary operation. + */ +void ia32_emit_x87_binop(const ir_node *node) +{ + switch(get_ia32_op_type(node)) { + case ia32_Normal: + { + const ia32_x87_attr_t *x87_attr = get_ia32_x87_attr_const(node); + const arch_register_t *in1 = x87_attr->x87[0]; + const arch_register_t *in = x87_attr->x87[1]; + const arch_register_t *out = x87_attr->x87[2]; + + if (out == NULL) { + out = in1; + } else if (out == in) { + in = in1; + } + + be_emit_char('%'); + be_emit_string(arch_register_get_name(in)); + be_emit_cstring(", %"); + be_emit_string(arch_register_get_name(out)); + } + break; + case ia32_AddrModeS: + ia32_emit_am(node); + break; + case ia32_AddrModeD: + default: + assert(0 && "unsupported op type"); + } +} + +/** + * Emits registers and/or address mode of a unary operation. 
+ */ +void ia32_emit_unop(const ir_node *node, int pos) +{ + char fmt[] = "%ASx"; + fmt[3] = '0' + pos; + ia32_emitf(node, fmt); +} + +static void emit_ia32_IMul(const ir_node *node) +{ + ir_node *left = get_irn_n(node, n_ia32_IMul_left); + const arch_register_t *out_reg = get_out_reg(node, pn_ia32_IMul_res); + + /* do we need the 3-address form? */ + if (is_ia32_NoReg_GP(left) || + get_in_reg(node, n_ia32_IMul_left) != out_reg) { + ia32_emitf(node, "\timul%M %#S4, %#AS3, %#D0\n"); + } else { + ia32_emitf(node, "\timul%M %#AS4, %#S3\n"); + } +} + +/** + * walks up a tree of copies/perms/spills/reloads to find the original value + * that is moved around + */ +static ir_node *find_original_value(ir_node *node) +{ + if (irn_visited(node)) + return NULL; + + mark_irn_visited(node); + if (be_is_Copy(node)) { + return find_original_value(be_get_Copy_op(node)); + } else if (be_is_CopyKeep(node)) { + return find_original_value(be_get_CopyKeep_op(node)); + } else if (is_Proj(node)) { + ir_node *pred = get_Proj_pred(node); + if (be_is_Perm(pred)) { + return find_original_value(get_irn_n(pred, get_Proj_proj(node))); + } else if (be_is_MemPerm(pred)) { + return find_original_value(get_irn_n(pred, get_Proj_proj(node) + 1)); + } else if (is_ia32_Load(pred)) { + return find_original_value(get_irn_n(pred, n_ia32_Load_mem)); + } else { + return node; + } + } else if (is_ia32_Store(node)) { + return find_original_value(get_irn_n(node, n_ia32_Store_val)); + } else if (is_Phi(node)) { + int i, arity; + arity = get_irn_arity(node); + for (i = 0; i < arity; ++i) { + ir_node *in = get_irn_n(node, i); + ir_node *res = find_original_value(in); if (res != NULL) return res; @@ -671,8 +956,7 @@ static ir_node *find_original_value(ir_node *node) } } -static int determine_final_pnc(const ir_node *node, int flags_pos, - int pnc) +static int determine_final_pnc(const ir_node *node, int flags_pos, int pnc) { ir_node *flags = get_irn_n(node, flags_pos); const ia32_attr_t *flags_attr; @@ -701,10 
+985,6 @@ static int determine_final_pnc(const ir_node *node, int flags_pos, pnc = get_mirrored_pnc(pnc); pnc |= ia32_pn_Cmp_float; } else { -#if 0 - assert(is_ia32_Cmp(flags) || is_ia32_Test(flags) - || is_ia32_Cmp8Bit(flags) || is_ia32_Test8Bit(flags)); -#endif flags_attr = get_ia32_attr_const(flags); if (flags_attr->data.ins_permuted) @@ -716,21 +996,10 @@ static int determine_final_pnc(const ir_node *node, int flags_pos, return pnc; } -static void ia32_emit_cmp_suffix(int pnc) +static pn_Cmp ia32_get_negated_pnc(pn_Cmp pnc) { - const char *str; - - if ((pnc & ia32_pn_Cmp_float) || (pnc & ia32_pn_Cmp_unsigned)) { - pnc = pnc & 7; - assert(cmp2condition_u[pnc].num == pnc); - str = cmp2condition_u[pnc].name; - } else { - pnc = pnc & 7; - assert(cmp2condition_s[pnc].num == pnc); - str = cmp2condition_s[pnc].name; - } - - be_emit_string(str); + ir_mode *mode = pnc & ia32_pn_Cmp_float ? mode_F : mode_Iu; + return get_negated_pnc(pnc, mode); } void ia32_emit_cmp_suffix_node(const ir_node *node, @@ -741,40 +1010,12 @@ void ia32_emit_cmp_suffix_node(const ir_node *node, pn_Cmp pnc = get_ia32_condcode(node); pnc = determine_final_pnc(node, flags_pos, pnc); - if (attr->data.ins_permuted) { - if (pnc & ia32_pn_Cmp_float) { - pnc = get_negated_pnc(pnc, mode_F); - } else { - pnc = get_negated_pnc(pnc, mode_Iu); - } - } + if (attr->data.ins_permuted) + pnc = ia32_get_negated_pnc(pnc); ia32_emit_cmp_suffix(pnc); } -/** - * Returns the target block for a control flow node. - */ -static ir_node *get_cfop_target_block(const ir_node *irn) -{ - assert(get_irn_mode(irn) == mode_X); - return get_irn_link(irn); -} - -/** - * Emits a block label for the given block. 
- */ -static void ia32_emit_block_name(const ir_node *block) -{ - if (has_Block_label(block)) { - be_emit_string(be_gas_block_label_prefix()); - be_emit_irprintf("%lu", get_Block_label(block)); - } else { - be_emit_cstring(BLOCK_PREFIX); - be_emit_irprintf("%ld", get_irn_node_nr(block)); - } -} - /** * Emits an exception label for a given node. */ @@ -784,16 +1025,6 @@ static void ia32_emit_exc_label(const ir_node *node) be_emit_irprintf("%lu", get_ia32_exc_label_id(node)); } -/** - * Emits the target label for a control flow node. - */ -static void ia32_emit_cfop_target(const ir_node *node) -{ - ir_node *block = get_cfop_target_block(node); - - ia32_emit_block_name(block); -} - /** * Returns the Proj with projection number proj and NOT mode_M */ @@ -852,98 +1083,120 @@ static void emit_ia32_Jcc(const ir_node *node) proj_true = proj_false; proj_false = t; - if (pnc & ia32_pn_Cmp_float) { - pnc = get_negated_pnc(pnc, mode_F); - } else { - pnc = get_negated_pnc(pnc, mode_Iu); - } + pnc = ia32_get_negated_pnc(pnc); } if (pnc & ia32_pn_Cmp_float) { /* Some floating point comparisons require a test of the parity flag, * which indicates that the result is unordered */ - switch (pnc & 15) { - case pn_Cmp_Uo: { - be_emit_cstring("\tjp "); - ia32_emit_cfop_target(proj_true); - be_emit_finish_line_gas(proj_true); - break; - } + switch (pnc & 0x0f) { + case pn_Cmp_Uo: { + ia32_emitf(proj_true, "\tjp %L\n"); + break; + } - case pn_Cmp_Leg: - be_emit_cstring("\tjnp "); - ia32_emit_cfop_target(proj_true); - be_emit_finish_line_gas(proj_true); - break; + case pn_Cmp_Leg: + ia32_emitf(proj_true, "\tjnp %L\n"); + break; - case pn_Cmp_Eq: - case pn_Cmp_Lt: - case pn_Cmp_Le: - /* we need a local label if the false proj is a fallthrough - * as the falseblock might have no label emitted then */ - if (can_be_fallthrough(proj_false)) { - need_parity_label = 1; - be_emit_cstring("\tjp 1f"); - } else { - be_emit_cstring("\tjp "); - ia32_emit_cfop_target(proj_false); - } - 
be_emit_finish_line_gas(proj_false); - goto emit_jcc; + case pn_Cmp_Eq: + case pn_Cmp_Lt: + case pn_Cmp_Le: + /* we need a local label if the false proj is a fallthrough + * as the falseblock might have no label emitted then */ + if (can_be_fallthrough(proj_false)) { + need_parity_label = 1; + ia32_emitf(proj_false, "\tjp 1f\n"); + } else { + ia32_emitf(proj_false, "\tjp %L\n"); + } + goto emit_jcc; - case pn_Cmp_Ug: - case pn_Cmp_Uge: - case pn_Cmp_Ne: - be_emit_cstring("\tjp "); - ia32_emit_cfop_target(proj_true); - be_emit_finish_line_gas(proj_true); - goto emit_jcc; + case pn_Cmp_Ug: + case pn_Cmp_Uge: + case pn_Cmp_Ne: + ia32_emitf(proj_true, "\tjp %L\n"); + goto emit_jcc; - default: - goto emit_jcc; + default: + goto emit_jcc; } } else { emit_jcc: - be_emit_cstring("\tj"); - ia32_emit_cmp_suffix(pnc); - be_emit_char(' '); - ia32_emit_cfop_target(proj_true); - be_emit_finish_line_gas(proj_true); + ia32_emitf(proj_true, "\tj%P %L\n", pnc); } if (need_parity_label) { - be_emit_cstring("1:"); - be_emit_write_line(); + ia32_emitf(NULL, "1:\n"); } /* the second Proj might be a fallthrough */ if (can_be_fallthrough(proj_false)) { - be_emit_cstring("\t/* fallthrough to "); - ia32_emit_cfop_target(proj_false); - be_emit_cstring(" */"); - be_emit_finish_line_gas(proj_false); + ia32_emitf(proj_false, "\t/* fallthrough to %L */\n"); } else { - be_emit_cstring("\tjmp "); - ia32_emit_cfop_target(proj_false); - be_emit_finish_line_gas(proj_false); + ia32_emitf(proj_false, "\tjmp %L\n"); + } +} + +/** + * Emits an ia32 Setcc. This is mostly easy but some floating point compares + * are tricky. 
+ */ +static void emit_ia32_Setcc(const ir_node *node) +{ + const arch_register_t *dreg = get_out_reg(node, pn_ia32_Setcc_res); + + pn_Cmp pnc = get_ia32_condcode(node); + pnc = determine_final_pnc(node, n_ia32_Setcc_eflags, pnc); + if (pnc & ia32_pn_Cmp_float) { + switch (pnc & 0x0f) { + case pn_Cmp_Uo: + ia32_emitf(node, "\tsetp %#R\n", dreg); + return; + + case pn_Cmp_Leg: + ia32_emitf(node, "\tsetnp %#R\n", dreg); + return; + + case pn_Cmp_Eq: + case pn_Cmp_Lt: + case pn_Cmp_Le: + ia32_emitf(node, "\tset%P %R\n", dreg); + ia32_emitf(node, "\tandb %>R, %R\n", dreg); + ia32_emitf(node, "\torb %>R, %data.ins_permuted; - const arch_register_t *out = arch_get_irn_register(arch_env, node); + const arch_register_t *out = arch_irn_get_register(node, pn_ia32_res); pn_Cmp pnc = get_ia32_condcode(node); const arch_register_t *in_true; const arch_register_t *in_false; - pnc = determine_final_pnc(node, n_ia32_CMov_eflags, pnc); + pnc = determine_final_pnc(node, n_ia32_CMovcc_eflags, pnc); + /* although you can't set ins_permuted in the constructor it might still + be set by memory operand folding */ + if (attr->data.ins_permuted) + pnc = ia32_get_negated_pnc(pnc); - in_true = arch_get_irn_register(arch_env, - get_irn_n(node, n_ia32_CMov_val_true)); - in_false = arch_get_irn_register(arch_env, - get_irn_n(node, n_ia32_CMov_val_false)); + in_true = arch_get_irn_register(get_irn_n(node, n_ia32_CMovcc_val_true)); + in_false = arch_get_irn_register(get_irn_n(node, n_ia32_CMovcc_val_false)); /* should be same constraint fullfilled? 
*/ if (out == in_false) { @@ -953,41 +1206,32 @@ static void emit_ia32_CMov(const ir_node *node) assert(get_ia32_op_type(node) == ia32_Normal); - ins_permuted = !ins_permuted; + pnc = ia32_get_negated_pnc(pnc); tmp = in_true; in_true = in_false; in_false = tmp; } else { /* we need a mov */ - be_emit_cstring("\tmovl "); - emit_register(in_false, NULL); - be_emit_cstring(", "); - emit_register(out, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tmovl %R, %R\n", in_false, out); } - if (ins_permuted) { - if (pnc & ia32_pn_Cmp_float) { - pnc = get_negated_pnc(pnc, mode_F); - } else { - pnc = get_negated_pnc(pnc, mode_Iu); + /* TODO: handling of Nans isn't correct yet */ + if (pnc & ia32_pn_Cmp_float) { + switch (pnc & 0x0f) { + case pn_Cmp_Uo: + case pn_Cmp_Leg: + case pn_Cmp_Eq: + case pn_Cmp_Lt: + case pn_Cmp_Le: + case pn_Cmp_Ug: + case pn_Cmp_Uge: + case pn_Cmp_Ne: + panic("CMov with floatingpoint compare/parity not supported yet"); } } - /* TODO: handling of Nans isn't correct yet */ - - be_emit_cstring("\tcmov"); - ia32_emit_cmp_suffix(pnc); - be_emit_char(' '); - if (get_ia32_op_type(node) == ia32_AddrModeS) { - ia32_emit_am(node); - } else { - emit_register(in_true, get_ia32_ls_mode(node)); - } - be_emit_cstring(", "); - emit_register(out, get_ia32_ls_mode(node)); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tcmov%P %#AR, %#R\n", pnc, in_true, out); } /********************************************************* @@ -1009,12 +1253,12 @@ typedef struct _branch_t { /* jump table for switch generation */ typedef struct _jmp_tbl_t { - ir_node *defProj; /**< default target */ - long min_value; /**< smallest switch case */ - long max_value; /**< largest switch case */ - long num_branches; /**< number of jumps */ - char *label; /**< label of the jump table */ - branch_t *branches; /**< jump array */ + ir_node *defProj; /**< default target */ + long min_value; /**< smallest switch case */ + long max_value; /**< largest switch case */ + long 
num_branches; /**< number of jumps */ + char label[SNPRINTF_BUF_LEN]; /**< label of the jump table */ + branch_t *branches; /**< jump array */ } jmp_tbl_t; /** @@ -1031,29 +1275,21 @@ static int ia32_cmp_branch_t(const void *a, const void *b) return 1; } -/** - * Emits code for a SwitchJmp (creates a jump table if - * possible otherwise a cmp-jmp cascade). Port from - * cggg ia32 backend - */ -static void emit_ia32_SwitchJmp(const ir_node *node) +static void generate_jump_table(jmp_tbl_t *tbl, const ir_node *node) { - unsigned long interval; - int last_value, i; + int i; long pnc; long default_pn; - jmp_tbl_t tbl; ir_node *proj; const ir_edge_t *edge; /* fill the table structure */ - tbl.label = xmalloc(SNPRINTF_BUF_LEN); - tbl.label = get_unique_label(tbl.label, SNPRINTF_BUF_LEN, ".TBL_"); - tbl.defProj = NULL; - tbl.num_branches = get_irn_n_edges(node) - 1; - tbl.branches = xcalloc(tbl.num_branches, sizeof(tbl.branches[0])); - tbl.min_value = INT_MAX; - tbl.max_value = INT_MIN; + get_unique_label(tbl->label, SNPRINTF_BUF_LEN, ".TBL_"); + tbl->defProj = NULL; + tbl->num_branches = get_irn_n_edges(node) - 1; + tbl->branches = XMALLOCNZ(branch_t, tbl->num_branches); + tbl->min_value = LONG_MAX; + tbl->max_value = LONG_MIN; default_pn = get_ia32_condcode(node); i = 0; @@ -1066,87 +1302,76 @@ static void emit_ia32_SwitchJmp(const ir_node *node) /* check for default proj */ if (pnc == default_pn) { - assert(tbl.defProj == NULL && "found two default Projs at SwitchJmp"); - tbl.defProj = proj; + assert(tbl->defProj == NULL && "found two default Projs at SwitchJmp"); + tbl->defProj = proj; } else { - tbl.min_value = pnc < tbl.min_value ? pnc : tbl.min_value; - tbl.max_value = pnc > tbl.max_value ? pnc : tbl.max_value; + tbl->min_value = pnc < tbl->min_value ? pnc : tbl->min_value; + tbl->max_value = pnc > tbl->max_value ? 
pnc : tbl->max_value; /* create branch entry */ - tbl.branches[i].target = proj; - tbl.branches[i].value = pnc; + tbl->branches[i].target = proj; + tbl->branches[i].value = pnc; ++i; } } - assert(i == tbl.num_branches); + assert(i == tbl->num_branches); /* sort the branches by their number */ - qsort(tbl.branches, tbl.num_branches, sizeof(tbl.branches[0]), ia32_cmp_branch_t); + qsort(tbl->branches, tbl->num_branches, sizeof(tbl->branches[0]), ia32_cmp_branch_t); +} + +/** + * Emits code for a SwitchJmp (creates a jump table if + * possible otherwise a cmp-jmp cascade). Port from + * cggg ia32 backend + */ +static void emit_ia32_SwitchJmp(const ir_node *node) +{ + unsigned long interval; + int last_value, i; + jmp_tbl_t tbl; + + /* fill the table structure */ + generate_jump_table(&tbl, node); /* two-complement's magic make this work without overflow */ interval = tbl.max_value - tbl.min_value; /* emit the table */ - be_emit_cstring("\tcmpl $"); - be_emit_irprintf("%u, ", interval); - ia32_emit_source_register(node, 0); - be_emit_finish_line_gas(node); - - be_emit_cstring("\tja "); - ia32_emit_cfop_target(tbl.defProj); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tcmpl $%u, %S0\n", interval); + ia32_emitf(tbl.defProj, "\tja %L\n"); if (tbl.num_branches > 1) { /* create table */ - be_emit_cstring("\tjmp *"); - be_emit_string(tbl.label); - be_emit_cstring("(,"); - ia32_emit_source_register(node, 0); - be_emit_cstring(",4)"); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tjmp *%s(,%S0,4)\n", tbl.label); be_gas_emit_switch_section(GAS_SECTION_RODATA); - be_emit_cstring("\t.align 4\n"); - be_emit_write_line(); - - be_emit_string(tbl.label); - be_emit_cstring(":\n"); - be_emit_write_line(); - - be_emit_cstring(".long "); - ia32_emit_cfop_target(tbl.branches[0].target); - be_emit_finish_line_gas(NULL); + ia32_emitf(NULL, "\t.align 4\n"); + ia32_emitf(NULL, "%s:\n", tbl.label); last_value = tbl.branches[0].value; - for (i = 1; i < tbl.num_branches; ++i) { - 
while (++last_value < tbl.branches[i].value) { - be_emit_cstring(".long "); - ia32_emit_cfop_target(tbl.defProj); - be_emit_finish_line_gas(NULL); + for (i = 0; i != tbl.num_branches; ++i) { + while (last_value != tbl.branches[i].value) { + ia32_emitf(tbl.defProj, ".long %L\n"); + ++last_value; } - be_emit_cstring(".long "); - ia32_emit_cfop_target(tbl.branches[i].target); - be_emit_finish_line_gas(NULL); + ia32_emitf(tbl.branches[i].target, ".long %L\n"); + ++last_value; } be_gas_emit_switch_section(GAS_SECTION_TEXT); } else { /* one jump is enough */ - be_emit_cstring("\tjmp "); - ia32_emit_cfop_target(tbl.branches[0].target); - be_emit_finish_line_gas(node); + ia32_emitf(tbl.branches[0].target, "\tjmp %L\n"); } - if (tbl.label) - free(tbl.label); - if (tbl.branches) - free(tbl.branches); + free(tbl.branches); } /** * Emits code for a unconditional jump. */ -static void emit_Jmp(const ir_node *node) +static void emit_ia32_Jmp(const ir_node *node) { ir_node *block; @@ -1155,32 +1380,9 @@ static void emit_Jmp(const ir_node *node) /* we have a block schedule */ if (can_be_fallthrough(node)) { - be_emit_cstring("\t/* fallthrough to "); - ia32_emit_cfop_target(node); - be_emit_cstring(" */"); + ia32_emitf(node, "\t/* fallthrough to %L */\n"); } else { - be_emit_cstring("\tjmp "); - ia32_emit_cfop_target(node); - } - be_emit_finish_line_gas(node); -} - -static void emit_ia32_Immediate(const ir_node *node) -{ - const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(node); - - be_emit_char('$'); - if (attr->symconst != NULL) { - if (attr->sc_sign) - be_emit_char('-'); - ia32_emit_entity(attr->symconst, 0); - } - if (attr->symconst == NULL || attr->offset != 0) { - if (attr->symconst != NULL) { - be_emit_irprintf("%+d", attr->offset); - } else { - be_emit_irprintf("0x%X", attr->offset); - } + ia32_emitf(node, "\tjmp %L\n"); } } @@ -1212,7 +1414,7 @@ static const char* emit_asm_operand(const ir_node *node, const char *s) /* parse modifiers */ switch(c) { case 0: 
- ir_fprintf(stderr, "Warning: asm text (%+F) ends with %\n", node); + ir_fprintf(stderr, "Warning: asm text (%+F) ends with %%\n", node); be_emit_char('%'); return s + 1; case '%': @@ -1236,8 +1438,9 @@ static const char* emit_asm_operand(const ir_node *node, const char *s) case '9': break; default: - ir_fprintf(stderr, "Warning: asm text (%+F) contains unknown modifier " - "'%c' for asm op\n", node, c); + ir_fprintf(stderr, + "Warning: asm text (%+F) contains unknown modifier '%c' for asm op\n", + node, c); ++s; break; } @@ -1252,9 +1455,10 @@ static const char* emit_asm_operand(const ir_node *node, const char *s) s += p; } - if (num < 0 || num >= ARR_LEN(asm_regs)) { - ir_fprintf(stderr, "Error: Custom assembler references invalid " - "input/output (%+F)\n", node); + if (num < 0 || ARR_LEN(asm_regs) <= num) { + ir_fprintf(stderr, + "Error: Custom assembler references invalid input/output (%+F)\n", + node); return s; } asm_reg = & asm_regs[num]; @@ -1274,8 +1478,9 @@ static const char* emit_asm_operand(const ir_node *node, const char *s) reg = get_in_reg(node, asm_reg->inout_pos); } if (reg == NULL) { - ir_fprintf(stderr, "Warning: no register assigned for %d asm op " - "(%+F)\n", num, node); + ir_fprintf(stderr, + "Warning: no register assigned for %d asm op (%+F)\n", + num, node); return s; } @@ -1322,8 +1527,7 @@ static void emit_ia32_Asm(const ir_node *node) ident *asm_text = attr->asm_text; const char *s = get_id_str(asm_text); - be_emit_cstring("#APP\t"); - be_emit_finish_line_gas(node); + ia32_emitf(node, "#APP\t\n"); if (s[0] != '\t') be_emit_char('\t'); @@ -1336,11 +1540,7 @@ static void emit_ia32_Asm(const ir_node *node) } } - be_emit_char('\n'); - be_emit_write_line(); - - be_emit_cstring("#NO_APP\n"); - be_emit_write_line(); + ia32_emitf(NULL, "\n#NO_APP\n"); } /********************************** @@ -1359,25 +1559,10 @@ static void emit_ia32_Asm(const ir_node *node) */ static void emit_CopyB_prolog(unsigned size) { - be_emit_cstring("\tcld"); - 
be_emit_finish_line_gas(NULL); - - switch (size) { - case 1: - be_emit_cstring("\tmovsb"); - be_emit_finish_line_gas(NULL); - break; - case 2: - be_emit_cstring("\tmovsw"); - be_emit_finish_line_gas(NULL); - break; - case 3: - be_emit_cstring("\tmovsb"); - be_emit_finish_line_gas(NULL); - be_emit_cstring("\tmovsw"); - be_emit_finish_line_gas(NULL); - break; - } + if (size & 1) + ia32_emitf(NULL, "\tmovsb\n"); + if (size & 2) + ia32_emitf(NULL, "\tmovsw\n"); } /** @@ -1388,9 +1573,7 @@ static void emit_ia32_CopyB(const ir_node *node) unsigned size = get_ia32_copyb_size(node); emit_CopyB_prolog(size); - - be_emit_cstring("\trep movsd"); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\trep movsd\n"); } /** @@ -1400,12 +1583,11 @@ static void emit_ia32_CopyB_i(const ir_node *node) { unsigned size = get_ia32_copyb_size(node); - emit_CopyB_prolog(size & 0x3); + emit_CopyB_prolog(size); size >>= 2; while (size--) { - be_emit_cstring("\tmovsd"); - be_emit_finish_line_gas(NULL); + ia32_emitf(NULL, "\tmovsd\n"); } } @@ -1424,63 +1606,29 @@ static void emit_ia32_CopyB_i(const ir_node *node) /** * Emit code for conversions (I, FP), (FP, I) and (FP, FP). */ -static void emit_ia32_Conv_with_FP(const ir_node *node) +static void emit_ia32_Conv_with_FP(const ir_node *node, const char* conv_f, + const char* conv_d) { ir_mode *ls_mode = get_ia32_ls_mode(node); int ls_bits = get_mode_size_bits(ls_mode); + const char *conv = ls_bits == 32 ? 
conv_f : conv_d; - be_emit_cstring("\tcvt"); - - if (is_ia32_Conv_I2FP(node)) { - if (ls_bits == 32) { - be_emit_cstring("si2ss"); - } else { - be_emit_cstring("si2sd"); - } - } else if (is_ia32_Conv_FP2I(node)) { - if (ls_bits == 32) { - be_emit_cstring("ss2si"); - } else { - be_emit_cstring("sd2si"); - } - } else { - assert(is_ia32_Conv_FP2FP(node)); - if (ls_bits == 32) { - be_emit_cstring("sd2ss"); - } else { - be_emit_cstring("ss2sd"); - } - } - be_emit_char(' '); - - switch(get_ia32_op_type(node)) { - case ia32_Normal: - ia32_emit_source_register(node, n_ia32_unary_op); - break; - case ia32_AddrModeS: - ia32_emit_am(node); - break; - default: - assert(0 && "unsupported op type for Conv"); - } - be_emit_cstring(", "); - ia32_emit_dest_register(node, 0); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tcvt%s %AS3, %D0\n", conv); } static void emit_ia32_Conv_I2FP(const ir_node *node) { - emit_ia32_Conv_with_FP(node); + emit_ia32_Conv_with_FP(node, "si2ss", "si2sd"); } static void emit_ia32_Conv_FP2I(const ir_node *node) { - emit_ia32_Conv_with_FP(node); + emit_ia32_Conv_with_FP(node, "ss2si", "sd2si"); } static void emit_ia32_Conv_FP2FP(const ir_node *node) { - emit_ia32_Conv_with_FP(node); + emit_ia32_Conv_with_FP(node, "sd2ss", "ss2sd"); } /** @@ -1488,56 +1636,24 @@ static void emit_ia32_Conv_FP2FP(const ir_node *node) */ static void emit_ia32_Conv_I2I(const ir_node *node) { - const char *sign_suffix; - ir_mode *smaller_mode = get_ia32_ls_mode(node); - int smaller_bits = get_mode_size_bits(smaller_mode); - int signed_mode; - const arch_register_t *in_reg, *out_reg; + ir_mode *smaller_mode = get_ia32_ls_mode(node); + int signed_mode = mode_is_signed(smaller_mode); + const char *sign_suffix; assert(!mode_is_float(smaller_mode)); - assert(smaller_bits == 8 || smaller_bits == 16); - signed_mode = mode_is_signed(smaller_mode); sign_suffix = signed_mode ? 
"s" : "z"; + ia32_emitf(node, "\tmov%s%Ml %#AS3, %D0\n", sign_suffix); +} - out_reg = get_out_reg(node, 0); - - switch(get_ia32_op_type(node)) { - case ia32_Normal: - in_reg = get_in_reg(node, n_ia32_unary_op); - - if (in_reg == &ia32_gp_regs[REG_EAX] && - out_reg == &ia32_gp_regs[REG_EAX] && - signed_mode && - smaller_bits == 16) - { - /* argument and result are both in EAX and */ - /* signedness is ok: -> use the smaller cwtl opcode */ - be_emit_cstring("\tcwtl"); - } else { - be_emit_cstring("\tmov"); - be_emit_string(sign_suffix); - ia32_emit_mode_suffix_mode(smaller_mode); - be_emit_cstring("l "); - emit_register(in_reg, smaller_mode); - be_emit_cstring(", "); - emit_register(out_reg, NULL); - } - break; - case ia32_AddrModeS: { - be_emit_cstring("\tmov"); - be_emit_string(sign_suffix); - ia32_emit_mode_suffix_mode(smaller_mode); - be_emit_cstring("l "); - ia32_emit_am(node); - be_emit_cstring(", "); - emit_register(out_reg, NULL); - break; - } - default: - panic("unsupported op type for Conv"); - } - be_emit_finish_line_gas(node); +/** + * Emits a call + */ +static void emit_ia32_Call(const ir_node *node) +{ + /* Special case: Call must not have its immediates prefixed by $, instead + * address mode is prefixed by *. */ + ia32_emitf(node, "\tcall %*AS3\n"); } @@ -1551,45 +1667,31 @@ static void emit_ia32_Conv_I2I(const ir_node *node) * *******************************************/ -/** - * Emits a backend call - */ -static void emit_be_Call(const ir_node *node) -{ - ir_entity *ent = be_Call_get_entity(node); - - be_emit_cstring("\tcall "); - if (ent) { - ia32_emit_entity(ent, 1); - } else { - const arch_register_t *reg = get_in_reg(node, be_pos_Call_ptr); - be_emit_char('*'); - emit_register(reg, NULL); - } - be_emit_finish_line_gas(node); -} - /** * Emits code to increase stack pointer. 
*/ static void emit_be_IncSP(const ir_node *node) { - int offs = be_get_IncSP_offset(node); - const arch_register_t *reg = arch_get_irn_register(arch_env, node); + int offs = be_get_IncSP_offset(node); if (offs == 0) return; if (offs > 0) { - be_emit_cstring("\tsubl $"); - be_emit_irprintf("%u, ", offs); - emit_register(reg, NULL); + ia32_emitf(node, "\tsubl $%u, %D0\n", offs); } else { - be_emit_cstring("\taddl $"); - be_emit_irprintf("%u, ", -offs); - emit_register(reg, NULL); + ia32_emitf(node, "\taddl $%u, %D0\n", -offs); } - be_emit_finish_line_gas(node); +} + +static inline bool is_unknown_reg(const arch_register_t *reg) +{ + if(reg == &ia32_gp_regs[REG_GP_UKNWN] + || reg == &ia32_xmm_regs[REG_XMM_UKNWN] + || reg == &ia32_vfp_regs[REG_VFP_UKNWN]) + return true; + + return false; } /** @@ -1597,9 +1699,8 @@ static void emit_be_IncSP(const ir_node *node) */ static void Copy_emitter(const ir_node *node, const ir_node *op) { - const arch_register_t *in = arch_get_irn_register(arch_env, op); - const arch_register_t *out = arch_get_irn_register(arch_env, node); - ir_mode *mode; + const arch_register_t *in = arch_get_irn_register(op); + const arch_register_t *out = arch_get_irn_register(node); if (in == out) { return; @@ -1610,19 +1711,11 @@ static void Copy_emitter(const ir_node *node, const ir_node *op) if (arch_register_get_class(in) == &ia32_reg_classes[CLASS_ia32_vfp]) return; - mode = get_irn_mode(node); - if (mode == mode_E) { - be_emit_cstring("\tmovsd "); - emit_register(in, NULL); - be_emit_cstring(", "); - emit_register(out, NULL); + if (get_irn_mode(node) == mode_E) { + ia32_emitf(node, "\tmovsd %R, %R\n", in, out); } else { - be_emit_cstring("\tmovl "); - emit_register(in, NULL); - be_emit_cstring(", "); - emit_register(out, NULL); + ia32_emitf(node, "\tmovl %R, %R\n", in, out); } - be_emit_finish_line_gas(node); } static void emit_be_Copy(const ir_node *node) @@ -1643,8 +1736,8 @@ static void emit_be_Perm(const ir_node *node) const arch_register_t 
*in0, *in1; const arch_register_class_t *cls0, *cls1; - in0 = arch_get_irn_register(arch_env, get_irn_n(node, 0)); - in1 = arch_get_irn_register(arch_env, get_irn_n(node, 1)); + in0 = arch_get_irn_register(get_irn_n(node, 0)); + in1 = arch_get_irn_register(get_irn_n(node, 1)); cls0 = arch_register_get_class(in0); cls1 = arch_register_get_class(in1); @@ -1652,29 +1745,11 @@ static void emit_be_Perm(const ir_node *node) assert(cls0 == cls1 && "Register class mismatch at Perm"); if (cls0 == &ia32_reg_classes[CLASS_ia32_gp]) { - be_emit_cstring("\txchg "); - emit_register(in1, NULL); - be_emit_cstring(", "); - emit_register(in0, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\txchg %R, %R\n", in1, in0); } else if (cls0 == &ia32_reg_classes[CLASS_ia32_xmm]) { - be_emit_cstring("\txorpd "); - emit_register(in1, NULL); - be_emit_cstring(", "); - emit_register(in0, NULL); - be_emit_finish_line_gas(NULL); - - be_emit_cstring("\txorpd "); - emit_register(in0, NULL); - be_emit_cstring(", "); - emit_register(in1, NULL); - be_emit_finish_line_gas(NULL); - - be_emit_cstring("\txorpd "); - emit_register(in1, NULL); - be_emit_cstring(", "); - emit_register(in0, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(NULL, "\txorpd %R, %R\n", in1, in0); + ia32_emitf(NULL, "\txorpd %R, %R\n", in0, in1); + ia32_emitf(node, "\txorpd %R, %R\n", in1, in0); } else if (cls0 == &ia32_reg_classes[CLASS_ia32_vfp]) { /* is a NOP */ } else if (cls0 == &ia32_reg_classes[CLASS_ia32_st]) { @@ -1689,12 +1764,7 @@ static void emit_be_Perm(const ir_node *node) */ static void emit_ia32_Const(const ir_node *node) { - be_emit_cstring("\tmovl "); - emit_ia32_Immediate(node); - be_emit_cstring(", "); - ia32_emit_dest_register(node, 0); - - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tmovl %I, %D0\n"); } /** @@ -1702,65 +1772,43 @@ static void emit_ia32_Const(const ir_node *node) */ static void emit_ia32_LdTls(const ir_node *node) { - be_emit_cstring("\tmovl %gs:0, "); - 
ia32_emit_dest_register(node, 0); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tmovl %%gs:0, %D0\n"); } /* helper function for emit_ia32_Minus64Bit */ static void emit_mov(const ir_node* node, const arch_register_t *src, const arch_register_t *dst) { - be_emit_cstring("\tmovl "); - emit_register(src, NULL); - be_emit_cstring(", "); - emit_register(dst, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tmovl %R, %R\n", src, dst); } /* helper function for emit_ia32_Minus64Bit */ static void emit_neg(const ir_node* node, const arch_register_t *reg) { - be_emit_cstring("\tnegl "); - emit_register(reg, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tnegl %R\n", reg); } /* helper function for emit_ia32_Minus64Bit */ static void emit_sbb0(const ir_node* node, const arch_register_t *reg) { - be_emit_cstring("\tsbbl $0, "); - emit_register(reg, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tsbbl $0, %R\n", reg); } /* helper function for emit_ia32_Minus64Bit */ static void emit_sbb(const ir_node* node, const arch_register_t *src, const arch_register_t *dst) { - be_emit_cstring("\tsbbl "); - emit_register(src, NULL); - be_emit_cstring(", "); - emit_register(dst, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\tsbbl %R, %R\n", src, dst); } /* helper function for emit_ia32_Minus64Bit */ static void emit_xchg(const ir_node* node, const arch_register_t *src, const arch_register_t *dst) { - be_emit_cstring("\txchgl "); - emit_register(src, NULL); - be_emit_cstring(", "); - emit_register(dst, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\txchgl %R, %R\n", src, dst); } /* helper function for emit_ia32_Minus64Bit */ static void emit_zero(const ir_node* node, const arch_register_t *reg) { - be_emit_cstring("\txorl "); - emit_register(reg, NULL); - be_emit_cstring(", "); - emit_register(reg, NULL); - be_emit_finish_line_gas(node); + ia32_emitf(node, "\txorl %R, %R\n", reg, reg); } static void 
emit_ia32_Minus64Bit(const ir_node *node) @@ -1819,30 +1867,32 @@ zero_neg: static void emit_ia32_GetEIP(const ir_node *node) { - be_emit_cstring("\tcall "); - be_emit_string(pic_base_label); - be_emit_finish_line_gas(node); - - be_emit_string(pic_base_label); - be_emit_cstring(":\n"); - be_emit_write_line(); + ia32_emitf(node, "\tcall %s\n", pic_base_label); + ia32_emitf(NULL, "%s:\n", pic_base_label); + ia32_emitf(node, "\tpopl %D0\n"); +} - be_emit_cstring("\tpopl "); - ia32_emit_dest_register(node, 0); - be_emit_char('\n'); - be_emit_write_line(); +static void emit_ia32_ClimbFrame(const ir_node *node) +{ + const ia32_climbframe_attr_t *attr = get_ia32_climbframe_attr_const(node); + + ia32_emitf(node, "\tmovl %S0, %D0\n"); + ia32_emitf(node, "\tmovl $%u, %S1\n", attr->count); + ia32_emitf(NULL, BLOCK_PREFIX "%ld:\n", get_irn_node_nr(node)); + ia32_emitf(node, "\tmovl (%D0), %D0\n"); + ia32_emitf(node, "\tdec %S1\n"); + ia32_emitf(node, "\tjnz " BLOCK_PREFIX "%ld\n", get_irn_node_nr(node)); } static void emit_be_Return(const ir_node *node) { - unsigned pop; - be_emit_cstring("\tret"); + unsigned pop = be_Return_get_pop(node); - pop = be_Return_get_pop(node); if (pop > 0 || be_Return_get_emit_pop(node)) { - be_emit_irprintf(" $%d", pop); + ia32_emitf(node, "\tret $%u\n", pop); + } else { + ia32_emitf(node, "\tret\n"); } - be_emit_finish_line_gas(node); } static void emit_Nothing(const ir_node *node) @@ -1881,40 +1931,40 @@ static void ia32_register_emitters(void) ia32_register_spec_emitters(); /* other ia32 emitter functions */ + IA32_EMIT2(Conv_I2I8Bit, Conv_I2I); IA32_EMIT(Asm); - IA32_EMIT(CMov); - IA32_EMIT(IMul); - IA32_EMIT(SwitchJmp); - IA32_EMIT(CopyB); - IA32_EMIT(CopyB_i); - IA32_EMIT(Conv_I2FP); - IA32_EMIT(Conv_FP2I); + IA32_EMIT(CMovcc); + IA32_EMIT(Call); + IA32_EMIT(Const); IA32_EMIT(Conv_FP2FP); + IA32_EMIT(Conv_FP2I); + IA32_EMIT(Conv_I2FP); IA32_EMIT(Conv_I2I); - IA32_EMIT2(Conv_I2I8Bit, Conv_I2I); - IA32_EMIT(Const); + IA32_EMIT(CopyB); + 
IA32_EMIT(CopyB_i); + IA32_EMIT(GetEIP); + IA32_EMIT(IMul); + IA32_EMIT(Jcc); + IA32_EMIT(Setcc); IA32_EMIT(LdTls); IA32_EMIT(Minus64Bit); - IA32_EMIT(Jcc); - IA32_EMIT(GetEIP); + IA32_EMIT(SwitchJmp); + IA32_EMIT(ClimbFrame); + IA32_EMIT(Jmp); /* benode emitter */ - BE_EMIT(Call); - BE_EMIT(IncSP); BE_EMIT(Copy); BE_EMIT(CopyKeep); + BE_EMIT(IncSP); BE_EMIT(Perm); BE_EMIT(Return); - BE_IGN(RegParams); BE_IGN(Barrier); BE_IGN(Keep); + BE_IGN(Start); /* firm emitter */ - EMIT(Jmp); - IGN(Proj); IGN(Phi); - IGN(Start); #undef BE_EMIT #undef EMIT @@ -1925,6 +1975,23 @@ static void ia32_register_emitters(void) typedef void (*emit_func_ptr) (const ir_node *); +/** + * Assign and emit an exception label if the current instruction can fail. + */ +static void ia32_assign_exc_label(ir_node *node) +{ + /* assign a new ID to the instruction */ + set_ia32_exc_label_id(node, ++exc_label_id); + /* print it */ + ia32_emit_exc_label(node); + be_emit_char(':'); + be_emit_pad_comment(); + be_emit_cstring("/* exception to Block "); + ia32_emit_cfop_target(node); + be_emit_cstring(" */\n"); + be_emit_write_line(); +} + /** * Emits code for a node. 
*/ @@ -1934,9 +2001,22 @@ static void ia32_emit_node(ir_node *node) DBG((dbg, LEVEL_1, "emitting code for %+F\n", node)); - if (is_ia32_irn(node) && get_ia32_exc_label(node)) { - /* emit the exception label of this instruction */ - ia32_assign_exc_label(node); + if (is_ia32_irn(node)) { + if (get_ia32_exc_label(node)) { + /* emit the exception label of this instruction */ + ia32_assign_exc_label(node); + } + if (mark_spill_reload) { + if (is_ia32_is_spill(node)) { + ia32_emitf(NULL, "\txchg %ebx, %ebx /* spill mark */\n"); + } + if (is_ia32_is_reload(node)) { + ia32_emitf(NULL, "\txchg %edx, %edx /* reload mark */\n"); + } + if (is_ia32_is_remat(node)) { + ia32_emitf(NULL, "\txchg %ecx, %ecx /* remat mark */\n"); + } + } } if (op->ops.generic) { emit_func_ptr func = (emit_func_ptr) op->ops.generic; @@ -1956,9 +2036,7 @@ static void ia32_emit_node(ir_node *node) */ static void ia32_emit_alignment(unsigned align, unsigned skip) { - be_emit_cstring("\t.p2align "); - be_emit_irprintf("%u,,%u\n", align, skip); - be_emit_write_line(); + ia32_emitf(NULL, "\t.p2align %u,,%u\n", align, skip); } /** @@ -2029,7 +2107,7 @@ static void ia32_emit_block_header(ir_node *block) int i, arity; ir_exec_freq *exec_freq = cg->birg->exec_freq; - if (block == get_irg_end_block(irg) || block == get_irg_start_block(irg)) + if (block == get_irg_end_block(irg)) return; if (ia32_cg_config.label_alignment > 0) { @@ -2058,7 +2136,7 @@ static void ia32_emit_block_header(ir_node *block) } } - if (need_label || has_Block_label(block)) { + if (need_label) { ia32_emit_block_name(block); be_emit_char(':'); @@ -2074,12 +2152,16 @@ static void ia32_emit_block_header(ir_node *block) /* emit list of pred blocks in comment */ arity = get_irn_arity(block); - for (i = 0; i < arity; ++i) { - ir_node *predblock = get_Block_cfgpred_block(block, i); - be_emit_irprintf(" %d", get_irn_node_nr(predblock)); + if (arity <= 0) { + be_emit_cstring(" none"); + } else { + for (i = 0; i < arity; ++i) { + ir_node 
*predblock = get_Block_cfgpred_block(block, i); + be_emit_irprintf(" %d", get_irn_node_nr(predblock)); + } } if (exec_freq != NULL) { - be_emit_irprintf(" freq: %f", + be_emit_irprintf(", freq: %f", get_block_execfreq(exec_freq, block)); } be_emit_cstring(" */\n"); @@ -2135,25 +2217,6 @@ static void ia32_gen_labels(ir_node *block, void *data) } } -/** - * Assign and emit an exception label if the current instruction can fail. - */ -void ia32_assign_exc_label(ir_node *node) -{ - if (get_ia32_exc_label(node)) { - /* assign a new ID to the instruction */ - set_ia32_exc_label_id(node, ++exc_label_id); - /* print it */ - ia32_emit_exc_label(node); - be_emit_char(':'); - be_emit_pad_comment(); - be_emit_cstring("/* exception to Block "); - ia32_emit_cfop_target(node); - be_emit_cstring(" */\n"); - be_emit_write_line(); - } -} - /** * Compare two exception_entries. */ @@ -2177,10 +2240,11 @@ void ia32_gen_routine(ia32_code_gen_t *ia32_cg, ir_graph *irg) int i, n; cg = ia32_cg; - isa = (const ia32_isa_t*) cg->arch_env; - arch_env = cg->arch_env; + isa = cg->isa; do_pic = cg->birg->main_env->options->pic; + be_gas_elf_type_char = '@'; + ia32_register_emitters(); get_unique_label(pic_base_label, sizeof(pic_base_label), ".PIC_BASE"); @@ -2232,7 +2296,2065 @@ void ia32_gen_routine(ia32_code_gen_t *ia32_cg, ir_graph *irg) DEL_ARR_F(exc_list); } -void ia32_init_emitter(void) +static const lc_opt_table_entry_t ia32_emitter_options[] = { + LC_OPT_ENT_BOOL("mark_spill_reload", "mark spills and reloads with ud opcodes", &mark_spill_reload), + LC_OPT_LAST +}; + +/* ==== Experimental binary emitter ==== */ + +static unsigned char reg_gp_map[N_ia32_gp_REGS]; +//static unsigned char reg_mmx_map[N_ia32_mmx_REGS]; +//static unsigned char reg_sse_map[N_ia32_xmm_REGS]; +static unsigned char pnc_map_signed[8]; +static unsigned char pnc_map_unsigned[8]; + +static void build_reg_map(void) +{ + reg_gp_map[REG_EAX] = 0x0; + reg_gp_map[REG_ECX] = 0x1; + reg_gp_map[REG_EDX] = 0x2; + 
reg_gp_map[REG_EBX] = 0x3; + reg_gp_map[REG_ESP] = 0x4; + reg_gp_map[REG_EBP] = 0x5; + reg_gp_map[REG_ESI] = 0x6; + reg_gp_map[REG_EDI] = 0x7; + + pnc_map_signed[pn_Cmp_Eq] = 0x04; + pnc_map_signed[pn_Cmp_Lt] = 0x0C; + pnc_map_signed[pn_Cmp_Le] = 0x0E; + pnc_map_signed[pn_Cmp_Gt] = 0x0F; + pnc_map_signed[pn_Cmp_Ge] = 0x0D; + pnc_map_signed[pn_Cmp_Lg] = 0x05; + + pnc_map_unsigned[pn_Cmp_Eq] = 0x04; + pnc_map_unsigned[pn_Cmp_Lt] = 0x02; + pnc_map_unsigned[pn_Cmp_Le] = 0x06; + pnc_map_unsigned[pn_Cmp_Gt] = 0x07; + pnc_map_unsigned[pn_Cmp_Ge] = 0x03; + pnc_map_unsigned[pn_Cmp_Lg] = 0x05; +} + +/** Returns the encoding for a pnc field. */ +static unsigned char pnc2cc(int pnc) +{ + unsigned char cc; + if (pnc == ia32_pn_Cmp_parity) { + cc = 0x0A; + } else if (pnc & ia32_pn_Cmp_float || pnc & ia32_pn_Cmp_unsigned) { + cc = pnc_map_unsigned[pnc & 0x07]; + } else { + cc = pnc_map_signed[pnc & 0x07]; + } + assert(cc != 0); + return cc; +} + +/** Sign extension bit values for binops */ +enum SignExt { + UNSIGNED_IMM = 0, /**< unsigned immediate */ + SIGNEXT_IMM = 2, /**< sign extended immediate */ +}; + +/** The mod encoding of the ModR/M */ +enum Mod { + MOD_IND = 0x00, /**< [reg1] */ + MOD_IND_BYTE_OFS = 0x40, /**< [reg1 + byte ofs] */ + MOD_IND_WORD_OFS = 0x80, /**< [reg1 + word ofs] */ + MOD_REG = 0xC0 /**< reg1 */ +}; + +/** create R/M encoding for ModR/M */ +#define ENC_RM(x) (x) +/** create REG encoding for ModR/M */ +#define ENC_REG(x) ((x) << 3) + +/** create encoding for a SIB byte */ +#define ENC_SIB(scale, index, base) ((scale) << 6 | (index) << 3 | (base)) + +/* Node: The following routines are supposed to append bytes, words, dwords + to the output stream. 
+ Currently the implementation is stupid in that it still creates output + for an "assembler" in the form of .byte, .long + We will change this when enough infrastructure is there to create complete + machine code in memory/object files */ + +static void bemit8(const unsigned char byte) +{ + be_emit_irprintf("\t.byte 0x%x\n", byte); + be_emit_write_line(); +} + +static void bemit16(const unsigned short u16) +{ + be_emit_irprintf("\t.word 0x%x\n", u16); + be_emit_write_line(); +} + +static void bemit32(const unsigned u32) +{ + be_emit_irprintf("\t.long 0x%x\n", u32); + be_emit_write_line(); +} + +/** + * Emit address of an entity. If @p is_relative is true then a relative + * offset from behind the address to the entity is created. + */ +static void bemit_entity(ir_entity *entity, bool entity_sign, int offset, + bool is_relative) +{ + if (entity == NULL) { + bemit32(offset); + return; + } + + /* the final version should remember the position in the bytestream + and patch it with the correct address at linktime... */ + be_emit_cstring("\t.long "); + if (entity_sign) + be_emit_char('-'); + be_gas_emit_entity(entity); + + if (get_entity_owner(entity) == get_tls_type()) { + if (get_entity_linkage(entity) & IR_LINKAGE_EXTERN) { + be_emit_cstring("@INDNTPOFF"); + } else { + be_emit_cstring("@NTPOFF"); + } + } + + if (is_relative) { + be_emit_cstring("-."); + offset -= 4; + } + + if (offset != 0) { + be_emit_irprintf("%+d", offset); + } + be_emit_char('\n'); + be_emit_write_line(); +} + +static void bemit_jmp_destination(const ir_node *dest_block) +{ + be_emit_cstring("\t.long "); + ia32_emit_block_name(dest_block); + be_emit_cstring(" - . - 4\n"); + be_emit_write_line(); +} + +/* end emit routines, all emitters following here should only use the functions + above. 
*/ + +typedef enum reg_modifier { + REG_LOW = 0, + REG_HIGH = 1 +} reg_modifier_t; + +/** Create a ModR/M byte for src1,src2 registers */ +static void bemit_modrr(const arch_register_t *src1, + const arch_register_t *src2) { + unsigned char modrm = MOD_REG; + modrm |= ENC_RM(reg_gp_map[src1->index]); + modrm |= ENC_REG(reg_gp_map[src2->index]); + bemit8(modrm); +} + +/** Create a ModR/M8 byte for src1,src2 registers */ +static void bemit_modrr8(reg_modifier_t high_part1, const arch_register_t *src1, + reg_modifier_t high_part2, const arch_register_t *src2) +{ + unsigned char modrm = MOD_REG; + modrm |= ENC_RM(reg_gp_map[src1->index] + (high_part1 == REG_HIGH ? 4 : 0)); + modrm |= ENC_REG(reg_gp_map[src2->index] + (high_part2 == REG_HIGH ? 4 : 0)); + bemit8(modrm); +} + +/** Create a ModR/M byte for one register and extension */ +static void bemit_modru(const arch_register_t *reg, unsigned ext) +{ + unsigned char modrm = MOD_REG; + assert(ext <= 7); + modrm |= ENC_RM(reg_gp_map[reg->index]); + modrm |= ENC_REG(ext); + bemit8(modrm); +} + +/** Create a ModR/M8 byte for one register */ +static void bemit_modrm8(reg_modifier_t high_part, const arch_register_t *reg) +{ + unsigned char modrm = MOD_REG; + assert(reg_gp_map[reg->index] < 4); + modrm |= ENC_RM(reg_gp_map[reg->index] + (high_part == REG_HIGH ? 4 : 0)); + modrm |= MOD_REG; + bemit8(modrm); +} + +/** + * Calculate the size of an signed immediate in bytes. + * + * @param offset an offset + */ +static unsigned get_signed_imm_size(int offset) +{ + if (-128 <= offset && offset < 128) { + return 1; + } else if (-32768 <= offset && offset < 32768) { + return 2; + } else { + return 4; + } +} + +/** + * Emit an address mode. 
 *
 * Emits the ModR/M byte, an optional SIB byte and an optional 8 or 32bit
 * displacement for the address mode attributes (base, index, scale, offset,
 * entity) of @p node.
 *
 * @param reg   content of the reg field: either a register index or an opcode extension
 * @param node  the node
 */
static void bemit_mod_am(unsigned reg, const ir_node *node)
{
	ir_entity *ent       = get_ia32_am_sc(node);
	int        offs      = get_ia32_am_offs_int(node);
	ir_node   *base      = get_irn_n(node, n_ia32_base);
	int        has_base  = !is_ia32_NoReg_GP(base);
	ir_node   *index     = get_irn_n(node, n_ia32_index);
	int        has_index = !is_ia32_NoReg_GP(index);
	unsigned   modrm     = 0;
	unsigned   sib       = 0;
	unsigned   emitoffs  = 0;     /* displacement width in bits: 0, 8 or 32 */
	bool       emitsib   = false;
	unsigned   base_enc;

	/* set the mod part depending on displacement */
	if (ent != NULL) {
		/* an entity reference always takes the 32bit displacement form */
		modrm |= MOD_IND_WORD_OFS;
		emitoffs = 32;
	} else if (offs == 0) {
		modrm |= MOD_IND;
		emitoffs = 0;
	} else if (-128 <= offs && offs < 128) {
		modrm |= MOD_IND_BYTE_OFS;
		emitoffs = 8;
	} else {
		modrm |= MOD_IND_WORD_OFS;
		emitoffs = 32;
	}

	if (has_base) {
		const arch_register_t *base_reg = arch_get_irn_register(base);
		base_enc = reg_gp_map[base_reg->index];
	} else {
		/* Use the EBP encoding + MOD_IND if NO base register. There is
		 * always a 32bit offset present in this case. */
		modrm    = MOD_IND;
		base_enc = 0x05;
		emitoffs = 32;
	}

	/* Determine if we need a SIB byte. */
	if (has_index) {
		const arch_register_t *reg_index = arch_get_irn_register(index);
		int                    scale     = get_ia32_am_scale(node);
		assert(scale < 4);
		/* R/M set to ESP means SIB in 32bit mode. */
		modrm   |= ENC_RM(0x04);
		sib      = ENC_SIB(scale, reg_gp_map[reg_index->index], base_enc);
		emitsib = true;
	} else if (base_enc == 0x04) {
		/* for the above reason we are forced to emit a SIB when base is ESP.
		 * Only the base is used, index must be ESP too, which means no index.
		 */
		modrm   |= ENC_RM(0x04);
		sib      = ENC_SIB(0, 0x04, 0x04);
		emitsib  = true;
	} else {
		modrm |= ENC_RM(base_enc);
	}

	/* We are forced to emit an 8bit offset as EBP base without offset is a
	 * special case for SIB without base register. */
	if (base_enc == 0x05 && emitoffs == 0) {
		modrm    |= MOD_IND_BYTE_OFS;
		emitoffs  = 8;
	}

	modrm |= ENC_REG(reg);

	/* byte order: ModR/M, optional SIB, optional displacement */
	bemit8(modrm);
	if (emitsib)
		bemit8(sib);

	/* emit displacement */
	if (emitoffs == 8) {
		bemit8((unsigned) offs);
	} else if (emitoffs == 32) {
		bemit_entity(ent, is_ia32_am_sc_sign(node), offs, false);
	}
}

/**
 * Emit a binop with a immediate operand.
 *
 * @param node       the node to emit
 * @param opcode_ax  the opcode for the op eax, imm variant
 * @param opcode     the opcode for the reg, imm variant
 * @param ruval      the opcode extension for opcode
 */
static void bemit_binop_with_imm(
	const ir_node *node,
	unsigned char opcode_ax,
	unsigned char opcode, unsigned char ruval)
{
	/* Use in-reg, because some instructions (cmp, test) have no out-reg. */
	const ir_node               *op   = get_irn_n(node, n_ia32_binary_right);
	const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(op);
	unsigned                     size;

	/* Some instructions (test) have no short form with 32bit value + 8bit
	 * immediate. */
	if (attr->symconst != NULL || opcode & SIGNEXT_IMM) {
		/* symbolic constants are always emitted with the full 4 bytes */
		size = 4;
	} else {
		/* check for sign extension */
		size = get_signed_imm_size(attr->offset);
	}

	switch (size) {
	case 1:
		/* short form: opcode with SIGNEXT_IMM set, followed by an imm8 */
		bemit8(opcode | SIGNEXT_IMM);
		/* cmp has this special mode */
		if (get_ia32_op_type(node) == ia32_AddrModeS) {
			bemit_mod_am(ruval, node);
		} else {
			const arch_register_t *reg = get_in_reg(node, n_ia32_binary_left);
			bemit_modru(reg, ruval);
		}
		bemit8((unsigned char)attr->offset);
		return;
	case 2:
	case 4:
		/* check for eax variant: this variant is shorter for 32bit immediates only */
		if (get_ia32_op_type(node) == ia32_AddrModeS) {
			bemit8(opcode);
			bemit_mod_am(ruval, node);
		} else {
			const arch_register_t *reg = get_in_reg(node, n_ia32_binary_left);
			if (reg->index == REG_EAX) {
				/* the eax form has no ModR/M byte */
				bemit8(opcode_ax);
			} else {
				bemit8(opcode);
				bemit_modru(reg, ruval);
			}
		}
		bemit_entity(attr->symconst, attr->sc_sign, attr->offset, false);
		return;
	}
	panic("invalid imm size?!?");
}

/**
 * Emits a binop whose right operand is a register or an address mode.
 *
 * @param node  the node to emit
 * @param code  the opcode byte; the left operand goes into the REG field
 */
static void bemit_binop_2(const ir_node *node, unsigned code)
{
	const arch_register_t *out = get_in_reg(node, n_ia32_binary_left);
	bemit8(code);
	if (get_ia32_op_type(node) == ia32_Normal) {
		const arch_register_t *op2 = get_in_reg(node, n_ia32_binary_right);
		bemit_modrr(op2, out);
	} else {
		bemit_mod_am(reg_gp_map[out->index], node);
	}
}

/**
 * Emit a binop, dispatching on whether the right operand is an immediate.
 *
 * @param node     the node to emit
 * @param opcodes  [0] opcode for the register/address mode form,
 *                 [1] opcode for the eax, imm form,
 *                 [2] opcode for the reg, imm form,
 *                 [3] opcode extension used together with [2]
 */
static void bemit_binop(const ir_node *node, const unsigned char opcodes[4])
{
	ir_node *right = get_irn_n(node, n_ia32_binary_right);
	if (is_ia32_Immediate(right)) {
		bemit_binop_with_imm(node, opcodes[1], opcodes[2], opcodes[3]);
	} else {
		bemit_binop_2(node, opcodes[0]);
	}
}

/**
 * Emit an unop.
 *
 * @param node   the node to emit
 * @param code   the opcode byte
 * @param ext    content of the REG field of the ModR/M byte (opcode extension
 *               or register encoding)
 * @param input  index of the node input holding the register operand; only
 *               used if the node is not in address mode
 */
static void bemit_unop(const ir_node *node, unsigned char code, unsigned char ext, int input)
{
	bemit8(code);
	if (get_ia32_op_type(node) == ia32_Normal) {
		const arch_register_t *in = get_in_reg(node, input);
		bemit_modru(in, ext);
	} else {
		bemit_mod_am(ext, node);
	}
}

/**
 * Emit an unop whose REG field holds the encoding of the node's output
 * register 0.
 */
static void bemit_unop_reg(const ir_node *node, unsigned char code, int input)
{
	const arch_register_t *out = get_out_reg(node, 0);
	bemit_unop(node, code, reg_gp_map[out->index], input);
}

/**
 * Emit an unop on a memory operand.
 *
 * @param node  the node to emit
 * @param code  the opcode of the 8bit form; code + 1 is used for 16/32bit
 * @param ext   the opcode extension
 */
static void bemit_unop_mem(const ir_node *node, unsigned char code, unsigned char ext)
{
	unsigned size = get_mode_size_bits(get_ia32_ls_mode(node));
	if (size == 16)
		bemit8(0x66); /* operand size prefix */
	bemit8(size == 8 ? code : code + 1);
	bemit_mod_am(ext, node);
}

/**
 * Emit the 32bit value of an immediate node.
 *
 * @param node      the immediate node
 * @param relative  passed on as is_relative to bemit_entity()
 */
static void bemit_immediate(const ir_node *node, bool relative)
{
	const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(node);
	bemit_entity(attr->symconst, attr->sc_sign, attr->offset, relative);
}

/**
 * Emit a register copy. Nothing is emitted if source and destination are
 * the same register, the source is the unknown register, or the source is a
 * vfp register.
 */
static void bemit_copy(const ir_node *copy)
{
	const arch_register_t *in  = get_in_reg(copy, 0);
	const arch_register_t *out = get_out_reg(copy, 0);

	if (in == out || is_unknown_reg(in))
		return;
	/* copies of vf nodes aren't real... */
	if (arch_register_get_class(in) == &ia32_reg_classes[CLASS_ia32_vfp])
		return;

	if (get_irn_mode(copy) == mode_E) {
		panic("NIY");
	} else {
		assert(arch_register_get_class(in) == &ia32_reg_classes[CLASS_ia32_gp]);
		/* 0x8B with in as R/M and out as REG */
		bemit8(0x8B);
		bemit_modrr(in, out);
	}
}

/**
 * Emit a Perm (exchange) of the registers of inputs 0 and 1.
 * Only the gp class emits code; xmm is not implemented, vfp and st emit
 * nothing.
 */
static void bemit_perm(const ir_node *node)
{
	const arch_register_t       *in0  = arch_get_irn_register(get_irn_n(node, 0));
	const arch_register_t       *in1  = arch_get_irn_register(get_irn_n(node, 1));
	const arch_register_class_t *cls0 = arch_register_get_class(in0);

	assert(cls0 == arch_register_get_class(in1) && "Register class mismatch at Perm");

	if (cls0 == &ia32_reg_classes[CLASS_ia32_gp]) {
		/* if one side is eax, the one byte form 0x90+reg is used */
		if (in0->index == REG_EAX) {
			bemit8(0x90 + reg_gp_map[in1->index]);
		} else if (in1->index == REG_EAX) {
			bemit8(0x90 + reg_gp_map[in0->index]);
		} else {
			bemit8(0x87);
			bemit_modrr(in0, in1);
		}
	} else if (cls0 == &ia32_reg_classes[CLASS_ia32_xmm]) {
		panic("unimplemented"); // TODO implement
		//ia32_emitf(NULL, "\txorpd %R, %R\n", in1, in0);
		//ia32_emitf(NULL, "\txorpd %R, %R\n", in0, in1);
		//ia32_emitf(node, "\txorpd %R, %R\n", in1, in0);
	} else if (cls0 == &ia32_reg_classes[CLASS_ia32_vfp]) {
		/* is a NOP */
	} else if (cls0 == &ia32_reg_classes[CLASS_ia32_st]) {
		/* is a NOP */
	} else {
		panic("unexpected register class in be_Perm (%+F)", node);
	}
}

/**
 * Emit opcode 0x31 with the node's output register 0 in both ModR/M fields
 * (xor of the register with itself).
 */
static void bemit_xor0(const ir_node *node)
{
	const arch_register_t *out = get_out_reg(node, 0);
	bemit8(0x31);
	bemit_modrr(out, out);
}

/**
 * Emit opcode 0xB8+reg for the node's output register 0, followed by the
 * node's 32bit immediate value.
 */
static void bemit_mov_const(const ir_node *node)
{
	const arch_register_t *out = get_out_reg(node, 0);
	bemit8(0xB8 + reg_gp_map[out->index]);
	bemit_immediate(node, false);
}

/**
 * Creates a function for a Binop with 3 possible encodings.
 *
 * @param op       name suffix of the generated function bemit_<op>
 * @param op0      opcode of the register/address mode form
 * @param op1      opcode of the eax, imm form
 * @param op2      opcode of the reg, imm form
 * @param op2_ext  opcode extension used together with op2
 */
#define BINOP(op, op0, op1, op2, op2_ext)                                 \
static void bemit_ ## op(const ir_node *node) {                           \
	static const unsigned char op ## _codes[] = {op0, op1, op2, op2_ext}; \
	bemit_binop(node, op ## _codes);                                      \
}

/*    insn  def  eax,imm   imm */
BINOP(add,  0x03, 0x05, 0x81, 0)
BINOP(or,   0x0B, 0x0D, 0x81, 1)
BINOP(adc,  0x13, 0x15, 0x81, 2)
BINOP(sbb,  0x1B, 0x1D, 0x81, 3)
BINOP(and,  0x23, 0x25, 0x81, 4)
BINOP(sub,  0x2B, 0x2D, 0x81, 5)
BINOP(xor,  0x33, 0x35, 0x81, 6)
BINOP(test, 0x85, 0xA9, 0xF7, 0)

/**
 * Creates two functions for a binop with a memory destination:
 * bemit_<op> for 16/32bit operands (a 0x66 prefix is emitted for 16bit) and
 * bemit_<op>8bit for 8bit operands.
 *
 * With an immediate operand the opcodes 0x83 (imm8), 0x81 (imm16/imm32) or
 * 0x80 (8bit variant) are used with ext as opcode extension. With a register
 * operand the opcode is derived from ext as (ext << 3 | 1), or (ext << 3)
 * for the 8bit variant.
 *
 * @param op   name suffix of the generated functions
 * @param ext  opcode extension of the operation
 */
#define BINOPMEM(op, ext) \
static void bemit_##op(const ir_node *node) \
{ \
	ir_node *val; \
	unsigned size = get_mode_size_bits(get_ia32_ls_mode(node)); \
	if (size == 16) \
		bemit8(0x66); \
	val = get_irn_n(node, n_ia32_unary_op); \
	if (is_ia32_Immediate(val)) { \
		const ia32_immediate_attr_t *attr   = get_ia32_immediate_attr_const(val); \
		int                          offset = attr->offset; \
		if (attr->symconst == NULL && get_signed_imm_size(offset) == 1) { \
			bemit8(0x83); \
			bemit_mod_am(ext, node); \
			bemit8(offset); \
		} else { \
			bemit8(0x81); \
			bemit_mod_am(ext, node); \
			if (size == 16) { \
				bemit16(offset); \
			} else { \
				bemit_entity(attr->symconst, attr->sc_sign, offset, false); \
			} \
		} \
	} else { \
		bemit8(ext << 3 | 1); \
		bemit_mod_am(reg_gp_map[get_out_reg(val, 0)->index], node); \
	} \
} \
 \
static void bemit_##op##8bit(const ir_node *node) \
{ \
	ir_node *val = get_irn_n(node, n_ia32_unary_op); \
	if (is_ia32_Immediate(val)) { \
		bemit8(0x80); \
		bemit_mod_am(ext, node); \
		bemit8(get_ia32_immediate_attr_const(val)->offset); \
	} else { \
		bemit8(ext << 3); \
		bemit_mod_am(reg_gp_map[get_out_reg(val, 0)->index], node); \
	} \
}

BINOPMEM(addmem,  0)
BINOPMEM(ormem,   1)
BINOPMEM(andmem,  4)
BINOPMEM(submem,  5)
BINOPMEM(xormem,  6)


/**
 * Creates a function for an Unop with code /ext encoding.
 *
 * @param op     name suffix of the generated function bemit_<op>
 * @param code   the opcode byte
 * @param ext    the opcode extension
 * @param input  index of the node input holding the register operand
 */
#define UNOP(op, code, ext, input)              \
static void bemit_ ## op(const ir_node *node) { \
	bemit_unop(node, code, ext, input);         \
}

UNOP(not,     0xF7, 2, n_ia32_Not_val)
UNOP(neg,     0xF7, 3, n_ia32_Neg_val)
UNOP(mul,     0xF7, 4, n_ia32_Mul_right)
UNOP(imul1op, 0xF7, 5, n_ia32_IMul1OP_right)
UNOP(div,     0xF7, 6, n_ia32_Div_divisor)
UNOP(idiv,    0xF7, 7, n_ia32_IDiv_divisor)

/* TODO: am support for IJmp */
UNOP(ijmp,    0xFF, 4, n_ia32_IJmp_target)

/**
 * Creates two functions for a shift/rotate operation: bemit_<op> operating
 * on the node's output register 0 and bemit_<op>mem operating on a memory
 * operand. The count is taken from node input 1.
 *
 * Opcodes used (8bit memory form / other forms):
 *   immediate count of 1:  0xD0 / 0xD1
 *   other immediate count: 0xC0 / 0xC1, followed by the count as imm8
 *   non-immediate count:   0xD2 / 0xD3
 * The memory variant emits a 0x66 prefix for 16bit operands.
 *
 * @param op   name suffix of the generated functions
 * @param ext  the opcode extension of the operation
 */
#define SHIFT(op, ext) \
static void bemit_##op(const ir_node *node) \
{ \
	const arch_register_t *out   = get_out_reg(node, 0); \
	ir_node               *count = get_irn_n(node, 1); \
	if (is_ia32_Immediate(count)) { \
		int offset = get_ia32_immediate_attr_const(count)->offset; \
		if (offset == 1) { \
			bemit8(0xD1); \
			bemit_modru(out, ext); \
		} else { \
			bemit8(0xC1); \
			bemit_modru(out, ext); \
			bemit8(offset); \
		} \
	} else { \
		bemit8(0xD3); \
		bemit_modru(out, ext); \
	} \
} \
 \
static void bemit_##op##mem(const ir_node *node) \
{ \
	ir_node *count; \
	unsigned size = get_mode_size_bits(get_ia32_ls_mode(node)); \
	if (size == 16) \
		bemit8(0x66); \
	count = get_irn_n(node, 1); \
	if (is_ia32_Immediate(count)) { \
		int offset = get_ia32_immediate_attr_const(count)->offset; \
		if (offset == 1) { \
			bemit8(size == 8 ? 0xD0 : 0xD1); \
			bemit_mod_am(ext, node); \
		} else { \
			bemit8(size == 8 ? 0xC0 : 0xC1); \
			bemit_mod_am(ext, node); \
			bemit8(offset); \
		} \
	} else { \
		bemit8(size == 8 ? 0xD2 : 0xD3); \
		bemit_mod_am(ext, node); \
	} \
}

SHIFT(rol, 0)
SHIFT(ror, 1)
SHIFT(shl, 4)
SHIFT(shr, 5)
SHIFT(sar, 7)

/**
 * Emit a ShlD: 0x0F 0xA4 with an imm8 count if the count input is an
 * immediate, 0x0F 0xA5 otherwise. The result register goes into the R/M
 * field, the val_low input register into the REG field.
 */
static void bemit_shld(const ir_node *node)
{
	const arch_register_t *in  = get_in_reg(node, n_ia32_ShlD_val_low);
	const arch_register_t *out = get_out_reg(node, pn_ia32_ShlD_res);
	ir_node *count = get_irn_n(node, n_ia32_ShlD_count);
	bemit8(0x0F);
	if (is_ia32_Immediate(count)) {
		bemit8(0xA4);
		bemit_modrr(out, in);
		bemit8(get_ia32_immediate_attr_const(count)->offset);
	} else {
		bemit8(0xA5);
		bemit_modrr(out, in);
	}
}

/**
 * Emit a ShrD: 0x0F 0xAC with an imm8 count if the count input is an
 * immediate, 0x0F 0xAD otherwise. The result register goes into the R/M
 * field, the val_low input register into the REG field.
 */
static void bemit_shrd(const ir_node *node)
{
	const arch_register_t *in  = get_in_reg(node, n_ia32_ShrD_val_low);
	const arch_register_t *out = get_out_reg(node, pn_ia32_ShrD_res);
	ir_node *count = get_irn_n(node, n_ia32_ShrD_count);
	bemit8(0x0F);
	if (is_ia32_Immediate(count)) {
		bemit8(0xAC);
		bemit_modrr(out, in);
		bemit8(get_ia32_immediate_attr_const(count)->offset);
	} else {
		bemit8(0xAD);
		bemit_modrr(out, in);
	}
}

/**
 * binary emitter for setcc.
+ */ +static void bemit_setcc(const ir_node *node) +{ + const arch_register_t *dreg = get_out_reg(node, pn_ia32_Setcc_res); + + pn_Cmp pnc = get_ia32_condcode(node); + pnc = determine_final_pnc(node, n_ia32_Setcc_eflags, pnc); + if (pnc & ia32_pn_Cmp_float) { + switch (pnc & 0x0f) { + case pn_Cmp_Uo: + /* setp dreg */ + bemit8(0x0F); + bemit8(0x9B); + bemit_modrm8(REG_HIGH, dreg); + + /* andb %>dreg, %dreg */ + bemit8(0x0F); + bemit8(0x9A); + bemit_modrm8(REG_HIGH, dreg); + + /* orb %>dreg, %data.ins_permuted; + const arch_register_t *out = arch_irn_get_register(node, pn_ia32_res); + pn_Cmp pnc = get_ia32_condcode(node); + const arch_register_t *in_true; + const arch_register_t *in_false; + + pnc = determine_final_pnc(node, n_ia32_CMovcc_eflags, pnc); + + in_true = arch_get_irn_register(get_irn_n(node, n_ia32_CMovcc_val_true)); + in_false = arch_get_irn_register(get_irn_n(node, n_ia32_CMovcc_val_false)); + + /* should be same constraint fullfilled? */ + if (out == in_false) { + /* yes -> nothing to do */ + } else if (out == in_true) { + assert(get_ia32_op_type(node) == ia32_Normal); + ins_permuted = !ins_permuted; + in_true = in_false; + } else { + /* we need a mov */ + bemit8(0x8B); // mov %in_false, %out + bemit_modrr(in_false, out); + } + + if (ins_permuted) + pnc = ia32_get_negated_pnc(pnc); + + /* TODO: handling of Nans isn't correct yet */ + + bemit8(0x0F); + bemit8(0x40 | pnc2cc(pnc)); + if (get_ia32_op_type(node) == ia32_Normal) { + bemit_modrr(in_true, out); + } else { + bemit_mod_am(reg_gp_map[out->index], node); + } +} + +static void bemit_cmp(const ir_node *node) +{ + unsigned ls_size = get_mode_size_bits(get_ia32_ls_mode(node)); + ir_node *right; + + if (ls_size == 16) + bemit8(0x66); + + right = get_irn_n(node, n_ia32_binary_right); + if (is_ia32_Immediate(right)) { + /* Use in-reg, because some instructions (cmp, test) have no out-reg. 
*/ + const ir_node *op = get_irn_n(node, n_ia32_binary_right); + const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(op); + unsigned size; + + if (attr->symconst != NULL) { + size = 4; + } else { + /* check for sign extension */ + size = get_signed_imm_size(attr->offset); + } + + switch (size) { + case 1: + bemit8(0x81 | SIGNEXT_IMM); + /* cmp has this special mode */ + if (get_ia32_op_type(node) == ia32_AddrModeS) { + bemit_mod_am(7, node); + } else { + const arch_register_t *reg = get_in_reg(node, n_ia32_binary_left); + bemit_modru(reg, 7); + } + bemit8((unsigned char)attr->offset); + return; + case 2: + case 4: + /* check for eax variant: this variant is shorter for 32bit immediates only */ + if (get_ia32_op_type(node) == ia32_AddrModeS) { + bemit8(0x81); + bemit_mod_am(7, node); + } else { + const arch_register_t *reg = get_in_reg(node, n_ia32_binary_left); + if (reg->index == REG_EAX) { + bemit8(0x3D); + } else { + bemit8(0x81); + bemit_modru(reg, 7); + } + } + if (ls_size == 16) { + bemit16(attr->offset); + } else { + bemit_entity(attr->symconst, attr->sc_sign, attr->offset, false); + } + return; + } + panic("invalid imm size?!?"); + } else { + const arch_register_t *out = get_in_reg(node, n_ia32_binary_left); + bemit8(0x3B); + if (get_ia32_op_type(node) == ia32_Normal) { + const arch_register_t *op2 = get_in_reg(node, n_ia32_binary_right); + bemit_modrr(op2, out); + } else { + bemit_mod_am(reg_gp_map[out->index], node); + } + } +} + +static void bemit_cmp8bit(const ir_node *node) +{ + ir_node *right = get_irn_n(node, n_ia32_binary_right); + if (is_ia32_Immediate(right)) { + if (get_ia32_op_type(node) == ia32_Normal) { + const arch_register_t *out = get_in_reg(node, n_ia32_Cmp_left); + if (out->index == REG_EAX) { + bemit8(0x3C); + } else { + bemit8(0x80); + bemit_modru(out, 7); + } + } else { + bemit8(0x80); + bemit_mod_am(7, node); + } + bemit8(get_ia32_immediate_attr_const(right)->offset); + } else { + const arch_register_t *out = 
get_in_reg(node, n_ia32_Cmp_left); + bemit8(0x3A); + if (get_ia32_op_type(node) == ia32_Normal) { + const arch_register_t *in = get_in_reg(node, n_ia32_Cmp_right); + bemit_modrr(out, in); + } else { + bemit_mod_am(reg_gp_map[out->index], node); + } + } +} + +static void bemit_test8bit(const ir_node *node) +{ + ir_node *right = get_irn_n(node, n_ia32_Test8Bit_right); + if (is_ia32_Immediate(right)) { + if (get_ia32_op_type(node) == ia32_Normal) { + const arch_register_t *out = get_in_reg(node, n_ia32_Test8Bit_left); + if (out->index == REG_EAX) { + bemit8(0xA8); + } else { + bemit8(0xF6); + bemit_modru(out, 0); + } + } else { + bemit8(0xF6); + bemit_mod_am(0, node); + } + bemit8(get_ia32_immediate_attr_const(right)->offset); + } else { + const arch_register_t *out = get_in_reg(node, n_ia32_Test8Bit_left); + bemit8(0x84); + if (get_ia32_op_type(node) == ia32_Normal) { + const arch_register_t *in = get_in_reg(node, n_ia32_Test8Bit_right); + bemit_modrr(out, in); + } else { + bemit_mod_am(reg_gp_map[out->index], node); + } + } +} + +static void bemit_imul(const ir_node *node) +{ + ir_node *right = get_irn_n(node, n_ia32_IMul_right); + /* Do we need the immediate form? 
*/ + if (is_ia32_Immediate(right)) { + int imm = get_ia32_immediate_attr_const(right)->offset; + if (get_signed_imm_size(imm) == 1) { + bemit_unop_reg(node, 0x6B, n_ia32_IMul_left); + bemit8(imm); + } else { + bemit_unop_reg(node, 0x69, n_ia32_IMul_left); + bemit32(imm); + } + } else { + bemit8(0x0F); + bemit_unop_reg(node, 0xAF, n_ia32_IMul_right); + } +} + +static void bemit_dec(const ir_node *node) +{ + const arch_register_t *out = get_out_reg(node, pn_ia32_Dec_res); + bemit8(0x48 + reg_gp_map[out->index]); +} + +static void bemit_inc(const ir_node *node) +{ + const arch_register_t *out = get_out_reg(node, pn_ia32_Inc_res); + bemit8(0x40 + reg_gp_map[out->index]); +} + +#define UNOPMEM(op, code, ext) \ +static void bemit_##op(const ir_node *node) \ +{ \ + bemit_unop_mem(node, code, ext); \ +} + +UNOPMEM(notmem, 0xF6, 2) +UNOPMEM(negmem, 0xF6, 3) +UNOPMEM(incmem, 0xFE, 0) +UNOPMEM(decmem, 0xFE, 1) + +static void bemit_ldtls(const ir_node *node) +{ + const arch_register_t *out = get_out_reg(node, 0); + + bemit8(0x65); // gs: + if (out->index == REG_EAX) { + bemit8(0xA1); // movl 0, %eax + } else { + bemit8(0x8B); // movl 0, %reg + bemit8(MOD_IND | ENC_REG(reg_gp_map[out->index]) | ENC_RM(0x05)); + } + bemit32(0); +} + +/** + * Emit a Lea. 
 *
 * Emits opcode 0x8D with the node's output register 0 in the REG field and
 * the node's address mode as memory operand.
 */
static void bemit_lea(const ir_node *node)
{
	const arch_register_t *out = get_out_reg(node, 0);
	bemit8(0x8D);
	bemit_mod_am(reg_gp_map[out->index], node);
}

/* helper function for bemit_minus64bit */
static void bemit_helper_mov(const arch_register_t *src, const arch_register_t *dst)
{
	bemit8(0x8B); // movl %src, %dst
	bemit_modrr(src, dst);
}

/* helper function for bemit_minus64bit */
static void bemit_helper_neg(const arch_register_t *reg)
{
	bemit8(0xF7); // negl %reg
	bemit_modru(reg, 3);
}

/* helper function for bemit_minus64bit */
static void bemit_helper_sbb0(const arch_register_t *reg)
{
	bemit8(0x83); // sbbl $0, %reg
	bemit_modru(reg, 3);
	bemit8(0);
}

/* helper function for bemit_minus64bit */
static void bemit_helper_sbb(const arch_register_t *src, const arch_register_t *dst)
{
	bemit8(0x1B); // sbbl %src, %dst
	bemit_modrr(src, dst);
}

/* helper function for bemit_minus64bit */
static void bemit_helper_xchg(const arch_register_t *src, const arch_register_t *dst)
{
	if (src->index == REG_EAX) {
		bemit8(0x90 + reg_gp_map[dst->index]); // xchgl %eax, %dst
	} else if (dst->index == REG_EAX) {
		bemit8(0x90 + reg_gp_map[src->index]); // xchgl %src, %eax
	} else {
		bemit8(0x87); // xchgl %src, %dst
		bemit_modrr(src, dst);
	}
}

/* helper function for bemit_minus64bit */
static void bemit_helper_zero(const arch_register_t *reg)
{
	bemit8(0x33); // xorl %reg, %reg
	bemit_modrr(reg, reg);
}

/**
 * Emit the negation of a 64bit value held in two registers (inputs 0/1 are
 * the low/high word, outputs 0/1 the low/high word of the result).
 *
 * Depending on how input and output registers overlap, the inputs are first
 * moved or exchanged and then one of two sequences is used:
 *  - normal_neg: both words already are in the output registers:
 *                neg hi; neg lo; sbb $0, hi
 *  - zero_neg:   the high input is still in in_hi, which is not out_hi:
 *                xor hi, hi; neg lo; sbb in_hi, hi
 *
 * In the case comments a/b name the registers of the low/high input and
 * "x -> y" means that the word in register x has to end up in register y.
 */
static void bemit_minus64bit(const ir_node *node)
{
	const arch_register_t *in_lo  = get_in_reg(node, 0);
	const arch_register_t *in_hi  = get_in_reg(node, 1);
	const arch_register_t *out_lo = get_out_reg(node, 0);
	const arch_register_t *out_hi = get_out_reg(node, 1);

	if (out_lo == in_lo) {
		if (out_hi != in_hi) {
			/* a -> a, b -> d */
			goto zero_neg;
		} else {
			/* a -> a, b -> b */
			goto normal_neg;
		}
	} else if (out_lo == in_hi) {
		if (out_hi == in_lo) {
			/* a -> b, b -> a */
			bemit_helper_xchg(in_lo, in_hi);
			goto normal_neg;
		} else {
			/* a -> b, b -> d */
			/* the high word has to be saved first, as the second mov
			 * overwrites in_hi (== out_lo) */
			bemit_helper_mov(in_hi, out_hi);
			bemit_helper_mov(in_lo, out_lo);
			goto normal_neg;
		}
	} else {
		if (out_hi == in_lo) {
			/* a -> c, b -> a */
			bemit_helper_mov(in_lo, out_lo);
			goto zero_neg;
		} else if (out_hi == in_hi) {
			/* a -> c, b -> b */
			bemit_helper_mov(in_lo, out_lo);
			goto normal_neg;
		} else {
			/* a -> c, b -> d */
			bemit_helper_mov(in_lo, out_lo);
			goto zero_neg;
		}
	}

normal_neg:
	bemit_helper_neg( out_hi);
	bemit_helper_neg( out_lo);
	bemit_helper_sbb0(out_hi);
	return;

zero_neg:
	bemit_helper_zero(out_hi);
	bemit_helper_neg( out_lo);
	bemit_helper_sbb( in_hi, out_hi);
}

/**
 * Emit a single opcode.
 *
 * Creates a function bemit_<op> which ignores its node and emits the single
 * byte @p code.
 */
#define EMIT_SINGLEOP(op, code)                 \
static void bemit_ ## op(const ir_node *node) { \
	(void) node;                                \
	bemit8(code);                               \
}

//EMIT_SINGLEOP(daa,  0x27)
//EMIT_SINGLEOP(das,  0x2F)
//EMIT_SINGLEOP(aaa,  0x37)
//EMIT_SINGLEOP(aas,  0x3F)
//EMIT_SINGLEOP(nop,  0x90)
EMIT_SINGLEOP(cwtl,  0x98)
EMIT_SINGLEOP(cltd,  0x99)
//EMIT_SINGLEOP(fwait, 0x9B)
EMIT_SINGLEOP(sahf,  0x9E)
//EMIT_SINGLEOP(popf, 0x9D)
EMIT_SINGLEOP(leave, 0xC9)
EMIT_SINGLEOP(int3,  0xCC)
//EMIT_SINGLEOP(iret, 0xCF)
//EMIT_SINGLEOP(xlat, 0xD7)
//EMIT_SINGLEOP(lock, 0xF0)
EMIT_SINGLEOP(rep,   0xF3)
//EMIT_SINGLEOP(halt, 0xF4)
EMIT_SINGLEOP(cmc,   0xF5)
EMIT_SINGLEOP(stc,   0xF9)
//EMIT_SINGLEOP(cli,  0xFA)
//EMIT_SINGLEOP(sti,  0xFB)
//EMIT_SINGLEOP(std,  0xFD)

/**
 * Emits a MOV out, [MEM].
 *
 * The destination is the node's output register 0. If it is EAX and the
 * address has neither base nor index register, the short form 0xA1 with a
 * 32bit address is used, otherwise 0x8B with an address mode.
 *
 * NOTE(review): the short form passes 0 as entity sign to bemit_entity(),
 * while bemit_mod_am() passes is_ia32_am_sc_sign(node) -- confirm that a
 * negated entity cannot occur here.
 */
static void bemit_load(const ir_node *node)
{
	const arch_register_t *out = get_out_reg(node, 0);

	if (out->index == REG_EAX) {
		ir_node   *base      = get_irn_n(node, n_ia32_base);
		int        has_base  = !is_ia32_NoReg_GP(base);
		ir_node   *index     = get_irn_n(node, n_ia32_index);
		int        has_index = !is_ia32_NoReg_GP(index);
		if (!has_base && !has_index) {
			ir_entity *ent  = get_ia32_am_sc(node);
			int        offs = get_ia32_am_offs_int(node);
			/* load from constant address to EAX can be encoded
			   as 0xA1 [offset] */
			bemit8(0xA1);
			bemit_entity(ent, 0, offs, false);
			return;
		}
	}
	bemit8(0x8B);
	bemit_mod_am(reg_gp_map[out->index], node);
}

/**
 * Emits a MOV [mem], in.
 *
 * The operand size (8, 16 or 32 bit) is taken from the node's ls_mode; 16bit
 * forms get a 0x66 prefix. The value is either an immediate (0xC6/0xC7 with
 * opcode extension 0) or a register (0x88/0x89, or the short forms 0xA2/0xA3
 * for EAX and an address without base and index register).
 *
 * NOTE(review): as in bemit_load(), the short form passes 0 as entity sign
 * to bemit_entity() -- confirm.
 */
static void bemit_store(const ir_node *node)
{
	const ir_node *value = get_irn_n(node, n_ia32_Store_val);
	unsigned       size  = get_mode_size_bits(get_ia32_ls_mode(node));

	if (is_ia32_Immediate(value)) {
		if (size == 8) {
			bemit8(0xC6);
			bemit_mod_am(0, node);
			bemit8(get_ia32_immediate_attr_const(value)->offset);
		} else if (size == 16) {
			bemit8(0x66);
			bemit8(0xC7);
			bemit_mod_am(0, node);
			bemit16(get_ia32_immediate_attr_const(value)->offset);
		} else {
			bemit8(0xC7);
			bemit_mod_am(0, node);
			bemit_immediate(value, false);
		}
	} else {
		const arch_register_t *in = get_in_reg(node, n_ia32_Store_val);

		if (in->index == REG_EAX) {
			ir_node   *base      = get_irn_n(node, n_ia32_base);
			int        has_base  = !is_ia32_NoReg_GP(base);
			ir_node   *index     = get_irn_n(node, n_ia32_index);
			int        has_index = !is_ia32_NoReg_GP(index);
			if (!has_base && !has_index) {
				ir_entity *ent  = get_ia32_am_sc(node);
				int        offs = get_ia32_am_offs_int(node);
				/* store to constant address from EAX can be encoded as
				 * 0xA2/0xA3 [offset]*/
				if (size == 8) {
					bemit8(0xA2);
				} else {
					if (size == 16)
						bemit8(0x66);
					bemit8(0xA3);
				}
				bemit_entity(ent, 0, offs, false);
				return;
			}
		}

		if (size == 8) {
			bemit8(0x88);
		} else {
			if (size == 16)
				bemit8(0x66);
			bemit8(0x89);
		}
		bemit_mod_am(reg_gp_map[in->index], node);
	}
}

/**
 * Emit a Conv_I2I as movzx/movsx: 0x0F followed by an opcode selected by the
 * signedness and size of the node's ls_mode (see the table in the body).
 */
static void bemit_conv_i2i(const ir_node *node)
{
	ir_mode  *smaller_mode = get_ia32_ls_mode(node);
	unsigned  opcode;

	bemit8(0x0F);
	/*        8 16 bit source
	 * movzx B6 B7
	 * movsx BE BF
	 */
	opcode = 0xB6;
	if (mode_is_signed(smaller_mode))           opcode |= 0x08;
	if (get_mode_size_bits(smaller_mode) == 16) opcode |= 0x01;
	bemit_unop_reg(node, opcode, n_ia32_Conv_I2I_val);
}

/**
 * Emit a Push.
 *
 * The pushed value is either an immediate (0x6A with imm8 or 0x68 with
 * imm32), a memory operand if the value input is the NoReg node (0xFF with
 * opcode extension 6), or a register (0x50+reg).
 */
static void bemit_push(const ir_node *node)
{
	const ir_node *value = get_irn_n(node, n_ia32_Push_val);

	if (is_ia32_Immediate(value)) {
		const ia32_immediate_attr_t *attr
			= get_ia32_immediate_attr_const(value);
		unsigned size = get_signed_imm_size(attr->offset);
		/* symbolic constants always need the full 32bit */
		if (attr->symconst)
			size = 4;
		switch (size) {
		case 1:
			bemit8(0x6A);
			bemit8((unsigned char)attr->offset);
			break;
		case 2:
		case 4:
			bemit8(0x68);
			bemit_immediate(value, false);
			break;
		}
	} else if (is_ia32_NoReg_GP(value)) {
		bemit8(0xFF);
		bemit_mod_am(6, node);
	} else {
		const arch_register_t *reg = get_in_reg(node, n_ia32_Push_val);
		bemit8(0x50 + reg_gp_map[reg->index]);
	}
}

/**
 * Emit a Pop.
+ */ +static void bemit_pop(const ir_node *node) +{ + const arch_register_t *reg = get_out_reg(node, pn_ia32_Pop_res); + bemit8(0x58 + reg_gp_map[reg->index]); +} + +static void bemit_popmem(const ir_node *node) +{ + bemit8(0x8F); + bemit_mod_am(0, node); +} + +static void bemit_call(const ir_node *node) +{ + ir_node *proc = get_irn_n(node, n_ia32_Call_addr); + + if (is_ia32_Immediate(proc)) { + bemit8(0xE8); + bemit_immediate(proc, true); + } else { + bemit_unop(node, 0xFF, 2, n_ia32_Call_addr); + } +} + +static void bemit_jmp(const ir_node *dest_block) +{ + bemit8(0xE9); + bemit_jmp_destination(dest_block); +} + +static void bemit_jump(const ir_node *node) +{ + if (can_be_fallthrough(node)) + return; + + bemit_jmp(get_cfop_target_block(node)); +} + +static void bemit_jcc(int pnc, const ir_node *dest_block) +{ + unsigned char cc = pnc2cc(pnc); + bemit8(0x0F); + bemit8(0x80 + cc); + bemit_jmp_destination(dest_block); +} + +static void bemit_jp(bool odd, const ir_node *dest_block) +{ + bemit8(0x0F); + bemit8(0x8A + odd); + bemit_jmp_destination(dest_block); +} + +static void bemit_ia32_jcc(const ir_node *node) +{ + int pnc = get_ia32_condcode(node); + const ir_node *proj_true; + const ir_node *proj_false; + const ir_node *dest_true; + const ir_node *dest_false; + const ir_node *block; + + pnc = determine_final_pnc(node, 0, pnc); + + /* get both Projs */ + proj_true = get_proj(node, pn_ia32_Jcc_true); + assert(proj_true && "Jcc without true Proj"); + + proj_false = get_proj(node, pn_ia32_Jcc_false); + assert(proj_false && "Jcc without false Proj"); + + block = get_nodes_block(node); + + if (can_be_fallthrough(proj_true)) { + /* exchange both proj's so the second one can be omitted */ + const ir_node *t = proj_true; + + proj_true = proj_false; + proj_false = t; + pnc = ia32_get_negated_pnc(pnc); + } + + dest_true = get_cfop_target_block(proj_true); + dest_false = get_cfop_target_block(proj_false); + + if (pnc & ia32_pn_Cmp_float) { + /* Some floating point comparisons 
require a test of the parity flag, + * which indicates that the result is unordered */ + switch (pnc & 15) { + case pn_Cmp_Uo: { + bemit_jp(false, dest_true); + break; + } + + case pn_Cmp_Leg: + bemit_jp(true, dest_true); + break; + + case pn_Cmp_Eq: + case pn_Cmp_Lt: + case pn_Cmp_Le: + /* we need a local label if the false proj is a fallthrough + * as the falseblock might have no label emitted then */ + if (can_be_fallthrough(proj_false)) { + bemit8(0x7A); + bemit8(0x06); // jp + 6 + } else { + bemit_jp(false, dest_false); + } + goto emit_jcc; + + case pn_Cmp_Ug: + case pn_Cmp_Uge: + case pn_Cmp_Ne: + bemit_jp(false, dest_true); + goto emit_jcc; + + default: + goto emit_jcc; + } + } else { +emit_jcc: + bemit_jcc(pnc, dest_true); + } + + /* the second Proj might be a fallthrough */ + if (can_be_fallthrough(proj_false)) { + /* it's a fallthrough */ + } else { + bemit_jmp(dest_false); + } +} + +static void bemit_switchjmp(const ir_node *node) +{ + unsigned long interval; + int last_value; + int i; + jmp_tbl_t tbl; + const arch_register_t *in; + + /* fill the table structure */ + generate_jump_table(&tbl, node); + + /* two-complement's magic make this work without overflow */ + interval = tbl.max_value - tbl.min_value; + + in = get_in_reg(node, 0); + /* emit the table */ + if (get_signed_imm_size(interval) == 1) { + bemit8(0x83); // cmpl $imm8, %in + bemit_modru(in, 7); + bemit8(interval); + } else { + bemit8(0x81); // cmpl $imm32, %in + bemit_modru(in, 7); + bemit32(interval); + } + bemit8(0x0F); // ja tbl.defProj + bemit8(0x87); + ia32_emitf(tbl.defProj, ".long %L - . 
- 4\n"); + + if (tbl.num_branches > 1) { + /* create table */ + bemit8(0xFF); // jmp *tbl.label(,%in,4) + bemit8(MOD_IND | ENC_REG(4) | ENC_RM(0x04)); + bemit8(ENC_SIB(2, reg_gp_map[in->index], 0x05)); + be_emit_irprintf("\t.long %s\n", tbl.label); + + be_gas_emit_switch_section(GAS_SECTION_RODATA); + be_emit_cstring(".align 4\n"); + be_emit_irprintf("%s:\n", tbl.label); + + last_value = tbl.branches[0].value; + for (i = 0; i != tbl.num_branches; ++i) { + while (last_value != tbl.branches[i].value) { + ia32_emitf(tbl.defProj, ".long %L\n"); + ++last_value; + } + ia32_emitf(tbl.branches[i].target, ".long %L\n"); + ++last_value; + } + be_gas_emit_switch_section(GAS_SECTION_TEXT); + } else { + /* one jump is enough */ + panic("switch only has one case"); + //ia32_emitf(tbl.branches[0].target, "\tjmp %L\n"); + } + + be_emit_write_line(); + + free(tbl.branches); +} + +/** + * Emits a return. + */ +static void bemit_return(const ir_node *node) +{ + unsigned pop = be_Return_get_pop(node); + if (pop > 0 || be_Return_get_emit_pop(node)) { + bemit8(0xC2); + assert(pop <= 0xffff); + bemit16(pop); + } else { + bemit8(0xC3); + } +} + +static void bemit_subsp(const ir_node *node) +{ + const arch_register_t *out; + /* sub %in, %esp */ + bemit_sub(node); + /* mov %esp, %out */ + bemit8(0x8B); + out = get_out_reg(node, 1); + bemit8(MOD_REG | ENC_REG(reg_gp_map[out->index]) | ENC_RM(0x04)); +} + +static void bemit_incsp(const ir_node *node) +{ + int offs; + const arch_register_t *reg; + unsigned size; + unsigned ext; + + offs = be_get_IncSP_offset(node); + if (offs == 0) + return; + + if (offs > 0) { + ext = 5; /* sub */ + } else { + ext = 0; /* add */ + offs = -offs; + } + + size = get_signed_imm_size(offs); + bemit8(size == 1 ? 
0x83 : 0x81); + + reg = get_out_reg(node, 0); + bemit_modru(reg, ext); + + if (size == 1) { + bemit8(offs); + } else { + bemit32(offs); + } +} + +static void bemit_copybi(const ir_node *node) +{ + unsigned size = get_ia32_copyb_size(node); + if (size & 1) + bemit8(0xA4); // movsb + if (size & 2) { + bemit8(0x66); + bemit8(0xA5); // movsw + } + size >>= 2; + while (size--) { + bemit8(0xA5); // movsl + } +} + +static void bemit_fbinop(const ir_node *node, unsigned code, unsigned code_to) +{ + if (get_ia32_op_type(node) == ia32_Normal) { + const ia32_x87_attr_t *x87_attr = get_ia32_x87_attr_const(node); + const arch_register_t *in1 = x87_attr->x87[0]; + const arch_register_t *in = x87_attr->x87[1]; + const arch_register_t *out = x87_attr->x87[2]; + + if (out == NULL) { + out = in1; + } else if (out == in) { + in = in1; + } + + if (out->index == 0) { + bemit8(0xD8); + bemit8(MOD_REG | ENC_REG(code) | ENC_RM(in->index)); + } else { + bemit8(0xDC); + bemit8(MOD_REG | ENC_REG(code_to) | ENC_RM(out->index)); + } + } else { + if (get_mode_size_bits(get_ia32_ls_mode(node)) == 32) { + bemit8(0xD8); + } else { + bemit8(0xDC); + } + bemit_mod_am(code, node); + } +} + +static void bemit_fbinopp(const ir_node *node, unsigned const code) +{ + const ia32_x87_attr_t *x87_attr = get_ia32_x87_attr_const(node); + const arch_register_t *out = x87_attr->x87[2]; + bemit8(0xDE); + bemit8(code + out->index); +} + +static void bemit_fabs(const ir_node *node) +{ + (void)node; + + bemit8(0xD9); + bemit8(0xE1); +} + +static void bemit_fadd(const ir_node *node) +{ + bemit_fbinop(node, 0, 0); +} + +static void bemit_faddp(const ir_node *node) +{ + bemit_fbinopp(node, 0xC0); +} + +static void bemit_fchs(const ir_node *node) +{ + (void)node; + + bemit8(0xD9); + bemit8(0xE0); +} + +static void bemit_fdiv(const ir_node *node) +{ + bemit_fbinop(node, 6, 7); +} + +static void bemit_fdivp(const ir_node *node) +{ + bemit_fbinopp(node, 0xF8); +} + +static void bemit_fdivr(const ir_node *node) +{ + 
bemit_fbinop(node, 7, 6); +} + +static void bemit_fdivrp(const ir_node *node) +{ + bemit_fbinopp(node, 0xF0); +} + +static void bemit_fild(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 16: + bemit8(0xDF); // filds + bemit_mod_am(0, node); + return; + + case 32: + bemit8(0xDB); // fildl + bemit_mod_am(0, node); + return; + + case 64: + bemit8(0xDF); // fildll + bemit_mod_am(5, node); + return; + + default: + panic("invalid mode size"); + } +} + +static void bemit_fist(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 16: + bemit8(0xDF); // fists + break; + + case 32: + bemit8(0xDB); // fistl + break; + + default: + panic("invalid mode size"); + } + bemit_mod_am(2, node); +} + +static void bemit_fistp(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 16: + bemit8(0xDF); // fistps + bemit_mod_am(3, node); + return; + + case 32: + bemit8(0xDB); // fistpl + bemit_mod_am(3, node); + return; + + case 64: + bemit8(0xDF); // fistpll + bemit_mod_am(7, node); + return; + + default: + panic("invalid mode size"); + } +} + +static void bemit_fld(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 32: + bemit8(0xD9); // flds + bemit_mod_am(0, node); + return; + + case 64: + bemit8(0xDD); // fldl + bemit_mod_am(0, node); + return; + + case 80: + case 96: + bemit8(0xDB); // fldt + bemit_mod_am(5, node); + return; + + default: + panic("invalid mode size"); + } +} + +static void bemit_fld1(const ir_node *node) +{ + (void)node; + bemit8(0xD9); + bemit8(0xE8); // fld1 +} + +static void bemit_fldcw(const ir_node *node) +{ + bemit8(0xD9); // fldcw + bemit_mod_am(5, node); +} + +static void bemit_fldz(const ir_node *node) +{ + (void)node; + bemit8(0xD9); + bemit8(0xEE); // fldz +} + +static void bemit_fmul(const ir_node *node) +{ + bemit_fbinop(node, 1, 1); +} + +static void bemit_fmulp(const ir_node *node) +{ + bemit_fbinopp(node, 0xC8); +} 
+ +static void bemit_fpop(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xDD); + bemit8(0xD8 + attr->x87[0]->index); +} + +static void bemit_fpush(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xD9); + bemit8(0xC0 + attr->x87[0]->index); +} + +static void bemit_fpushcopy(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xD9); + bemit8(0xC0 + attr->x87[0]->index); +} + +static void bemit_fst(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 32: + bemit8(0xD9); // fsts + break; + + case 64: + bemit8(0xDD); // fstl + break; + + default: + panic("invalid mode size"); + } + bemit_mod_am(2, node); +} + +static void bemit_fstp(const ir_node *node) +{ + switch (get_mode_size_bits(get_ia32_ls_mode(node))) { + case 32: + bemit8(0xD9); // fstps + bemit_mod_am(3, node); + return; + + case 64: + bemit8(0xDD); // fstpl + bemit_mod_am(3, node); + return; + + case 80: + case 96: + bemit8(0xDB); // fstpt + bemit_mod_am(7, node); + return; + + default: + panic("invalid mode size"); + } +} + +static void bemit_fsub(const ir_node *node) +{ + bemit_fbinop(node, 4, 5); +} + +static void bemit_fsubp(const ir_node *node) +{ + bemit_fbinopp(node, 0xE8); +} + +static void bemit_fsubr(const ir_node *node) +{ + bemit_fbinop(node, 5, 4); +} + +static void bemit_fsubrp(const ir_node *node) +{ + bemit_fbinopp(node, 0xE0); +} + +static void bemit_fnstcw(const ir_node *node) +{ + bemit8(0xD9); // fnstcw + bemit_mod_am(7, node); +} + +static void bemit_fnstsw(void) +{ + bemit8(0xDF); // fnstsw %ax + bemit8(0xE0); +} + +static void bemit_ftstfnstsw(const ir_node *node) +{ + (void)node; + + bemit8(0xD9); // ftst + bemit8(0xE4); + bemit_fnstsw(); +} + +static void bemit_fucomi(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xDB); // fucomi + bemit8(0xE8 + 
attr->x87[1]->index); +} + +static void bemit_fucomip(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xDF); // fucomip + bemit8(0xE8 + attr->x87[1]->index); +} + +static void bemit_fucomfnstsw(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xDD); // fucom + bemit8(0xE0 + attr->x87[1]->index); + bemit_fnstsw(); +} + +static void bemit_fucompfnstsw(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xDD); // fucomp + bemit8(0xE8 + attr->x87[1]->index); + bemit_fnstsw(); +} + +static void bemit_fucomppfnstsw(const ir_node *node) +{ + (void)node; + + bemit8(0xDA); // fucompp + bemit8(0xE9); + bemit_fnstsw(); +} + +static void bemit_fxch(const ir_node *node) +{ + const ia32_x87_attr_t *attr = get_ia32_x87_attr_const(node); + bemit8(0xD9); + bemit8(0xC8 + attr->x87[0]->index); +} + +/** + * The type of a emitter function. + */ +typedef void (*emit_func) (const ir_node *); + +/** + * Set a node emitter. Make it a bit more type safe. 
+ */ +static void register_emitter(ir_op *op, emit_func func) +{ + op->ops.generic = (op_func) func; +} + +static void ia32_register_binary_emitters(void) +{ + /* first clear the generic function pointer for all ops */ + clear_irp_opcodes_generic_func(); + + /* benode emitter */ + register_emitter(op_be_Copy, bemit_copy); + register_emitter(op_be_CopyKeep, bemit_copy); + register_emitter(op_be_IncSP, bemit_incsp); + register_emitter(op_be_Perm, bemit_perm); + register_emitter(op_be_Return, bemit_return); + register_emitter(op_ia32_Adc, bemit_adc); + register_emitter(op_ia32_Add, bemit_add); + register_emitter(op_ia32_AddMem, bemit_addmem); + register_emitter(op_ia32_AddMem8Bit, bemit_addmem8bit); + register_emitter(op_ia32_And, bemit_and); + register_emitter(op_ia32_AndMem, bemit_andmem); + register_emitter(op_ia32_AndMem8Bit, bemit_andmem8bit); + register_emitter(op_ia32_Breakpoint, bemit_int3); + register_emitter(op_ia32_CMovcc, bemit_cmovcc); + register_emitter(op_ia32_Call, bemit_call); + register_emitter(op_ia32_Cltd, bemit_cltd); + register_emitter(op_ia32_Cmc, bemit_cmc); + register_emitter(op_ia32_Cmp, bemit_cmp); + register_emitter(op_ia32_Cmp8Bit, bemit_cmp8bit); + register_emitter(op_ia32_Const, bemit_mov_const); + register_emitter(op_ia32_Conv_I2I, bemit_conv_i2i); + register_emitter(op_ia32_Conv_I2I8Bit, bemit_conv_i2i); + register_emitter(op_ia32_CopyB_i, bemit_copybi); + register_emitter(op_ia32_Cwtl, bemit_cwtl); + register_emitter(op_ia32_Dec, bemit_dec); + register_emitter(op_ia32_DecMem, bemit_decmem); + register_emitter(op_ia32_Div, bemit_div); + register_emitter(op_ia32_FldCW, bemit_fldcw); + register_emitter(op_ia32_FnstCW, bemit_fnstcw); + register_emitter(op_ia32_FtstFnstsw, bemit_ftstfnstsw); + register_emitter(op_ia32_FucomFnstsw, bemit_fucomfnstsw); + register_emitter(op_ia32_Fucomi, bemit_fucomi); + register_emitter(op_ia32_FucompFnstsw, bemit_fucompfnstsw); + register_emitter(op_ia32_Fucompi, bemit_fucomip); + 
register_emitter(op_ia32_FucomppFnstsw, bemit_fucomppfnstsw); + register_emitter(op_ia32_IDiv, bemit_idiv); + register_emitter(op_ia32_IJmp, bemit_ijmp); + register_emitter(op_ia32_IMul, bemit_imul); + register_emitter(op_ia32_IMul1OP, bemit_imul1op); + register_emitter(op_ia32_Inc, bemit_inc); + register_emitter(op_ia32_IncMem, bemit_incmem); + register_emitter(op_ia32_Jcc, bemit_ia32_jcc); + register_emitter(op_ia32_Jmp, bemit_jump); + register_emitter(op_ia32_LdTls, bemit_ldtls); + register_emitter(op_ia32_Lea, bemit_lea); + register_emitter(op_ia32_Leave, bemit_leave); + register_emitter(op_ia32_Load, bemit_load); + register_emitter(op_ia32_Minus64Bit, bemit_minus64bit); + register_emitter(op_ia32_Mul, bemit_mul); + register_emitter(op_ia32_Neg, bemit_neg); + register_emitter(op_ia32_NegMem, bemit_negmem); + register_emitter(op_ia32_Not, bemit_not); + register_emitter(op_ia32_NotMem, bemit_notmem); + register_emitter(op_ia32_Or, bemit_or); + register_emitter(op_ia32_OrMem, bemit_ormem); + register_emitter(op_ia32_OrMem8Bit, bemit_ormem8bit); + register_emitter(op_ia32_Pop, bemit_pop); + register_emitter(op_ia32_PopEbp, bemit_pop); + register_emitter(op_ia32_PopMem, bemit_popmem); + register_emitter(op_ia32_Push, bemit_push); + register_emitter(op_ia32_RepPrefix, bemit_rep); + register_emitter(op_ia32_Rol, bemit_rol); + register_emitter(op_ia32_RolMem, bemit_rolmem); + register_emitter(op_ia32_Ror, bemit_ror); + register_emitter(op_ia32_RorMem, bemit_rormem); + register_emitter(op_ia32_Sahf, bemit_sahf); + register_emitter(op_ia32_Sar, bemit_sar); + register_emitter(op_ia32_SarMem, bemit_sarmem); + register_emitter(op_ia32_Sbb, bemit_sbb); + register_emitter(op_ia32_Setcc, bemit_setcc); + register_emitter(op_ia32_Shl, bemit_shl); + register_emitter(op_ia32_ShlD, bemit_shld); + register_emitter(op_ia32_ShlMem, bemit_shlmem); + register_emitter(op_ia32_Shr, bemit_shr); + register_emitter(op_ia32_ShrD, bemit_shrd); + register_emitter(op_ia32_ShrMem, bemit_shrmem); 
+ register_emitter(op_ia32_Stc, bemit_stc); + register_emitter(op_ia32_Store, bemit_store); + register_emitter(op_ia32_Store8Bit, bemit_store); + register_emitter(op_ia32_Sub, bemit_sub); + register_emitter(op_ia32_SubMem, bemit_submem); + register_emitter(op_ia32_SubMem8Bit, bemit_submem8bit); + register_emitter(op_ia32_SubSP, bemit_subsp); + register_emitter(op_ia32_SwitchJmp, bemit_switchjmp); + register_emitter(op_ia32_Test, bemit_test); + register_emitter(op_ia32_Test8Bit, bemit_test8bit); + register_emitter(op_ia32_Xor, bemit_xor); + register_emitter(op_ia32_Xor0, bemit_xor0); + register_emitter(op_ia32_XorMem, bemit_xormem); + register_emitter(op_ia32_XorMem8Bit, bemit_xormem8bit); + register_emitter(op_ia32_fabs, bemit_fabs); + register_emitter(op_ia32_fadd, bemit_fadd); + register_emitter(op_ia32_faddp, bemit_faddp); + register_emitter(op_ia32_fchs, bemit_fchs); + register_emitter(op_ia32_fdiv, bemit_fdiv); + register_emitter(op_ia32_fdivp, bemit_fdivp); + register_emitter(op_ia32_fdivr, bemit_fdivr); + register_emitter(op_ia32_fdivrp, bemit_fdivrp); + register_emitter(op_ia32_fild, bemit_fild); + register_emitter(op_ia32_fist, bemit_fist); + register_emitter(op_ia32_fistp, bemit_fistp); + register_emitter(op_ia32_fld, bemit_fld); + register_emitter(op_ia32_fld1, bemit_fld1); + register_emitter(op_ia32_fldz, bemit_fldz); + register_emitter(op_ia32_fmul, bemit_fmul); + register_emitter(op_ia32_fmulp, bemit_fmulp); + register_emitter(op_ia32_fpop, bemit_fpop); + register_emitter(op_ia32_fpush, bemit_fpush); + register_emitter(op_ia32_fpushCopy, bemit_fpushcopy); + register_emitter(op_ia32_fst, bemit_fst); + register_emitter(op_ia32_fstp, bemit_fstp); + register_emitter(op_ia32_fsub, bemit_fsub); + register_emitter(op_ia32_fsubp, bemit_fsubp); + register_emitter(op_ia32_fsubr, bemit_fsubr); + register_emitter(op_ia32_fsubrp, bemit_fsubrp); + register_emitter(op_ia32_fxch, bemit_fxch); + + /* ignore the following nodes */ + register_emitter(op_ia32_ProduceVal, 
emit_Nothing); + register_emitter(op_be_Barrier, emit_Nothing); + register_emitter(op_be_Keep, emit_Nothing); + register_emitter(op_be_Start, emit_Nothing); + register_emitter(op_Phi, emit_Nothing); + register_emitter(op_Start, emit_Nothing); +} + +static void gen_binary_block(ir_node *block) +{ + ir_node *node; + + ia32_emit_block_header(block); + + /* emit the contents of the block */ + sched_foreach(block, node) { + ia32_emit_node(node); + } +} + +void ia32_gen_binary_routine(ia32_code_gen_t *ia32_cg, ir_graph *irg) +{ + ir_entity *entity = get_irg_entity(irg); + int i, n; + + cg = ia32_cg; + isa = cg->isa; + + ia32_register_binary_emitters(); + + be_gas_emit_function_prolog(entity, ia32_cg_config.function_alignment); + + /* we use links to point to target blocks */ + ir_reserve_resources(irg, IR_RESOURCE_IRN_LINK); + irg_block_walk_graph(irg, ia32_gen_labels, NULL, NULL); + + /* initialize next block links */ + n = ARR_LEN(cg->blk_sched); + for (i = 0; i < n; ++i) { + ir_node *block = cg->blk_sched[i]; + ir_node *prev = i > 0 ? cg->blk_sched[i-1] : NULL; + + set_irn_link(block, prev); + } + + for (i = 0; i < n; ++i) { + ir_node *block = cg->blk_sched[i]; + gen_binary_block(block); + } + + be_gas_emit_function_epilog(entity); + be_dbg_method_end(); + be_emit_char('\n'); + be_emit_write_line(); + + ir_free_resources(irg, IR_RESOURCE_IRN_LINK); +} + + + + +void ia32_init_emitter(void) +{ + lc_opt_entry_t *be_grp; + lc_opt_entry_t *ia32_grp; + + be_grp = lc_opt_get_grp(firm_opt_get_root(), "be"); + ia32_grp = lc_opt_get_grp(be_grp, "ia32"); + + lc_opt_add_table(ia32_grp, ia32_emitter_options); + + build_reg_map(); + FIRM_DBG_REGISTER(dbg, "firm.be.ia32.emitter"); }