2 * Copyright (C) 1995-2007 University of Karlsruhe. All right reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief This is the main ia32 firm backend driver.
23 * @author Christian Wuerdig
26 #ifndef FIRM_BE_IA32_BEARCH_IA32_T_H
27 #define FIRM_BE_IA32_BEARCH_IA32_T_H
29 #include "firm_config.h"
33 #include "ia32_nodes_attr.h"
38 #include "../bemachine.h"
39 #include "../beemitter.h"
/*
 * Two alternative definitions of SET_IA32_ORIG_NODE.
 * NOTE(review): the #if/#else that chooses between them should enclose these
 * two lines — confirm which configuration selects the empty variant.
 */
/* Empty variant: expands to nothing, so the arguments are never evaluated. */
42 #define SET_IA32_ORIG_NODE(n, o)
/* Forwarding variant: calls set_ia32_orig_node(n, o); the expansion already ends in ';'. */
44 #define SET_IA32_ORIG_NODE(n, o) set_ia32_orig_node(n, o);
/*
 * Short names for the enum types used in this header.
 * NOTE(review): enum ia32_optimize_t is defined only after this typedef.
 * ISO C requires an enum type to be complete before its tag is used without
 * an enumerator list (GCC accepts this as an extension) — confirm that all
 * supported compilers tolerate it, or move the typedefs below the definitions.
 */
48 typedef enum ia32_optimize_t ia32_optimize_t;
49 typedef enum cpu_support cpu_support;
50 typedef enum fp_support fp_support;
53 * Bitmask for the backend optimization settings.
55 enum ia32_optimize_t {
56 IA32_OPT_INCDEC = 1 << 0, /**< optimize add/sub 1/-1 to inc/dec */
61 * Architectures. Clustered for easier macro implementation,
83 /** checks for l <= x <= h */
/*
 * Implemented as a single unsigned comparison: when x is below l, the
 * difference (x) - (l) converted to unsigned becomes a very large value and
 * the test fails, so both bounds are covered at once.
 * Only meaningful for l <= h. The argument l is expanded twice, so pass
 * expressions without side effects. The subtraction is performed in the
 * operands' own type before the cast to unsigned.
 */
84 #define _IN_RANGE(x, l, h) ((unsigned)((x) - (l)) <= (unsigned)((h) - (l)))
86 /** returns true if it's an Intel architecture, i.e. x lies in arch_i386..arch_core */
87 #define ARCH_INTEL(x) _IN_RANGE((x), arch_i386, arch_core)
89 /** returns true if it's an AMD architecture, i.e. x lies in arch_k6..arch_opteron */
90 #define ARCH_AMD(x) _IN_RANGE((x), arch_k6, arch_opteron)
92 /** returns true if it's an Athlon/Opteron, i.e. x lies in arch_athlon..arch_opteron */
93 #define ARCH_ATHLON(x) _IN_RANGE((x), arch_athlon, arch_opteron)
95 /** returns true if the CPU has MMX support, i.e. x lies in arch_pentium_mmx..arch_opteron */
96 #define ARCH_MMX(x) _IN_RANGE((x), arch_pentium_mmx, arch_opteron)
/** returns true if x lies in arch_pentium_pro..arch_core or in arch_athlon..arch_opteron */
98 #define IS_P6_ARCH(x) (_IN_RANGE((x), arch_pentium_pro, arch_core) || \
99 _IN_RANGE((x), arch_athlon, arch_opteron))
101 /** floating point support */
103 fp_none, /**< no floating point instructions are used */
104 fp_x87, /**< use x87 instructions */
105 fp_sse2 /**< use SSE2 instructions */
108 /** Returns non-zero if the current floating point architecture is SSE2; cg must point to an object with an fp_kind member. */
109 #define USE_SSE2(cg) ((cg)->fp_kind == fp_sse2)
111 /** Returns non-zero if the current floating point architecture is x87; cg must point to an object with an fp_kind member. */
112 #define USE_x87(cg) ((cg)->fp_kind == fp_x87)
/*
 * Short names for the backend structs, declared up front because the structs
 * refer to one another (ia32_code_gen_t has an ia32_isa_t pointer and
 * ia32_isa_t has an ia32_code_gen_t pointer).
 */
114 typedef struct ia32_isa_t ia32_isa_t;
115 typedef struct ia32_code_gen_t ia32_code_gen_t;
116 typedef struct ia32_irn_ops_t ia32_irn_ops_t;
117 typedef struct ia32_intrinsic_env_t ia32_intrinsic_env_t;
120 * IA32 code generator
122 struct ia32_code_gen_t {
123 const arch_code_generator_if_t *impl; /**< implementation */
124 ir_graph *irg; /**< current irg */
125 const arch_env_t *arch_env; /**< the arch env */
126 set *reg_set; /**< set to memorize registers for non-ia32 nodes (e.g. phi nodes) */
127 ia32_isa_t *isa; /**< for fast access to the isa object */
128 be_irg_t *birg; /**< the be-irg (contains additional information about the irg) */
129 ir_node **blk_sched; /**< an array containing the scheduled blocks */
130 ia32_optimize_t opt; /**< optimization settings (bitmask of ia32_optimize_t flags) */
131 int arch; /**< instruction architecture */
132 int opt_arch; /**< architecture to optimize for */
133 char fp_kind; /**< floating point kind, tested by USE_SSE2()/USE_x87(); NOTE(review): char here but int in ia32_isa_t — confirm this is intended */
134 char do_x87_sim; /**< set to 1 if x87 simulation should be enforced */
135 char dump; /**< set to 1 if graphs should be dumped */
136 ir_node *unknown_gp; /**< unique Unknown_GP node */
137 ir_node *unknown_vfp; /**< unique Unknown_VFP node */
138 ir_node *unknown_xmm; /**< unique Unknown_XMM node */
139 ir_node *noreg_gp; /**< unique NoReg_GP node */
140 ir_node *noreg_vfp; /**< unique NoReg_VFP node */
141 ir_node *noreg_xmm; /**< unique NoReg_XMM node */
143 ir_node *fpu_trunc_mode; /**< truncate fpu mode */
145 struct obstack *obst; /**< NOTE(review): undocumented obstack; its purpose is not stated here — confirm and document */
152 arch_isa_t arch_isa; /**< must be derived from arch_isa_t */
153 pmap *regs_16bit; /**< contains the 16-bit names of the gp registers */
154 pmap *regs_8bit; /**< contains the 8-bit names of the gp registers */
155 pmap *regs_8bit_high; /**< contains the high part of the 8-bit names of the gp registers */
156 pmap *types; /**< a map of modes to primitive types */
157 pmap *tv_ent; /**< a map of entities that store const tarvals */
158 ia32_optimize_t opt; /**< optimization settings (bitmask of ia32_optimize_t flags) */
159 int arch; /**< instruction architecture */
160 int opt_arch; /**< architecture to optimize for */
161 int fp_kind; /**< floating point kind */
162 ia32_code_gen_t *cg; /**< the current code generator */
163 const be_machine_t *cpu; /**< the abstract machine */
165 struct obstack *name_obst; /**< holds the original node names (for debugging) */
169 struct ia32_irn_ops_t {
170 const arch_irn_ops_if_t *impl; /**< implementation (same role as the impl member of ia32_code_gen_t — NOTE(review): confirm) */
175 * A helper type collecting needed info for IA32 intrinsic lowering.
177 struct ia32_intrinsic_env_t {
178 ia32_isa_t *isa; /**< the isa object */
179 ir_graph *irg; /**< the irg these entities belong to */
180 ir_entity *ll_div_op1; /**< entity for the first div operand (move into FPU) */
181 ir_entity *ll_div_op2; /**< entity for the second div operand (move into FPU) */
182 ir_entity *ll_d_conv; /**< entity for conversions ll -> d */
183 ir_entity *d_ll_conv; /**< entity for conversions d -> ll */
184 ir_entity *divdi3; /**< entity for the __divdi3 library call */
185 ir_entity *moddi3; /**< entity for the __moddi3 library call */
186 ir_entity *udivdi3; /**< entity for the __udivdi3 library call */
187 ir_entity *umoddi3; /**< entity for the __umoddi3 library call */
188 tarval *u64_bias; /**< bias value for conversion from float to unsigned 64 */
191 /** The mode for the floating point control word. */
192 extern ir_mode *mode_fpcw;
194 /** The current code generator. */
195 extern ia32_code_gen_t *ia32_current_cg;
198 * Returns the unique per irg GP NoReg node.
200 ir_node *ia32_new_NoReg_gp(ia32_code_gen_t *cg);
/* NOTE(review): presumably the XMM and VFP counterparts of ia32_new_NoReg_gp,
 * matching the noreg_xmm / noreg_vfp members of ia32_code_gen_t — confirm. */
201 ir_node *ia32_new_NoReg_xmm(ia32_code_gen_t *cg);
202 ir_node *ia32_new_NoReg_vfp(ia32_code_gen_t *cg);
205 * Returns the unique per irg GP Unknown node.
206 * (warning: cse has to be activated)
208 ir_node *ia32_new_Unknown_gp(ia32_code_gen_t *cg);
/* NOTE(review): presumably the XMM and VFP counterparts of ia32_new_Unknown_gp,
 * matching the unknown_xmm / unknown_vfp members of ia32_code_gen_t — confirm. */
209 ir_node *ia32_new_Unknown_xmm(ia32_code_gen_t *cg);
210 ir_node *ia32_new_Unknown_vfp(ia32_code_gen_t *cg);
213 * Returns the unique per irg FP NoReg node.
/* NOTE(review): which floating point NoReg node (vfp or xmm) is returned is
 * not stated here; presumably it depends on the fp_kind of cg — confirm. */
215 ir_node *ia32_new_NoReg_fp(ia32_code_gen_t *cg);
218 * Returns the unique per irg FPU truncation mode node.
220 ir_node *ia32_new_Fpu_truncate(ia32_code_gen_t *cg);
223 * Returns gp_noreg or fp_noreg, depending on input requirements.
225 ir_node *ia32_get_admissible_noreg(ia32_code_gen_t *cg, ir_node *irn, int pos);
228 * Maps all intrinsic calls that the backend supports
229 * and maps all instructions the backend does not support
232 void ia32_handle_intrinsics(void);
235 * Ia32 implementation.
237 * @param method the method type of the emulation function entity
238 * @param op the emulated ir_op
239 * @param imode the input mode of the emulated opcode
240 * @param omode the output mode of the emulated opcode
241 * @param context the context parameter
243 ir_entity *ia32_create_intrinsic_fkt(ir_type *method, const ir_op *op,
244 const ir_mode *imode, const ir_mode *omode,