2 * Copyright (C) 1995-2007 University of Karlsruhe. All rights reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief This is the main ia32 firm backend driver.
23 * @author Christian Wuerdig
26 #ifndef FIRM_BE_IA32_BEARCH_IA32_T_H
27 #define FIRM_BE_IA32_BEARCH_IA32_T_H
29 #include "firm_config.h"
33 #include "ia32_nodes_attr.h"
38 #include "../bemachine.h"
39 #include "../beemitter.h"
/*
 * SET_IA32_ORIG_NODE(n, o): either expands to nothing or forwards its
 * arguments to set_ia32_orig_node(n, o).
 *
 * NOTE(review): two definitions of the same macro appear back to back here;
 * the conditional-compilation directives that presumably select exactly one
 * of them are not visible in this excerpt -- confirm against the full header.
 *
 * NOTE(review): the non-empty variant already ends in ';', so a call site
 * written with its own semicolon expands to an additional empty statement,
 * which is a hazard inside an unbraced if/else.
 */
42 #define SET_IA32_ORIG_NODE(n, o)
44 #define SET_IA32_ORIG_NODE(n, o) set_ia32_orig_node(n, o);
/*
 * Shorthand names for the backend enum types.
 *
 * NOTE(review): ia32_optimize_t is named here before `enum ia32_optimize_t`
 * is defined further down. ISO C does not permit forward references to enum
 * types; common compilers accept them as an extension -- confirm this is
 * acceptable for all supported toolchains.
 */
typedef enum ia32_optimize_t ia32_optimize_t;
typedef enum cpu_support     cpu_support;
typedef enum fp_support      fp_support;
/*
 * NOTE(review): only the first enumerator of this enum is visible in this
 * excerpt; any further enumerators and the closing brace are not shown.
 * Each value is a single bit (1 << n) so that settings can be OR-ed together.
 */
53 * Bitmask for the backend optimization settings.
55 enum ia32_optimize_t {
56 IA32_OPT_INCDEC = 1 << 0, /**< optimize add/sub 1/-1 to inc/dec */
/*
 * NOTE(review): the enum header and closing brace are not visible in this
 * excerpt; the cpu_support typedef suggests these are the enumerators of
 * `enum cpu_support` -- confirm.
 *
 * The range macros (ARCH_INTEL, ARCH_AMD, ARCH_ATHLON, ARCH_MMX, IS_P6_ARCH)
 * compare against the first and last enumerator of a cluster, so the order
 * of the entries below is significant.
 *
 * NOTE(review): ARCH_AMD() refers to arch_k6, which is not among the
 * enumerators visible here -- confirm it is declared in the full header.
 */
61 * Architectures. Clustered for easier macro implementation,
65 arch_i386, /**< i386 */
66 arch_i486, /**< i486 */
67 arch_pentium, /**< Pentium */
68 arch_pentium_pro, /**< Pentium Pro */
69 arch_pentium_mmx, /**< Pentium MMX */
70 arch_pentium_2, /**< Pentium II */
71 arch_pentium_3, /**< Pentium III */
72 arch_pentium_4, /**< Pentium IV */
73 arch_pentium_m, /**< Pentium M */
74 arch_core, /**< Core */
76 arch_athlon, /**< Athlon */
77 arch_athlon_64, /**< Athlon64 */
78 arch_opteron, /**< Opteron */
79 arch_generic /**< generic */
/**
 * Checks for l <= x <= h using a single unsigned comparison.
 *
 * Subtracting l moves the interval so that it starts at 0; a value below l
 * then wraps around to a large unsigned number and fails the comparison too.
 * l is evaluated twice, so the arguments must be free of side effects, and
 * the result is only meaningful when l <= h.
 */
#define _IN_RANGE(x, l, h) ((unsigned)((x) - (l)) <= (unsigned)((h) - (l)))
/** Returns true if x is an Intel architecture (arch_i386 through arch_core). */
#define ARCH_INTEL(x) _IN_RANGE((x), arch_i386, arch_core)
/**
 * Returns true if x is an AMD architecture (arch_k6 through arch_opteron).
 * Relies on arch_k6 being declared before arch_opteron in the architecture
 * enum.
 */
#define ARCH_AMD(x) _IN_RANGE((x), arch_k6, arch_opteron)
/** Returns true if x is an Athlon/Opteron (arch_athlon through arch_opteron). */
#define ARCH_ATHLON(x) _IN_RANGE((x), arch_athlon, arch_opteron)
/**
 * Returns true if the CPU has MMX support, i.e. x lies in
 * arch_pentium_mmx through arch_opteron.
 */
#define ARCH_MMX(x) _IN_RANGE((x), arch_pentium_mmx, arch_opteron)
/**
 * Returns true if x lies in arch_pentium_pro through arch_core or in
 * arch_athlon through arch_opteron. x is evaluated more than once.
 */
#define IS_P6_ARCH(x) (_IN_RANGE((x), arch_pentium_pro, arch_core) || \
                       _IN_RANGE((x), arch_athlon, arch_opteron))
/*
 * NOTE(review): the enum header and closing brace are not visible in this
 * excerpt; the fp_support typedef suggests these are the enumerators of
 * `enum fp_support` -- confirm.
 * fp_sse2 and fp_x87 are the values tested by USE_SSE2() and USE_x87().
 */
100 /** floating point support */
102 fp_none, /**< no floating point instructions are used */
103 fp_x87, /**< use x87 instructions */
104 fp_sse2 /**< use SSE2 instructions */
/**
 * Returns non-zero if the current floating point architecture is SSE2.
 * cg must point to an object with an fp_kind member.
 */
#define USE_SSE2(cg) ((cg)->fp_kind == fp_sse2)
/**
 * Returns non-zero if the current floating point architecture is x87.
 * cg must point to an object with an fp_kind member.
 */
#define USE_x87(cg) ((cg)->fp_kind == fp_x87)
/* Forward declarations so the backend structs can refer to each other by pointer. */
typedef struct ia32_isa_t           ia32_isa_t;
typedef struct ia32_code_gen_t      ia32_code_gen_t;
typedef struct ia32_irn_ops_t       ia32_irn_ops_t;
typedef struct ia32_intrinsic_env_t ia32_intrinsic_env_t;
/*
 * Per-graph state of the ia32 code generator.
 *
 * NOTE(review): the closing brace of this struct is not visible in this
 * excerpt.
 * NOTE(review): fp_kind is a char here but an int in the ISA member list
 * further down, and opt/arch/opt_arch appear in both places -- confirm the
 * two copies are meant to stay in sync.
 */
119 * IA32 code generator
121 struct ia32_code_gen_t {
122 const arch_code_generator_if_t *impl; /**< implementation */
123 ir_graph *irg; /**< current irg */
124 const arch_env_t *arch_env; /**< the arch env */
125 set *reg_set; /**< set to memorize registers for non-ia32 nodes (e.g. phi nodes) */
126 ia32_isa_t *isa; /**< for fast access to the isa object */
127 be_irg_t *birg; /**< The be-irg (contains additional information about the irg) */
128 ir_node **blk_sched; /**< an array containing the scheduled blocks */
129 ia32_optimize_t opt; /**< contains optimization information */
130 int arch; /**< instruction architecture */
131 int opt_arch; /**< optimize for architecture */
132 char fp_kind; /**< floating point kind */
133 char do_x87_sim; /**< set to 1 if x87 simulation should be enforced */
134 char dump; /**< set to 1 if graphs should be dumped */
135 ir_node *unknown_gp; /**< unique Unknown_GP node */
136 ir_node *unknown_vfp; /**< unique Unknown_VFP node */
137 ir_node *unknown_xmm; /**< unique Unknown_XMM node */
138 ir_node *noreg_gp; /**< unique NoReg_GP node */
139 ir_node *noreg_vfp; /**< unique NoReg_VFP node */
140 ir_node *noreg_xmm; /**< unique NoReg_XMM node */
142 ir_node *fpu_trunc_mode; /**< truncate fpu mode */
144 struct obstack *obst; /**< NOTE(review): purpose not documented in the original -- confirm */
/*
 * NOTE(review): the struct header and closing brace are not visible in this
 * excerpt; the ia32_isa_t typedef and the first member's comment suggest
 * these are the members of `struct ia32_isa_t` -- confirm.
 */
151 arch_isa_t arch_isa; /**< must be derived from arch_isa_t */
152 pmap *regs_16bit; /**< Contains the 16-bit names of the gp registers */
153 pmap *regs_8bit; /**< Contains the 8-bit names of the gp registers */
154 pmap *regs_8bit_high; /**< Contains the high-part 8-bit names of the gp registers */
155 pmap *types; /**< A map of modes to primitive types */
156 pmap *tv_ent; /**< A map of entities that store const tarvals */
157 ia32_optimize_t opt; /**< contains optimization information */
158 int arch; /**< instruction architecture */
159 int opt_arch; /**< optimize for architecture */
160 int fp_kind; /**< floating point kind */
161 ia32_code_gen_t *cg; /**< the current code generator */
162 const be_machine_t *cpu; /**< the abstract machine */
164 struct obstack *name_obst; /**< holds the original node names (for debugging) */
/*
 * Node-operations object of the ia32 backend.
 * NOTE(review): only the first member is visible in this excerpt; any
 * further members and the closing brace are not shown.
 */
168 struct ia32_irn_ops_t {
169 const arch_irn_ops_if_t *impl; /* the arch_irn_ops_if_t interface this object refers to */
/*
 * NOTE(review): the closing brace of this struct is not visible in this
 * excerpt.
 */
174 * A helper type collecting needed info for IA32 intrinsic lowering.
176 struct ia32_intrinsic_env_t {
177 ia32_isa_t *isa; /**< the isa object */
178 ir_graph *irg; /**< the irg, these entities belong to */
179 ir_entity *ll_div_op1; /**< entity for first div operand (move into FPU) */
180 ir_entity *ll_div_op2; /**< entity for second div operand (move into FPU) */
181 ir_entity *ll_d_conv; /**< entity for converts ll -> d */
182 ir_entity *d_ll_conv; /**< entity for converts d -> ll */
183 ir_entity *divdi3; /**< entity for __divdi3 library call */
184 ir_entity *moddi3; /**< entity for __moddi3 library call */
185 ir_entity *udivdi3; /**< entity for __udivdi3 library call */
186 ir_entity *umoddi3; /**< entity for __umoddi3 library call */
187 tarval *u64_bias; /**< bias value for conversion from float to unsigned 64 */
190 /** The mode for the floating point control word. */
191 extern ir_mode *mode_fpcw;
193 /** The current code generator. */
194 extern ia32_code_gen_t *ia32_current_cg;
197 * Returns the unique per irg GP NoReg node.
199 ir_node *ia32_new_NoReg_gp(ia32_code_gen_t *cg);
200 ir_node *ia32_new_NoReg_xmm(ia32_code_gen_t *cg);
201 ir_node *ia32_new_NoReg_vfp(ia32_code_gen_t *cg);
204 * Returns the uniqure per irg GP Unknown node.
205 * (warning: cse has to be activated)
207 ir_node *ia32_new_Unknown_gp(ia32_code_gen_t *cg);
208 ir_node *ia32_new_Unknown_xmm(ia32_code_gen_t *cg);
209 ir_node *ia32_new_Unknown_vfp(ia32_code_gen_t *cg);
212 * Returns the unique per irg FP NoReg node.
214 ir_node *ia32_new_NoReg_fp(ia32_code_gen_t *cg);
217 * Returns the unique per irg FPU truncation mode node.
219 ir_node *ia32_new_Fpu_truncate(ia32_code_gen_t *cg);
222 * Returns gp_noreg or fp_noreg, depending on input requirements.
224 ir_node *ia32_get_admissible_noreg(ia32_code_gen_t *cg, ir_node *irn, int pos);
/**
 * Maps all intrinsic calls that the backend supports
 * and maps all instructions the backend does not support.
 *
 * NOTE(review): the original sentence appears to be cut off after
 * "did not support" in this excerpt -- restore the remainder from the full
 * header.
 */
void ia32_handle_intrinsics(void);
234 * Ia32 implementation.
236 * @param method the method type of the emulation function entity
237 * @param op the emulated ir_op
238 * @param imode the input mode of the emulated opcode
239 * @param omode the output mode of the emulated opcode
240 * @param context the context parameter
242 ir_entity *ia32_create_intrinsic_fkt(ir_type *method, const ir_op *op,
243 const ir_mode *imode, const ir_mode *omode,