2 * Copyright (C) 1995-2008 University of Karlsruhe. All right reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief code selection (transform FIRM into amd64 FIRM)
23 * @version $Id: amd64_transform.c 26673 2009-10-01 16:43:13Z matze $
28 #include "irgraph_t.h"
37 #include "../benode.h"
38 #include "../betranshlp.h"
39 #include "../beutil.h"
40 #include "bearch_amd64_t.h"
42 #include "amd64_nodes_attr.h"
43 #include "amd64_transform.h"
44 #include "amd64_new_nodes.h"
46 #include "gen_amd64_regalloc_if.h"
48 DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)
50 /* Some support functions: */
52 static inline int mode_needs_gp_reg(ir_mode *mode)
54 return mode_is_int(mode) || mode_is_reference(mode);
58 * Create a DAG constructing a given Const.
60 * @param irn a Firm const
62 static ir_node *create_const_graph(ir_node *irn, ir_node *block)
64 ir_tarval *tv = get_Const_tarval(irn);
65 ir_mode *mode = get_tarval_mode(tv);
66 dbg_info *dbgi = get_irn_dbg_info(irn);
69 if (mode_is_reference(mode)) {
70 /* AMD64 is 64bit, so we can safely convert a reference tarval into Iu */
71 assert(get_mode_size_bits(mode) == get_mode_size_bits(mode_Lu));
72 tv = tarval_convert_to(tv, mode_Lu);
75 value = get_tarval_long(tv);
76 //d// printf ("TEST GENERATE %d\n", value);
78 return new_bd_amd64_Immediate(dbgi, block, value);
81 /* Op transformers: */
84 * Transforms a Const node.
86 * @return The transformed AMD64 node.
88 static ir_node *gen_Const(ir_node *node) {
89 ir_node *block = be_transform_node(get_nodes_block(node));
90 ir_mode *mode = get_irn_mode(node);
91 ir_node *res = create_const_graph(node, block);
100 * Transforms a SymConst node.
102 * @return The transformed ARM node.
104 static ir_node *gen_SymConst(ir_node *node)
106 ir_node *block = be_transform_node(get_nodes_block(node));
107 ir_entity *entity = get_SymConst_entity(node);
108 dbg_info *dbgi = get_irn_dbg_info(node);
111 new_node = new_bd_amd64_SymConst(dbgi, block, entity);
112 be_dep_on_frame(new_node);
117 * Transforms an Add node.
119 * @return The transformed AMD64 node.
121 static ir_node *gen_Add(ir_node *node) {
122 ir_node *block = be_transform_node(get_nodes_block(node));
123 /* ir_mode *mode = get_irn_mode(node); */
124 ir_node *op1 = get_Add_left(node);
125 ir_node *op2 = get_Add_right(node);
126 dbg_info *dbgi = get_irn_dbg_info(node);
127 ir_node *new_op1 = be_transform_node(op1);
128 ir_node *new_op2 = be_transform_node(op2);
130 ir_node *res = new_bd_amd64_Add(dbgi, block, new_op1, new_op2);
131 be_dep_on_frame (res);
136 * Transforms an Sub node.
138 * @return The transformed AMD64 node.
140 static ir_node *gen_Sub(ir_node *node) {
141 ir_node *block = be_transform_node(get_nodes_block(node));
142 /* ir_mode *mode = get_irn_mode(node); */
143 ir_node *op1 = get_Sub_left(node);
144 ir_node *op2 = get_Sub_right(node);
145 dbg_info *dbgi = get_irn_dbg_info(node);
146 ir_node *new_op1 = be_transform_node(op1);
147 ir_node *new_op2 = be_transform_node(op2);
149 ir_node *res = new_bd_amd64_Sub(dbgi, block, new_op1, new_op2);
150 be_dep_on_frame (res);
154 static ir_node *gen_Mul(ir_node *node) {
155 ir_node *block = be_transform_node(get_nodes_block(node));
156 /* ir_mode *mode = get_irn_mode(node); */
157 ir_node *op1 = get_Mul_left(node);
158 ir_node *op2 = get_Mul_right(node);
159 dbg_info *dbgi = get_irn_dbg_info(node);
160 ir_node *new_op1 = be_transform_node(op1);
161 ir_node *new_op2 = be_transform_node(op2);
163 ir_node *res = new_bd_amd64_Mul(dbgi, block, new_op1, new_op2);
164 be_dep_on_frame (res);
168 static ir_node *gen_Minus(ir_node *node)
170 ir_node *block = be_transform_node(get_nodes_block(node));
171 ir_node *val = be_transform_node(get_Minus_op(node));
172 dbg_info *dbgi = get_irn_dbg_info(node);
174 return new_bd_amd64_Neg(dbgi, block, val);
177 static ir_node *gen_Jmp(ir_node *node)
179 ir_node *block = get_nodes_block(node);
180 ir_node *new_block = be_transform_node(block);
181 dbg_info *dbgi = get_irn_dbg_info(node);
183 return new_bd_amd64_Jmp(dbgi, new_block);
186 static ir_node *gen_be_Call(ir_node *node)
188 ir_node *res = be_duplicate_node(node);
189 arch_irn_add_flags(res, arch_irn_flags_modify_flags);
194 static ir_node *gen_Cmp(ir_node *node)
196 ir_node *block = be_transform_node(get_nodes_block(node));
197 ir_node *op1 = get_Cmp_left(node);
198 ir_node *op2 = get_Cmp_right(node);
199 ir_mode *cmp_mode = get_irn_mode(op1);
200 dbg_info *dbgi = get_irn_dbg_info(node);
205 if (mode_is_float(cmp_mode)) {
206 panic("Floating point not implemented yet (in gen_Cmp)!");
209 assert(get_irn_mode(op2) == cmp_mode);
210 is_unsigned = !mode_is_signed(cmp_mode);
212 new_op1 = be_transform_node(op1);
213 /* new_op1 = gen_extension(dbgi, block, new_op1, cmp_mode); */
214 new_op2 = be_transform_node(op2);
215 /* new_op2 = gen_extension(dbgi, block, new_op2, cmp_mode); */
216 return new_bd_amd64_Cmp(dbgi, block, new_op1, new_op2, false,
223 * @return the created ARM Cond node
225 static ir_node *gen_Cond(ir_node *node)
227 ir_node *selector = get_Cond_selector(node);
228 ir_mode *mode = get_irn_mode(selector);
231 ir_relation relation;
234 if (mode != mode_b) {
235 panic ("create_Switch not implemented yet!");
236 // return gen_SwitchJmp(node);
238 assert(is_Cmp(selector));
240 block = be_transform_node(get_nodes_block(node));
241 dbgi = get_irn_dbg_info(node);
242 flag_node = be_transform_node(selector);
243 relation = get_Cmp_relation(selector);
245 return new_bd_amd64_Jcc(dbgi, block, flag_node, relation);
250 * Create an And that will zero out upper bits.
252 * @param dbgi debug info
253 * @param block the basic block
254 * @param op the original node
255 * param src_bits number of lower bits that will remain
257 static ir_node *gen_zero_extension(dbg_info *dbgi, ir_node *block, ir_node *op,
261 return new_bd_arm_And_imm(dbgi, block, op, 0xFF, 0);
262 } else if (src_bits == 16) {
263 ir_node *lshift = new_bd_arm_Mov_reg_shift_imm(dbgi, block, op, ARM_SHF_LSL_IMM, 16);
264 ir_node *rshift = new_bd_arm_Mov_reg_shift_imm(dbgi, block, lshift, ARM_SHF_LSR_IMM, 16);
267 panic("zero extension only supported for 8 and 16 bits");
272 * Generate code for a sign extension.
274 static ir_node *gen_sign_extension(dbg_info *dbgi, ir_node *block, ir_node *op,
277 int shift_width = 32 - src_bits;
278 ir_node *lshift_node = new_bd_arm_Mov_reg_shift_imm(dbgi, block, op, ARM_SHF_LSL_IMM, shift_width);
279 ir_node *rshift_node = new_bd_arm_Mov_reg_shift_imm(dbgi, block, lshift_node, ARM_SHF_ASR_IMM, shift_width);
283 static ir_node *gen_extension(dbg_info *dbgi, ir_node *block, ir_node *op,
286 int bits = get_mode_size_bits(orig_mode);
290 if (mode_is_signed(orig_mode)) {
291 return gen_sign_extension(dbgi, block, op, bits);
293 return gen_zero_extension(dbgi, block, op, bits);
298 * returns true if it is assured, that the upper bits of a node are "clean"
299 * which means for a 16 or 8 bit value, that the upper bits in the register
300 * are 0 for unsigned and a copy of the last significant bit for signed
303 static bool upper_bits_clean(ir_node *transformed_node, ir_mode *mode)
305 (void) transformed_node;
313 * Change some phi modes
315 static ir_node *gen_Phi(ir_node *node)
317 const arch_register_req_t *req;
318 ir_node *block = be_transform_node(get_nodes_block(node));
319 ir_graph *irg = current_ir_graph;
320 dbg_info *dbgi = get_irn_dbg_info(node);
321 ir_mode *mode = get_irn_mode(node);
324 if (mode_needs_gp_reg(mode)) {
325 /* all integer operations are on 64bit registers now */
327 req = amd64_reg_classes[CLASS_amd64_gp].class_req;
329 req = arch_no_register_req;
332 /* phi nodes allow loops, so we use the old arguments for now
333 * and fix this later */
334 phi = new_ir_node(dbgi, irg, block, op_Phi, mode, get_irn_arity(node),
335 get_irn_in(node) + 1);
336 copy_node_attr(irg, node, phi);
337 be_duplicate_deps(node, phi);
339 arch_set_out_register_req(phi, 0, req);
341 be_enqueue_preds(node);
349 * Transforms a Conv node.
351 * @return The created ia32 Conv node
353 static ir_node *gen_Conv(ir_node *node)
355 ir_node *block = be_transform_node(get_nodes_block(node));
356 ir_node *op = get_Conv_op(node);
357 ir_node *new_op = be_transform_node(op);
358 ir_mode *src_mode = get_irn_mode(op);
359 ir_mode *dst_mode = get_irn_mode(node);
360 dbg_info *dbgi = get_irn_dbg_info(node);
362 if (src_mode == dst_mode)
365 if (mode_is_float(src_mode) || mode_is_float(dst_mode)) {
366 panic("float not supported yet");
367 } else { /* complete in gp registers */
368 int src_bits = get_mode_size_bits(src_mode);
369 int dst_bits = get_mode_size_bits(dst_mode);
373 if (src_bits == dst_bits) {
374 /* kill unnecessary conv */
378 if (src_bits < dst_bits) {
387 return new_bd_amd64_Conv(dbgi, block, new_op, min_mode);
390 if (upper_bits_clean(new_op, min_mode)) {
394 if (mode_is_signed(min_mode)) {
395 return gen_sign_extension(dbg, block, new_op, min_bits);
397 return gen_zero_extension(dbg, block, new_op, min_bits);
404 * Transforms a Store.
406 * @return the created AMD64 Store node
408 static ir_node *gen_Store(ir_node *node)
410 ir_node *block = be_transform_node(get_nodes_block(node));
411 ir_node *ptr = get_Store_ptr(node);
412 ir_node *new_ptr = be_transform_node(ptr);
413 ir_node *mem = get_Store_mem(node);
414 ir_node *new_mem = be_transform_node(mem);
415 ir_node *val = get_Store_value(node);
416 ir_node *new_val = be_transform_node(val);
417 ir_mode *mode = get_irn_mode(val);
418 dbg_info *dbgi = get_irn_dbg_info(node);
419 ir_node *new_store = NULL;
421 if (mode_is_float(mode)) {
422 panic("Float not supported yet");
424 assert(mode_is_data(mode) && "unsupported mode for Store");
425 new_store = new_bd_amd64_Store(dbgi, block, new_ptr, new_val, new_mem, 0);
427 set_irn_pinned(new_store, get_irn_pinned(node));
434 * @return the created AMD64 Load node
436 static ir_node *gen_Load(ir_node *node)
438 ir_node *block = be_transform_node(get_nodes_block(node));
439 ir_node *ptr = get_Load_ptr(node);
440 ir_node *new_ptr = be_transform_node(ptr);
441 ir_node *mem = get_Load_mem(node);
442 ir_node *new_mem = be_transform_node(mem);
443 ir_mode *mode = get_Load_mode(node);
444 dbg_info *dbgi = get_irn_dbg_info(node);
445 ir_node *new_load = NULL;
447 if (mode_is_float(mode)) {
448 panic("Float not supported yet");
450 assert(mode_is_data(mode) && "unsupported mode for Load");
451 new_load = new_bd_amd64_Load(dbgi, block, new_ptr, new_mem, 0);
453 set_irn_pinned(new_load, get_irn_pinned(node));
456 /* check for special case: the loaded value might not be used */
457 if (be_get_Proj_for_pn(node, pn_Load_res) == NULL) {
458 /* add a result proj and a Keep to produce a pseudo use */
459 ir_node *proj = new_r_Proj(new_load, mode_Iu, pn_amd64_Load_res);
460 be_new_Keep(block, 1, &proj);
468 * Transform a Proj from a Load.
470 static ir_node *gen_Proj_Load(ir_node *node)
472 ir_node *load = get_Proj_pred(node);
473 ir_node *new_load = be_transform_node(load);
474 dbg_info *dbgi = get_irn_dbg_info(node);
475 long proj = get_Proj_proj(node);
477 /* renumber the proj */
478 switch (get_amd64_irn_opcode(new_load)) {
480 /* handle all gp loads equal: they have the same proj numbers. */
481 if (proj == pn_Load_res) {
482 return new_rd_Proj(dbgi, new_load, mode_Lu, pn_amd64_Load_res);
483 } else if (proj == pn_Load_M) {
484 return new_rd_Proj(dbgi, new_load, mode_M, pn_amd64_Load_M);
488 case iro_sparc_fpaLoad:
489 panic("FP not implemented yet");
493 panic("Unsupported Proj from Load");
496 return be_duplicate_node(node);
500 * Transform a Proj node.
502 static ir_node *gen_Proj(ir_node *node)
504 ir_graph *irg = current_ir_graph;
505 dbg_info *dbgi = get_irn_dbg_info(node);
506 ir_node *pred = get_Proj_pred(node);
507 long proj = get_Proj_proj(node);
512 if (is_Store(pred)) {
513 if (proj == pn_Store_M) {
514 return be_transform_node(pred);
516 panic("Unsupported Proj from Store");
518 } else if (is_Load(pred)) {
519 return gen_Proj_Load(node);
521 } else if (be_is_SubSP(pred)) {
522 //panic("gen_Proj not implemented for SubSP");
523 return gen_Proj_be_SubSP(node);
524 } else if (be_is_AddSP(pred)) {
525 //panic("gen_Proj not implemented for AddSP");
526 return gen_Proj_be_AddSP(node);
527 } else if (is_Cmp(pred)) {
528 //panic("gen_Proj not implemented for Cmp");
529 return gen_Proj_Cmp(node);
530 } else if (is_Div(pred)) {
531 return gen_Proj_Div(node);
533 } else if (is_Start(pred)) {
535 if (node == get_irg_anchor(irg, anchor_tls)) {
536 return gen_Proj_tls(node);
539 ir_node *new_pred = be_transform_node(pred);
540 ir_mode *mode = get_irn_mode(node);
541 if (mode_needs_gp_reg(mode)) {
542 ir_node *new_proj = new_r_Proj(new_pred, mode_Iu, get_Proj_proj(node));
543 new_proj->node_nr = node->node_nr;
549 return be_duplicate_node(node);
553 * Transforms a FrameAddr into an AMD64 Add.
555 static ir_node *gen_be_FrameAddr(ir_node *node)
557 ir_node *block = be_transform_node(get_nodes_block(node));
558 ir_entity *ent = be_get_frame_entity(node);
559 ir_node *fp = be_get_FrameAddr_frame(node);
560 ir_node *new_fp = be_transform_node(fp);
561 dbg_info *dbgi = get_irn_dbg_info(node);
564 new_node = new_bd_amd64_FrameAddr(dbgi, block, new_fp, ent);
568 /* Boilerplate code for transformation: */
570 static void amd64_register_transformers(void)
572 be_start_transform_setup();
574 be_set_transform_function(op_Const, gen_Const);
575 be_set_transform_function(op_SymConst, gen_SymConst);
576 be_set_transform_function(op_Add, gen_Add);
577 be_set_transform_function(op_Sub, gen_Sub);
578 be_set_transform_function(op_Mul, gen_Mul);
579 be_set_transform_function(op_be_Call, gen_be_Call);
580 be_set_transform_function(op_be_FrameAddr, gen_be_FrameAddr);
581 be_set_transform_function(op_Conv, gen_Conv);
582 be_set_transform_function(op_Jmp, gen_Jmp);
583 be_set_transform_function(op_Cmp, gen_Cmp);
584 be_set_transform_function(op_Cond, gen_Cond);
585 be_set_transform_function(op_Phi, gen_Phi);
586 be_set_transform_function(op_Load, gen_Load);
587 be_set_transform_function(op_Store, gen_Store);
588 be_set_transform_function(op_Proj, gen_Proj);
589 be_set_transform_function(op_Minus, gen_Minus);
592 void amd64_transform_graph(ir_graph *irg)
594 amd64_register_transformers();
595 be_transform_graph(irg, NULL);
598 void amd64_init_transform(void)
600 FIRM_DBG_REGISTER(dbg, "firm.be.amd64.transform");