/*
 * This file is part of libFirm.
 * Copyright (C) 2014 University of Karlsruhe.
 */

/**
 * @file
 * @brief   This file implements functions to finalize the irg for emit.
 */
#include "amd64_finish.h"

#include <assert.h>
#include <stdbool.h>
#include <string.h>

#include "amd64_new_nodes.h"
#include "amd64_nodes_attr.h"
#include "amd64_transform.h"
#include "bearch.h"
#include "bearch_amd64_t.h"
#include "benode.h"
#include "besched.h"
#include "debug.h"
#include "panic.h"
#include "gen_amd64_new_nodes.h"
#include "gen_amd64_regalloc_if.h"
#include "iredges_t.h"
#include "irgwalk.h"
#include "util.h"
#include "irgmod.h"

/* Debug module handle of this file; registered in amd64_init_finish(). */
DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

/**
 * Returns the index of the first "same" register.
 */
Matthias Braun's avatar
Matthias Braun committed
32
static unsigned get_first_same(arch_register_req_t const *const req)
33
{
34
	unsigned const other = req->should_be_same;
Matthias Braun's avatar
Matthias Braun committed
35
	for (unsigned i = 0; i != 32; ++i) {
36
37
38
39
40
41
		if (other & (1U << i))
			return i;
	}
	panic("same position not found");
}

42
43
44
45
46
static bool is_commutative(const ir_node *node)
{
	return arch_get_irn_flags(node) & amd64_arch_irn_flag_commutative_binop;
}

Matthias Braun's avatar
Matthias Braun committed
47
48
49
static bool try_swap_inputs(ir_node *node)
{
	/* commutative operation, just switch the inputs */
50
51
	if (is_commutative(node)) {
		assert(get_amd64_attr_const(node)->op_mode == AMD64_OP_REG_REG);
Matthias Braun's avatar
Matthias Braun committed
52
53
54
55
56
57
58
59
60
61
		/* TODO: support Cmp input swapping */
		ir_node *in0 = get_irn_n(node, 0);
		ir_node *in1 = get_irn_n(node, 1);
		set_irn_n(node, 0, in1);
		set_irn_n(node, 1, in0);
		return true;
	}
	return false;
}

62
63
64
65
66
67
68
69
70
71
/**
  * Transforms a Sub to a Neg + Add, which subsequently allows swapping
  * of the inputs. The swapping is also (implicitly) done here.
  */
static void transform_sub_to_neg_add(ir_node *node,
                                     const arch_register_t *out_reg)
{
	ir_node  *block = get_nodes_block(node);
	dbg_info *dbgi  = get_irn_dbg_info(node);

72
73
	ir_node *in1 = get_irn_n(node, 0);
	ir_node *in2 = get_irn_n(node, 1);
74

75
	const arch_register_t *in2_reg = arch_get_irn_register(in2);
76

77
	const amd64_binop_addr_attr_t *attr = get_amd64_binop_addr_attr(node);
78
79
	ir_node                       *add;
	unsigned                       pos;
80
	if (is_amd64_subs(node)) {
81
82
83
		int bits = get_insn_mode_bits(attr->base.insn_mode);
		ir_tarval *tv = get_mode_one(amd64_mode_xmm);
		tv = tarval_shl_unsigned(tv, bits - 1);
84
		ir_entity *sign_bit_const = create_float_const_entity(tv);
85
86
87

		amd64_binop_addr_attr_t xor_attr;
		memset(&xor_attr, 0, sizeof(xor_attr));
Matthias Braun's avatar
Matthias Braun committed
88
		xor_attr.base.insn_mode             = INSN_MODE_64;
89
		xor_attr.base.base.op_mode          = AMD64_OP_REG_ADDR;
90
		init_lconst_addr(&xor_attr.base.addr, sign_bit_const);
91
92

		ir_node *xor_in[] = { in2 };
93
		ir_node *const xor = new_bd_amd64_xorp(dbgi, block, ARRAY_SIZE(xor_in), xor_in, amd64_xmm_reqs, &xor_attr);
94
		sched_add_before(node, xor);
95
		ir_node *const neg = be_new_Proj_reg(xor, pn_amd64_xorp_res, in2_reg);
96
97

		ir_node *in[] = { neg, in1 };
98
		add = new_bd_amd64_adds(dbgi, block, ARRAY_SIZE(in), in, amd64_xmm_xmm_reqs, attr);
99
		pos = pn_amd64_adds_res;
100
	} else {
101
102
		assert(is_amd64_sub(node));
		ir_node *neg = new_bd_amd64_neg(dbgi, block, in2, attr->base.insn_mode);
103
		sched_add_before(node, neg);
104
		ir_node *const neg_res = be_new_Proj_reg(neg, pn_amd64_neg_res, out_reg);
105

106
		ir_node *in[] = { neg_res, in1 };
107
		add = new_bd_amd64_add(dbgi, block, ARRAY_SIZE(in), in, amd64_reg_reg_reqs, attr);
108
		pos = pn_amd64_add_res;
109
	}
110
	arch_set_irn_register_out(add, pos, out_reg);
111
112
113

	/* exchange the add and the sub */
	sched_replace(node, add);
114
	exchange(node, add);
115
116
}

117
static void amd64_turn_back_am(ir_node *const node, arch_register_t const *const out_reg)
Matthias Braun's avatar
Matthias Braun committed
118
{
Matthias Braun's avatar
Matthias Braun committed
119
120
121
	dbg_info          *dbgi  = get_irn_dbg_info(node);
	ir_node           *block = get_nodes_block(node);
	amd64_addr_attr_t *attr  = get_amd64_addr_attr(node);
Matthias Braun's avatar
Matthias Braun committed
122

Matthias Braun's avatar
Matthias Braun committed
123
	amd64_addr_t new_addr = attr->addr;
Matthias Braun's avatar
Matthias Braun committed
124
125
	ir_node *load_in[3];
	int      load_arity = 0;
126
127
	if (attr->addr.base_input != NO_INPUT &&
	    attr->addr.base_input != RIP_INPUT) {
Matthias Braun's avatar
Matthias Braun committed
128
129
		new_addr.base_input = load_arity;
		load_in[load_arity++] = get_irn_n(node, attr->addr.base_input);
Matthias Braun's avatar
Matthias Braun committed
130
	}
Matthias Braun's avatar
Matthias Braun committed
131
132
133
	if (attr->addr.index_input != NO_INPUT) {
		new_addr.index_input = load_arity;
		load_in[load_arity++] = get_irn_n(node, attr->addr.index_input);
Matthias Braun's avatar
Matthias Braun committed
134
	}
Matthias Braun's avatar
Matthias Braun committed
135
136
137
	assert(attr->addr.mem_input != NO_INPUT);
	new_addr.mem_input = load_arity;
	load_in[load_arity++] = get_irn_n(node, attr->addr.mem_input);
Matthias Braun's avatar
Matthias Braun committed
138

139
	ir_node *const load     = new_bd_amd64_mov_gp(dbgi, block, load_arity, load_in, gp_am_reqs[load_arity - 1], attr->insn_mode, AMD64_OP_ADDR, new_addr);
140
	ir_node *const load_res = be_new_Proj_reg(load, pn_amd64_mov_gp_res, out_reg);
Matthias Braun's avatar
Matthias Braun committed
141
142

	/* change operation */
Matthias Braun's avatar
Matthias Braun committed
143
144
	const amd64_binop_addr_attr_t *binop_attr
		= (const amd64_binop_addr_attr_t*)attr;
Matthias Braun's avatar
Matthias Braun committed
145
	ir_node *new_in[2];
Matthias Braun's avatar
Matthias Braun committed
146
	new_in[0] = get_irn_n(node, binop_attr->u.reg_input);
Matthias Braun's avatar
Matthias Braun committed
147
148
	new_in[1] = load_res;
	set_irn_in(node, ARRAY_SIZE(new_in), new_in);
Matthias Braun's avatar
Matthias Braun committed
149
150
151
	attr->base.op_mode     = AMD64_OP_REG_REG;
	attr->addr.base_input  = NO_INPUT;
	attr->addr.index_input = NO_INPUT;
Matthias Braun's avatar
Matthias Braun committed
152
153
154
155
156
157

	/* rewire mem-proj */
	foreach_out_edge(node, edge) {
		ir_node *out = get_edge_src_irn(edge);
		if (get_irn_mode(out) == mode_M) {
			set_Proj_pred(out, load);
158
			set_Proj_num(out, pn_amd64_mov_gp_M);
Matthias Braun's avatar
Matthias Braun committed
159
160
161
162
163
164
165
166
			break;
		}
	}

	if (sched_is_scheduled(node))
		sched_add_before(node, load);
}

167
168
169
170
171
172
173
/**
 * Insert copies for all amd64 nodes where the should_be_same requirement is
 * not fulfilled.
 */
static void assure_should_be_same_requirements(ir_node *const node)
{
	/* Check all OUT requirements, if there is a should_be_same. */
Christoph Mallon's avatar
Christoph Mallon committed
174
	be_foreach_out(node, i) {
Matthias Braun's avatar
Matthias Braun committed
175
176
		arch_register_req_t const *const req
			= arch_get_irn_register_req_out(node, i);
177
		if (req->should_be_same == 0)
Matthias Braun's avatar
Matthias Braun committed
178
179
180
181
182
183
184
185
			continue;
		unsigned               const same_pos = get_first_same(req);
		ir_node               *const in_node  = get_irn_n(node, same_pos);
		arch_register_t const *const in_reg   = arch_get_irn_register(in_node);
		arch_register_t const *const out_reg
			= arch_get_irn_register_out(node, i);
		if (in_reg == out_reg)
			continue;
186

Matthias Braun's avatar
Matthias Braun committed
187
		/* test if any other input is using the out register */
188
189
		foreach_irn_in(node, i2, in) {
			arch_register_t const *const reg = arch_get_irn_register(in);
Matthias Braun's avatar
Matthias Braun committed
190
191
			if (reg == out_reg && (unsigned)i2 != same_pos) {
				if (!is_amd64_irn(node))
192
					panic("cannot fulfill should_be_same on non-amd64 node");
Matthias Braun's avatar
Matthias Braun committed
193
194
				/* see what role this register has */
				const amd64_attr_t *attr = get_amd64_attr_const(node);
Matthias Braun's avatar
Matthias Braun committed
195
196
197
				if (attr->op_mode == AMD64_OP_ADDR
				 || attr->op_mode == AMD64_OP_REG
				 || attr->op_mode == AMD64_OP_REG_IMM) {
Matthias Braun's avatar
Matthias Braun committed
198
					panic("unexpected op_mode");
Matthias Braun's avatar
Matthias Braun committed
199
				} else if (attr->op_mode == AMD64_OP_REG_REG) {
Matthias Braun's avatar
Matthias Braun committed
200
201
202
203
swap:;
					bool res = try_swap_inputs(node);
					if (res)
						return;
204

205
					if (is_amd64_sub(node) || is_amd64_subs(node)) {
206
207
208
						transform_sub_to_neg_add(node, out_reg);
						return;
					}
Matthias Braun's avatar
Matthias Braun committed
209
210
					panic("couldn't swap inputs of %+F", node);
				} else {
211
					assert(attr->op_mode == AMD64_OP_REG_ADDR);
Matthias Braun's avatar
Matthias Braun committed
212
					/* extract load into an own instruction */
213
					amd64_turn_back_am(node, out_reg);
Matthias Braun's avatar
Matthias Braun committed
214
215
216
217
218
					goto swap;
				}
			}
		}

219
		ir_node *const copy = be_new_Copy_before_reg(in_node, node, out_reg);
Matthias Braun's avatar
Matthias Braun committed
220
221
222
223
		/* Set copy as in. */
		set_irn_n(node, same_pos, copy);

		DBG((dbg, LEVEL_1, "created copy %+F for should be same argument at input %d of %+F\n", copy, same_pos, node));
224
225
226
227
228
229
230
231
232
233
	}
}

/**
 * Block walker: finishes a block.
 *
 * Visits every scheduled node of @p block and enforces the should_be_same
 * requirements of the amd64 nodes among them.
 *
 * @param block  block whose schedule is processed
 * @param env    unused
 */
static void amd64_finish_irg_walker(ir_node *const block, void *const env)
{
	(void) env;

	/* Insert copies for should_be_same constraints. */
	sched_foreach_safe(block, irn) {
		if (is_amd64_irn(irn))
			assure_should_be_same_requirements(irn);
	}
}

/**
 * Fixes up unfulfilled should_be_same constraints in @p irg by running
 * amd64_finish_irg_walker on the blocks of the graph.
 *
 * @param irg  graph to finalize
 */
void amd64_finish_irg(ir_graph *const irg)
{
	/* No callback in the second slot and no walker environment. */
	irg_block_walk_graph(irg, NULL, amd64_finish_irg_walker, NULL);
}

/**
 * Registers the debug module of this file under the name
 * "firm.be.amd64.finish".
 */
void amd64_init_finish(void)
{
	FIRM_DBG_REGISTER(dbg, "firm.be.amd64.finish");
}