amd64_transform.c 88.2 KB
Newer Older
1
2
/*
 * This file is part of libFirm.
3
 * Copyright (C) 2012 University of Karlsruhe.
4
5
6
7
8
9
 */

/**
 * @file
 * @brief   code selection (transform FIRM into amd64 FIRM)
 */
Matthias Braun's avatar
Matthias Braun committed
10
#include "debug.h"
Matthias Braun's avatar
Matthias Braun committed
11
#include "panic.h"
Matthias Braun's avatar
Matthias Braun committed
12
13
#include "heights.h"
#include "ircons.h"
14
#include "iredges.h"
Matthias Braun's avatar
Matthias Braun committed
15
#include "irgmod.h"
16
17
#include "irgraph_t.h"
#include "irmode_t.h"
Matthias Braun's avatar
Matthias Braun committed
18
#include "irnode_t.h"
19
#include "iropt_t.h"
20
#include "tv_t.h"
Matthias Braun's avatar
Matthias Braun committed
21
#include "util.h"
22

23
24
#include "benode.h"
#include "betranshlp.h"
25
#include "bearch_amd64_t.h"
26
#include "beirg.h"
Matthias Braun's avatar
Matthias Braun committed
27
#include "besched.h"
28

Matthias Braun's avatar
Matthias Braun committed
29
#include "amd64_new_nodes.h"
30
31
#include "amd64_nodes_attr.h"
#include "amd64_transform.h"
32
#include "amd64_varargs.h"
Matthias Braun's avatar
Matthias Braun committed
33
#include "../ia32/x86_address_mode.h"
34
#include "../ia32/x86_cconv.h"
35
36
37
38
39

#include "gen_amd64_regalloc_if.h"

DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

40
static ir_mode         *mode_gp;
41
static x86_cconv_t     *current_cconv = NULL;
42
43
static pmap            *node_to_stack;
static be_stackorder_t *stackorder;
44

45
46
47
/** we don't have a concept of aliasing registers, so enumerate them
 * manually for the asm nodes. */
const x86_clobber_name_t amd64_additional_clobber_names[] = {
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
	{ "al", REG_RAX }, { "ah", REG_RAX }, { "ax", REG_RAX }, { "eax", REG_RAX },
	{ "bl", REG_RBX }, { "bh", REG_RBX }, { "bx", REG_RBX }, { "ebx", REG_RBX },
	{ "cl", REG_RCX }, { "ch", REG_RCX }, { "cx", REG_RCX }, { "ecx", REG_RCX },
	{ "dl", REG_RDX }, { "dh", REG_RDX }, { "dx", REG_RDX }, { "edx", REG_RDX },
	{ "sil",  REG_RSI }, { "si",   REG_RSI }, { "esi",  REG_RSI },
	{ "dil",  REG_RDI }, { "di",   REG_RDI }, { "edi",  REG_RDI },
	{ "bpl",  REG_RBP }, { "bp",   REG_RBP }, { "ebp",  REG_RBP },
	{ "spl",  REG_RSP }, { "sp",   REG_RSP }, { "esp",  REG_RSP },
	{ "r8b",  REG_R8  }, { "r8w",  REG_R8  }, { "r8d",  REG_R8  },
	{ "r9b",  REG_R9  }, { "r9w",  REG_R9  }, { "r9d",  REG_R9  },
	{ "r10b", REG_R10 }, { "r10w", REG_R10 }, { "r10d", REG_R10 },
	{ "r11b", REG_R11 }, { "r11w", REG_R11 }, { "r11d", REG_R11 },
	{ "r12b", REG_R12 }, { "r12w", REG_R12 }, { "r12d", REG_R12 },
	{ "r13b", REG_R13 }, { "r13w", REG_R13 }, { "r13d", REG_R13 },
	{ "r14b", REG_R14 }, { "r14w", REG_R14 }, { "r14d", REG_R14 },
	{ "r15b", REG_R15 }, { "r15w", REG_R15 }, { "r15d", REG_R15 },
64
65
66
67
	{ NULL, ~0u }
};

#define GP &amd64_reg_classes[CLASS_amd64_gp]
68
const x86_asm_constraint_list_t amd64_asm_constraints = {
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
	['A'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RDX },
	['D'] = { MATCH_REG, GP, 1 << REG_GP_RDI },
	['I'] = { MATCH_IMM, GP, 0 },
	['J'] = { MATCH_IMM, GP, 0 },
	['K'] = { MATCH_IMM, GP, 0 },
	['L'] = { MATCH_IMM, GP, 0 },
	['M'] = { MATCH_IMM, GP, 0 },
	['N'] = { MATCH_IMM, GP, 0 },
	['O'] = { MATCH_IMM, GP, 0 },
	['R'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX | 1 << REG_GP_RSI
		| 1 << REG_GP_RDI | 1 << REG_GP_RBP | 1 << REG_GP_RSP },
	['S'] = { MATCH_REG, GP, 1 << REG_GP_RSI },
	['Q'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX },
	['V'] = { MATCH_MEM, GP, 0 },
	['X'] = { MATCH_ANY, GP, 0 },
	['a'] = { MATCH_REG, GP, 1 << REG_GP_RAX },
	['b'] = { MATCH_REG, GP, 1 << REG_GP_RBX },
	['c'] = { MATCH_REG, GP, 1 << REG_GP_RCX },
	['d'] = { MATCH_REG, GP, 1 << REG_GP_RDX },
	['g'] = { MATCH_ANY, GP, 0 },
	['i'] = { MATCH_IMM, GP, 0 },
	['l'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX | 1 << REG_GP_RSI
		| 1 << REG_GP_RDI | 1 << REG_GP_RBP },
	['m'] = { MATCH_MEM, GP, 0 },
	['n'] = { MATCH_IMM, GP, 0 },
	['o'] = { MATCH_MEM, GP, 0 },
	['p'] = { MATCH_REG, GP, 0 },
	['q'] = { MATCH_REG, GP, 0 },
	['r'] = { MATCH_REG, GP, 0 },
	['x'] = { MATCH_REG, &amd64_reg_classes[CLASS_amd64_xmm], 0 },

	// see comments in ia32_transform.c about unimplemented stuff.
};
#undef GP

Matthias Braun's avatar
Matthias Braun committed
107
108
109
/** Yields an unsigned value with only bit number @p x set.
 * The argument is parenthesized so that expressions containing operators
 * with lower precedence than `<<` (e.g. `a | b`) expand correctly. */
#define BIT(x)    (1u << (x))

static const arch_register_req_t amd64_requirement_gp_same_0 = {
110
111
112
	.cls               = &amd64_reg_classes[CLASS_amd64_gp],
	.should_be_same    = BIT(0),
	.width             = 1,
Matthias Braun's avatar
Matthias Braun committed
113
114
};

115
static const arch_register_req_t amd64_requirement_xmm_same_0 = {
116
117
118
	.cls               = &amd64_reg_classes[CLASS_amd64_xmm],
	.should_be_same    = BIT(0),
	.width             = 1,
119
120
};

Matthias Braun's avatar
Matthias Braun committed
121
static const arch_register_req_t amd64_requirement_gp_same_0_not_1 = {
122
123
124
125
	.cls               = &amd64_reg_classes[CLASS_amd64_gp],
	.should_be_same    = BIT(0),
	.must_be_different = BIT(1),
	.width             = 1,
Matthias Braun's avatar
Matthias Braun committed
126
127
};

128
static const arch_register_req_t amd64_requirement_xmm_same_0_not_1 = {
129
130
131
132
	.cls               = &amd64_reg_classes[CLASS_amd64_xmm],
	.should_be_same    = BIT(0),
	.must_be_different = BIT(1),
	.width             = 1,
133
134
};

Matthias Braun's avatar
Matthias Braun committed
135
static const arch_register_req_t *mem_reqs[] = {
136
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
137
138
139
};

static const arch_register_req_t *reg_mem_reqs[] = {
140
	&amd64_class_reg_req_gp,
141
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
142
143
};

Tobias Rapp's avatar
Tobias Rapp committed
144
static const arch_register_req_t *rsp_mem_reqs[] = {
145
	&amd64_single_reg_req_gp_rsp,
146
	&arch_memory_requirement,
Tobias Rapp's avatar
Tobias Rapp committed
147
148
};

149
arch_register_req_t const *rsp_reg_mem_reqs[] = {
150
151
	&amd64_single_reg_req_gp_rsp,
	&amd64_class_reg_req_gp,
152
	&arch_memory_requirement,
Tobias Rapp's avatar
Tobias Rapp committed
153
154
};

155
static const arch_register_req_t *xmm_mem_reqs[] = {
156
	&amd64_class_reg_req_xmm,
157
	&arch_memory_requirement,
158
159
};

Matthias Braun's avatar
Matthias Braun committed
160
static const arch_register_req_t *reg_reg_mem_reqs[] = {
161
162
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
163
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
164
165
};

166
arch_register_req_t const *xmm_reg_mem_reqs[] = {
167
168
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_gp,
169
	&arch_memory_requirement,
170
171
};

Matthias Braun's avatar
Matthias Braun committed
172
static const arch_register_req_t *reg_reg_reg_mem_reqs[] = {
173
174
175
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
176
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
177
178
};

179
static const arch_register_req_t *xmm_reg_reg_mem_reqs[] = {
180
181
182
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
183
	&arch_memory_requirement,
184
185
};

Tobias Rapp's avatar
Tobias Rapp committed
186
static const arch_register_req_t *reg_flags_reqs[] = {
187
188
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_flags,
189
190
};

191
arch_register_req_t const *amd64_reg_reg_reqs[] = {
192
193
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
194
195
};

196
static const arch_register_req_t *reg_rax_reqs[] = {
197
	&amd64_class_reg_req_gp,
198
	&amd64_single_reg_req_gp_rax,
199
200
};

201
static const arch_register_req_t *reg_rax_rdx_mem_reqs[] = {
202
	&amd64_class_reg_req_gp,
203
	&amd64_single_reg_req_gp_rax,
204
	&amd64_single_reg_req_gp_rdx,
205
	&arch_memory_requirement,
206
207
};

208
arch_register_req_t const *reg_reqs[] = {
209
	&amd64_class_reg_req_gp,
Matthias Braun's avatar
Matthias Braun committed
210
211
};

212
arch_register_req_t const *amd64_xmm_reqs[] = {
213
	&amd64_class_reg_req_xmm,
214
215
};

Matthias Braun's avatar
Matthias Braun committed
216
static const arch_register_req_t *reg_rcx_reqs[] = {
217
218
	&amd64_class_reg_req_gp,
	&amd64_single_reg_req_gp_rcx,
Matthias Braun's avatar
Matthias Braun committed
219
220
};

221
222
223
static const arch_register_req_t *no_reqs[] = {
};

224
arch_register_req_t const *amd64_xmm_xmm_reqs[] = {
225
226
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_xmm,
227
228
};

229
arch_register_req_t const **const gp_am_reqs[] = {
230
231
232
233
234
235
236
237
238
239
240
241
242
	mem_reqs,
	reg_mem_reqs,
	reg_reg_mem_reqs,
	reg_reg_reg_mem_reqs,
};

static arch_register_req_t const **const xmm_am_reqs[] = {
	mem_reqs,
	xmm_mem_reqs,
	xmm_reg_mem_reqs,
	xmm_reg_reg_mem_reqs,
};

Matthias Braun's avatar
Matthias Braun committed
243
244
/**
 * Checks whether values of @p mode are handled as general purpose register
 * values.
 *
 * @return true for two's complement modes other than amd64_mode_xmm
 */
static inline bool mode_needs_gp_reg(ir_mode *mode)
{
	bool const twos_complement
		= get_mode_arithmetic(mode) == irma_twos_complement;
	/* mode_xmm is 128bit int at the moment, so it must be ruled out
	 * explicitly */
	return twos_complement && mode != amd64_mode_xmm;
}

249
250
/** Returns the Start Proj of @p irg that belongs to register RSP. */
static ir_node *get_initial_sp(ir_graph *irg)
{
	ir_node *const sp = be_get_Start_proj(irg, &amd64_registers[REG_RSP]);
	return sp;
}

/** Returns the Start Proj of @p irg that belongs to register RBP. */
static ir_node *get_initial_fp(ir_graph *irg)
{
	ir_node *const fp = be_get_Start_proj(irg, &amd64_registers[REG_RBP]);
	return fp;
}

/**
 * Returns the node used as frame base in @p irg: the initial stack pointer
 * if the current calling convention omits the frame pointer, the initial
 * frame pointer otherwise.
 */
static ir_node *get_frame_base(ir_graph *irg)
{
	return current_cconv->omit_fp ? get_initial_sp(irg)
	                              : get_initial_fp(irg);
}
267

268
269
270
static amd64_insn_mode_t get_insn_mode_from_mode(const ir_mode *mode)
{
	switch (get_mode_size_bits(mode)) {
271
272
273
274
275
	case   8: return INSN_MODE_8;
	case  16: return INSN_MODE_16;
	case  32: return INSN_MODE_32;
	case  64: return INSN_MODE_64;
	case 128: return INSN_MODE_128;
276
	}
277
	panic("unexpected mode %+F", mode);
278
279
}

280
/**
 * Returns an entity in the global type that is initialized with @p tv.
 * Entities are cached in amd64_constants, so asking for the same tarval
 * again returns the entity created earlier.
 */
ir_entity *create_float_const_entity(ir_tarval *const tv)
{
	ir_entity *const cached = pmap_get(ir_entity, amd64_constants, tv);
	if (cached != NULL)
		return cached;

	ir_mode *const tv_mode = get_tarval_mode(tv);
	ir_type *const tv_type = get_type_for_mode(tv_mode);
	ir_type *const glob    = get_glob_type();

	/* private constant entity with a unique name */
	ir_entity *const fresh = new_entity(glob, id_unique("C%u"), tv_type);
	set_entity_visibility(fresh, ir_visibility_private);
	add_entity_linkage(fresh, IR_LINKAGE_CONSTANT);
	set_entity_initializer(fresh, create_initializer_tarval(tv));

	/* remember it for later requests */
	pmap_insert(amd64_constants, tv, fresh);
	return fresh;
}

301
/**
 * Initializes @p addr so that it addresses the local constant @p entity.
 * With be_options.pic set the address is RIP relative, otherwise it is an
 * absolute address without base register. There is never an index register.
 * All fields not mentioned here are left zeroed by the memset.
 *
 * @param addr    address to fill in (completely overwritten)
 * @param entity  private constant entity with a definition
 */
void init_lconst_addr(amd64_addr_t *addr, ir_entity *entity)
{
	assert(entity_has_definition(entity));
	assert(get_entity_linkage(entity) == IR_LINKAGE_CONSTANT);
	assert(get_entity_visibility(entity) == ir_visibility_private);

	memset(addr, 0, sizeof(*addr));
	addr->immediate.entity = entity;
	addr->index_input      = NO_INPUT;
	if (be_options.pic) {
		addr->immediate.kind = X86_IMM_PCREL;
		addr->base_input     = RIP_INPUT;
	} else {
		addr->immediate.kind = X86_IMM_ADDR;
		addr->base_input     = NO_INPUT;
	}
}

314
static ir_node *create_float_const(dbg_info *dbgi, ir_node *block,
Matthias Braun's avatar
Matthias Braun committed
315
                                   ir_tarval *tv)
316
317
318
{
	ir_graph  *irg     = get_irn_irg(block);
	ir_mode   *tv_mode = get_tarval_mode(tv);
319
	ir_entity *entity  = create_float_const_entity(tv);
320
321
322
323
	ir_node   *nomem   = get_irg_no_mem(irg);

	ir_node *in[] = { nomem };
	amd64_addr_t addr;
324
	init_lconst_addr(&addr, entity);
325

326
	ir_node *load;
327
	unsigned pn_res;
328
	amd64_insn_mode_t insn_mode = get_insn_mode_from_mode(tv_mode);
329
	if (insn_mode == INSN_MODE_128) {
330
		load = new_bd_amd64_movdqa(dbgi, block, ARRAY_SIZE(in), in, mem_reqs, AMD64_OP_ADDR, addr);
331
		pn_res = pn_amd64_movdqa_res;
332
	} else {
333
		load = new_bd_amd64_movs_xmm(dbgi, block, ARRAY_SIZE(in), in, mem_reqs, insn_mode, AMD64_OP_ADDR, addr);
334
		pn_res = pn_amd64_movs_xmm_res;
335
	}
Matthias Braun's avatar
Matthias Braun committed
336
	set_irn_pinned(load, false);
337

338
	return be_new_Proj(load, pn_res);
339
340
341
342
343
}

/**
 * Creates a tarval of @p mode in which only the most significant bit is set.
 * Only modes with 32, 64 or 128 bits are supported.
 */
ir_tarval *create_sign_tv(ir_mode *mode)
{
	unsigned const size = get_mode_size_bits(mode);
	assert(size == 32 || size == 64 || size == 128);

	/* pick an integer mode of the same width to do the shift in */
	ir_mode *intmode;
	switch (size) {
	case 128: intmode = amd64_mode_xmm; break;
	case 64:  intmode = mode_Lu;        break;
	default:  intmode = mode_Iu;        break;
	}

	ir_tarval *const one      = get_mode_one(intmode);
	ir_tarval *const sign_bit = tarval_shl_unsigned(one, size-1);
	return tarval_bitcast(sign_bit, mode);
}

353
354
/**
 * Transforms a Const node.
 * Modes needing a gp register become a mov_imm (32 bit instruction mode if
 * the value fits into 32 bits, 64 bit otherwise). For all other modes a
 * null tarval becomes xorpd_0 and anything else is loaded from a constant
 * entity.
 */
static ir_node *gen_Const(ir_node *node)
{
	ir_node   *const block = be_transform_nodes_block(node);
	dbg_info  *const dbgi  = get_irn_dbg_info(node);
	ir_mode   *const mode  = get_irn_mode(node);
	ir_tarval *const tv    = get_Const_tarval(node);

	if (mode_needs_gp_reg(mode)) {
		uint64_t const val = get_tarval_uint64(tv);
		amd64_insn_mode_t const imode
			= val > UINT32_MAX ? INSN_MODE_64 : INSN_MODE_32;
		amd64_imm64_t const imm = {
			.kind   = X86_IMM_VALUE,
			.offset = val,
		};
		return new_bd_amd64_mov_imm(dbgi, block, imode, &imm);
	}

	if (tarval_is_null(tv))
		return new_bd_amd64_xorpd_0(dbgi, block);
	return create_float_const(dbgi, block, tv);
}

377
/**
 * Transforms an Address node into a 64 bit mov_imm whose immediate is the
 * address of the node's entity.
 */
static ir_node *gen_Address(ir_node *node)
{
	ir_node  *const new_block = be_transform_nodes_block(node);
	dbg_info *const dbgi      = get_irn_dbg_info(node);

	amd64_imm64_t const address = {
		.kind   = X86_IMM_ADDR,
		.entity = get_Address_entity(node),
	};
	return new_bd_amd64_mov_imm(dbgi, new_block, INSN_MODE_64, &address);
}
Matthias Braun's avatar
Matthias Braun committed
389

390
391
392
393
394
395
/**
 * Transforms a be_Relocation node.
 * Absolute addresses become a 64 bit mov_imm, PC relative ones (PCREL and
 * GOTPCREL) become a lea with RIP as base. Any other relocation kind
 * results in a panic.
 */
static ir_node *gen_be_Relocation(ir_node *node)
{
	ir_node             *const block  = be_transform_nodes_block(node);
	ir_entity           *const entity = be_get_Relocation_entity(node);
	x86_immediate_kind_t const kind
		= (x86_immediate_kind_t)be_get_Relocation_kind(node);

	if (kind == X86_IMM_ADDR) {
		amd64_imm64_t const imm = {
			.kind   = X86_IMM_ADDR,
			.entity = entity,
		};
		return new_bd_amd64_mov_imm(NULL, block, INSN_MODE_64, &imm);
	}

	/* can GOTPCREL happen here? */
	if (kind == X86_IMM_PCREL || kind == X86_IMM_GOTPCREL) {
		amd64_addr_t addr;
		memset(&addr, 0, sizeof(addr));
		addr.immediate = (x86_imm32_t) {
			.kind   = kind,
			.entity = entity,
		};
		addr.base_input  = RIP_INPUT;
		addr.index_input = NO_INPUT;
		addr.mem_input   = NO_INPUT;
		return new_bd_amd64_lea(NULL, block, 0, NULL, NULL, INSN_MODE_64, addr);
	}

	panic("Unexpected relocation kind");
}

424
425
/**
 * Creates a be_IncSP node for RSP in @p block and marks it as modifying the
 * flags.
 *
 * @param block   block of the new node
 * @param old_sp  previous stack pointer value
 * @param offset  offset passed on to be_new_IncSP
 * @param align   alignment passed on to be_new_IncSP
 */
ir_node *amd64_new_IncSP(ir_node *block, ir_node *old_sp, int offset,
                         unsigned align)
{
	ir_node *const result
		= be_new_IncSP(&amd64_registers[REG_RSP], block, old_sp, offset, align);
	arch_add_irn_flags(result, arch_irn_flag_modify_flags);
	return result;
}

433
typedef ir_node *(*construct_binop_func)(dbg_info *dbgi, ir_node *block, int arity, ir_node *const *in, arch_register_req_t const **in_reqs, amd64_binop_addr_attr_t const *attr_init);
Matthias Braun's avatar
Matthias Braun committed
434

435
typedef ir_node *(*construct_rax_binop_func)(dbg_info *dbgi, ir_node *block, int arity, ir_node *const *in, arch_register_req_t const **in_reqs, amd64_insn_mode_t insn_mode, amd64_op_mode_t op_mode, amd64_addr_t addr);
436

Matthias Braun's avatar
Matthias Braun committed
437
438
439
440
441
442
443
444
/** Flags (may be or'ed together) steering how operands are matched. */
typedef enum match_flags_t {
	match_am           = 0x1, /**< an operand may be folded as address mode */
	match_mode_neutral = 0x2, /**< downconvs on the operands are skipped */
	match_immediate    = 0x4, /**< second operand may become an immediate */
	match_commutative  = 0x8, /**< the first operand may be the folded load, too */
} match_flags_t;

typedef struct amd64_args_t {
Matthias Braun's avatar
Matthias Braun committed
445
446
447
448
	amd64_binop_addr_attr_t     attr;
	ir_node                    *mem_proj;
	ir_node                    *in[4];
	int                         arity;
Matthias Braun's avatar
Matthias Braun committed
449
450
451
	const arch_register_req_t **reqs;
} amd64_args_t;

Matthias Braun's avatar
Matthias Braun committed
452
/**
 * Tries to express @p op as a 32 bit immediate.
 *
 * @param imm                    result; has to be zero initialized
 * @param op                     the node to match
 * @param can_match_ip_relative  whether immediates containing an entity are
 *                               acceptable (they become PC relative)
 * @param upper32_dont_care      whether the upper 32 bit of the sign extended
 *                               immediate are irrelevant to the user
 * @return true if @p imm has been filled in, false if @p op is not usable
 *         as immediate (@p imm is untouched then)
 */
static bool match_immediate_32(x86_imm32_t *imm, const ir_node *op,
                               bool can_match_ip_relative,
                               bool upper32_dont_care)
{
	assert(mode_needs_gp_reg(get_irn_mode(op)));
	assert(imm->offset == 0 && imm->entity == NULL
	       && imm->kind == X86_IMM_VALUE);

	ir_tarval *tv;
	ir_entity *entity;
	unsigned   reloc_kind;
	if (!be_match_immediate(op, &tv, &entity, &reloc_kind))
		return false;

	int32_t val = 0;
	if (tv != NULL) {
		if (!tarval_is_long(tv))
			return false;

		/* the value has to survive the round trip through int32_t */
		long const lval = get_tarval_long(tv);
		val = (int32_t)lval;
		if ((long)val != lval)
			return false;

		/* the immediate value is sign extended to 64bit, sometimes
		 * this is not what we want. */
		if (!upper32_dont_care && val < 0
		    && !mode_is_signed(get_tarval_mode(tv))) {
			return false;
		}
	}

	x86_immediate_kind_t kind = (x86_immediate_kind_t)reloc_kind;
	if (entity != NULL) {
		if (!can_match_ip_relative)
			return false;

		/* plain values and absolute addresses are turned into PC relative
		 * ones, all remaining kinds except PCREL are rejected */
		switch (kind) {
		case X86_IMM_VALUE:
		case X86_IMM_ADDR:
			kind = X86_IMM_PCREL;
			break;
		case X86_IMM_PCREL:
			break;
		default:
			return false;
		}
	}

	imm->kind   = kind;
	imm->offset = val;
	imm->entity = entity;
	return true;
}

static ir_heights_t *heights;

501
502
503
504
505
506
507
508
509
static bool input_depends_on_load(ir_node *load, ir_node *input)
{
	ir_node *block = get_nodes_block(load);
	/* if the dependency is in another block, then we ignore it for now
	   as we only match address mode loads in the same block. */
	return get_nodes_block(input) == block
	    && heights_reachable_in_block(heights, input, load);
}

Tobias Rapp's avatar
Tobias Rapp committed
510
511
512
513
514
515
516
517
518
/**
 * Registers @p node as the transformed version of the node @p mem_proj
 * projects from. Does nothing if @p mem_proj is NULL.
 */
static void fix_node_mem_proj(ir_node *node, ir_node *mem_proj)
{
	if (mem_proj != NULL) {
		ir_node *const pred = get_Proj_pred(mem_proj);
		be_set_transformed_node(pred, node);
	}
}

519
/**
 * Checks whether @p node is the result of a Load that can be folded into a
 * user in @p block as source address mode.
 *
 * @return the Load, or NULL if folding is not possible
 */
static ir_node *source_am_possible(ir_node *block, ir_node *node)
{
	if (!is_Proj(node))
		return NULL;
	ir_node *const pred = get_Proj_pred(node);
	if (!is_Load(pred))
		return NULL;
	assert(get_Proj_num(node) == pn_Load_res);

	/* the load has to be in the block of the user */
	bool const same_block = get_nodes_block(pred) == block;
	if (!same_block)
		return NULL;
	/* make sure we are the only user */
	bool const single_user = get_irn_n_edges(node) == 1;
	if (!single_user)
		return NULL;
	/* From ia32_transform.c:751:
	 * in some edge cases with address mode we might reach the load normally
	 * and through some AM sequence, if it is already materialized then we
	 * can't create an AM node from it */
	if (be_is_transformed(node))
		return NULL;

	return pred;
}

/**
 * Returns true if the mode of @p op has fewer than 32 bits and
 * be_upper_bits_clean() reports false for it.
 */
static bool needs_extension(ir_node *op)
{
	ir_mode *const op_mode = get_irn_mode(op);
	return get_mode_size_bits(op_mode) < 32
	    && !be_upper_bits_clean(op, op_mode);
}

549
/**
 * Creates a sar node shifting the transformed @p node right by the bit size
 * of @p mode minus one and returns its result Proj.
 *
 * @param new_block  block (already transformed) for the new node
 * @param node       the value to shift (not yet transformed)
 * @param mode       determines instruction mode and shift amount
 */
static ir_node *create_sext(ir_node *new_block, ir_node *const node, ir_mode *mode)
{
	amd64_insn_mode_t const insn_mode = get_insn_mode_from_mode(mode);
	dbg_info         *const dbgi      = get_irn_dbg_info(node);
	ir_node          *const operand   = be_transform_node(node);

	amd64_shift_attr_t shift_attr;
	memset(&shift_attr, 0, sizeof(shift_attr));
	shift_attr.base.op_mode = AMD64_OP_SHIFT_IMM;
	shift_attr.insn_mode    = insn_mode;
	shift_attr.immediate    = get_mode_size_bits(mode) - 1;

	ir_node *ins[1] = { operand };
	ir_node *const shift = new_bd_amd64_sar(dbgi, new_block, ARRAY_SIZE(ins), ins, reg_reqs, &shift_attr);
	arch_set_irn_register_req_out(shift, 0, &amd64_requirement_gp_same_0);
	return be_new_Proj(shift, pn_amd64_sar_res);
}

566
/**
 * Creates a xor_0 node in @p new_block and returns its result Proj.
 * @p node only supplies the debug info; its value is not used.
 */
static ir_node *create_zext(ir_node *new_block, ir_node *const node)
{
	ir_node *const zero = new_bd_amd64_xor_0(get_irn_dbg_info(node), new_block);
	return be_new_Proj(zero, pn_amd64_xor_0_res);
}

Tobias Rapp's avatar
Tobias Rapp committed
573
574
/**
 * Decides whether one operand of a binary operation can be folded as a
 * memory operand.
 * @p op2 is tried first; @p op1 is only tried if @p flags contain
 * match_commutative. Folding is never done without match_am or for 8 and
 * 16 bit modes.
 *
 * @param out_load  set to the Load to fold (only if true is returned)
 * @param out_op    set to the operand staying in a register (only if true
 *                  is returned)
 * @return true if address mode should be used
 */
static bool use_address_matching(ir_mode *mode, match_flags_t flags,
                                 ir_node *block,
                                 ir_node *op1, ir_node *op2,
                                 ir_node **out_load, ir_node **out_op)
{
	if ((flags & match_am) == 0)
		return false;

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 8 || bits == 16)
		return false;

	/* the other operand must not depend on the load we want to fold */
	ir_node *const second_load = source_am_possible(block, op2);
	if (second_load != NULL && !input_depends_on_load(second_load, op1)) {
		*out_load = second_load;
		*out_op   = op1;
		return true;
	}

	if ((flags & match_commutative) == 0)
		return false;

	ir_node *const first_load = source_am_possible(block, op1);
	if (first_load != NULL && !input_depends_on_load(first_load, op2)) {
		*out_load = first_load;
		*out_op   = op2;
		return true;
	}
	return false;
}

603
604
/**
 * Builds an address mode for pointer @p ptr.
 * Base and index (if any) are transformed and appended to @p in, their
 * positions are recorded in @p addr; immediate and scale are copied over.
 *
 * @param ptr    the pointer to analyze
 * @param arity  number of entries used in @p in; increased for each input
 *               appended
 * @param in     input array of the node being constructed
 * @param addr   receives base_input, index_input, immediate and log_scale
 */
static void perform_address_matching(ir_node *ptr, int *arity,
                                     ir_node **in, amd64_addr_t *addr)
{
	x86_address_t am;
	memset(&am, 0, sizeof(am));
	x86_create_address_mode(&am, ptr, x86_create_am_normal);

	if (am.base == NULL) {
		addr->base_input = am.ip_base ? RIP_INPUT : NO_INPUT;
	} else {
		int const pos    = (*arity)++;
		addr->base_input = pos;
		in[pos]          = be_transform_node(am.base);
	}

	if (am.index == NULL) {
		addr->index_input = NO_INPUT;
	} else {
		int const pos     = (*arity)++;
		addr->index_input = pos;
		in[pos]           = be_transform_node(am.index);
	}

	ir_entity *const entity = am.imm.entity;
	if (entity != NULL && is_parameter_entity(entity) &&
		get_entity_parameter_number(entity) == IR_VA_START_PARAMETER_NUMBER)
		panic("perform_address_matching: Request for invalid parameter (va_start parameter)");

	addr->immediate = am.imm;
	addr->log_scale = am.scale;
}

Matthias Braun's avatar
Matthias Braun committed
633
634
635
/**
 * Matches the operands of a binary operation and fills @p args with the
 * inputs, requirements and attributes for the new node.
 * Three forms are tried in this order: register/immediate (needs
 * match_immediate), register/address (needs match_am and a foldable Load)
 * and finally register/register.
 *
 * @param args   result, completely overwritten
 * @param block  block of the original node
 * @param mode   mode of the operation
 * @param op1    first operand
 * @param op2    second operand
 * @param flags  matching flags
 */
static void match_binop(amd64_args_t *args, ir_node *block,
                        ir_mode *mode, ir_node *op1, ir_node *op2,
                        match_flags_t flags)
{
	memset(args, 0, sizeof(*args));

	bool const use_xmm       = mode_is_float(mode);
	bool const use_immediate = flags & match_immediate;
	bool const mode_neutral  = flags & match_mode_neutral;

	args->attr.base.insn_mode = get_insn_mode_from_mode(mode);

	/* TODO: legalize phase */
	if (!mode_neutral) {
		/* TODO: extend inputs? */
		(void)needs_extension;
	} else {
		op1 = be_skip_downconv(op1, true);
		op2 = be_skip_downconv(op2, true);
	}

	ir_node *load;
	ir_node *op;
	bool const use_am
		= use_address_matching(mode, flags, block, op1, op2, &load, &op);

	if (use_immediate
	    && match_immediate_32(&args->attr.u.immediate, op2, false, mode_neutral)) {
		assert(!use_xmm && "Can't (yet) match binop with xmm immediate");
		/* fine, we found an immediate */
		args->attr.base.base.op_mode = AMD64_OP_REG_IMM;
		args->in[args->arity++]      = be_transform_node(op1);
		args->reqs                   = reg_reqs;
		return;
	}

	if (!use_am) {
		/* simply transform the arguments */
		args->in[args->arity++]      = be_transform_node(op1);
		args->in[args->arity++]      = be_transform_node(op2);
		args->attr.base.base.op_mode = AMD64_OP_REG_REG;
		args->reqs = use_xmm ? amd64_xmm_xmm_reqs : amd64_reg_reg_reqs;
		return;
	}

	/* address mode: the register operand comes first ... */
	ir_node *const new_op    = be_transform_node(op);
	int      const reg_input = args->arity++;
	args->attr.u.reg_input   = reg_input;
	args->in[reg_input]      = new_op;

	/* ... followed by the inputs of the address ... */
	amd64_addr_t *const addr = &args->attr.base.addr;
	perform_address_matching(get_Load_ptr(load), &(args->arity), args->in,
	                         addr);

	/* the requirement tables are indexed by the number of inputs in front
	 * of the memory input */
	args->reqs = (use_xmm ? xmm_am_reqs : gp_am_reqs)[args->arity];

	/* ... and finally the memory of the load */
	ir_node *const new_mem   = be_transform_node(get_Load_mem(load));
	int      const mem_input = args->arity++;
	args->in[mem_input]      = new_mem;
	addr->mem_input          = mem_input;

	args->mem_proj               = get_Proj_for_pn(load, pn_Load_M);
	args->attr.base.base.op_mode = AMD64_OP_REG_ADDR;
}

static ir_node *gen_binop_am(ir_node *node, ir_node *op1, ir_node *op2,
697
698
                             construct_binop_func func, unsigned pn_res,
                             match_flags_t flags)
Matthias Braun's avatar
Matthias Braun committed
699
700
701
702
{
	ir_node *block = get_nodes_block(node);
	ir_mode *mode  = get_irn_mode(node);
	amd64_args_t args;
Matthias Braun's avatar
Matthias Braun committed
703
	match_binop(&args, block, mode, op1, op2, flags);
Matthias Braun's avatar
Matthias Braun committed
704
705
706

	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
707
	ir_node  *const new_node  = func(dbgi, new_block, args.arity, args.in, args.reqs, &args.attr);
708

Tobias Rapp's avatar
Tobias Rapp committed
709
	fix_node_mem_proj(new_node, args.mem_proj);
Matthias Braun's avatar
Matthias Braun committed
710

711
712
713
714
715
716
717
	if (mode_is_float(mode)) {
		arch_set_irn_register_req_out(new_node, 0,
		                              &amd64_requirement_xmm_same_0);
	} else {
		arch_set_irn_register_req_out(new_node, 0,
		                              &amd64_requirement_gp_same_0);
	}
718
	return be_new_Proj(new_node, pn_res);
Matthias Braun's avatar
Matthias Braun committed
719
720
}

721
722
723
724
725
726
727
728
729
730
731
732
733
/**
 * Creates a binary operation node whose constructor takes instruction mode,
 * operand mode and address directly. Without address mode the second
 * operand is required to be in RAX (reg_rax_reqs).
 * Immediates are not supported, so @p flags must not contain
 * match_immediate.
 *
 * @param node       the node being transformed
 * @param op1        first operand; its mode selects the instruction mode
 * @param op2        second operand
 * @param make_node  constructor of the new node
 * @param flags      matching flags
 * @return the new node itself (not a Proj)
 */
static ir_node *gen_binop_rax(ir_node *node, ir_node *op1, ir_node *op2,
                              construct_rax_binop_func make_node,
                              match_flags_t flags)
{
	bool const mode_neutral = flags & match_mode_neutral;
	assert(! (flags & match_immediate));

	ir_mode *const mode = get_irn_mode(op1);
	amd64_insn_mode_t const insn_mode = get_insn_mode_from_mode(mode);

	/* TODO: legalize phase */
	if (!mode_neutral) {
		/* TODO: extend inputs? */
		(void)needs_extension;
	} else {
		op1 = be_skip_downconv(op1, true);
		op2 = be_skip_downconv(op2, true);
	}

	ir_node *const block = get_nodes_block(node);
	ir_node *in[4];
	int      arity = 0;
	const arch_register_req_t **reqs;
	amd64_op_mode_t op_mode;
	amd64_addr_t    addr;
	memset(&addr, 0, sizeof(addr));

	ir_node *load = NULL;
	ir_node *op   = NULL;
	bool const use_am
		= use_address_matching(mode, flags, block, op1, op2, &load, &op);

	ir_node *mem_proj = NULL;
	if (!use_am) {
		/* simply transform the arguments */
		in[arity++] = be_transform_node(op1);
		in[arity++] = be_transform_node(op2);
		reqs        = reg_rax_reqs;
		op_mode     = AMD64_OP_REG;
	} else {
		/* register operand first, then the address inputs, then memory */
		ir_node *const new_op    = be_transform_node(op);
		int      const reg_input = arity++;
		in[reg_input]            = new_op;

		perform_address_matching(get_Load_ptr(load), &arity, in, &addr);

		/* indexed by the number of inputs in front of the memory input */
		reqs = gp_am_reqs[arity];

		ir_node *const new_mem   = be_transform_node(get_Load_mem(load));
		int      const mem_input = arity++;
		in[mem_input]            = new_mem;
		addr.mem_input           = mem_input;

		mem_proj = get_Proj_for_pn(load, pn_Load_M);
		op_mode  = AMD64_OP_ADDR;
	}

	assert((size_t)arity <= ARRAY_SIZE(in));
	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
	ir_node  *const new_node  = make_node(dbgi, new_block, arity, in, reqs, insn_mode, op_mode, addr);

	/* a folded Load is replaced by the new node */
	if (mem_proj != NULL)
		be_set_transformed_node(load, new_node);

	return new_node;
}

789
790
791
792
793
794
795
796
/**
 * Creates a binary operation node on xmm registers, optionally folding a
 * Load as address mode operand, and returns its result Proj.
 * The instruction mode is always INSN_MODE_64.
 *
 * NOTE(review): the result Proj number is always pn_amd64_subs_res, no
 * matter which constructor is passed as @p make_node - confirm that all
 * constructors used with this function number their result the same way.
 *
 * @param node       the node being transformed
 * @param op0        first operand; its mode is used for address matching
 * @param op1        second operand
 * @param make_node  constructor of the new node
 * @param flags      matching flags
 */
static ir_node *gen_binop_xmm(ir_node *node, ir_node *op0, ir_node *op1,
                              construct_binop_func make_node,
                              match_flags_t flags)
{
	ir_node *const block = get_nodes_block(node);
	ir_mode *const mode  = get_irn_mode(op0);

	amd64_args_t args;
	memset(&args, 0, sizeof(args));
	args.attr.base.insn_mode = INSN_MODE_64;

	ir_node *load;
	ir_node *op;
	bool const use_am
		= use_address_matching(mode, flags, block, op0, op1, &load, &op);

	if (!use_am) {
		args.in[args.arity++] = be_transform_node(op0);
		args.in[args.arity++] = be_transform_node(op1);
		args.attr.base.base.op_mode = AMD64_OP_REG_REG;
		args.reqs = amd64_xmm_xmm_reqs;
	} else {
		/* register operand first, then the address inputs, then memory */
		int const reg_input   = args.arity++;
		args.attr.u.reg_input = reg_input;
		args.in[reg_input]    = be_transform_node(op);

		amd64_addr_t *const addr = &args.attr.base.addr;
		perform_address_matching(get_Load_ptr(load), &args.arity, args.in,
		                         addr);

		/* indexed by the number of inputs in front of the memory input */
		args.reqs = xmm_am_reqs[args.arity];

		ir_node *const new_mem   = be_transform_node(get_Load_mem(load));
		int      const mem_input = args.arity++;
		args.in[mem_input]       = new_mem;
		addr->mem_input          = mem_input;

		args.mem_proj = get_Proj_for_pn(load, pn_Load_M);
		args.attr.base.base.op_mode = AMD64_OP_REG_ADDR;
	}

	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
	ir_node  *const new_node  = make_node(dbgi, new_block, args.arity, args.in, args.reqs, &args.attr);

	/* a folded Load is replaced by the new node */
	fix_node_mem_proj(new_node, args.mem_proj);

	arch_set_irn_register_req_out(new_node, 0, &amd64_requirement_xmm_same_0);
	return be_new_Proj(new_node, pn_amd64_subs_res);
}

840
/** Constructor signature of shift nodes, which take their attributes as an
 * amd64_shift_attr_t. */
typedef ir_node *(*construct_shift_func)(dbg_info *dbgi, ir_node *block,
	int arity, ir_node *const *in, arch_register_req_t const **in_reqs,
	amd64_shift_attr_t const *attr_init);
Matthias Braun's avatar
Matthias Braun committed
841
842

static ir_node *gen_shift_binop(ir_node *node, ir_node *op1, ir_node *op2,
843
844
                                construct_shift_func func, unsigned pn_res,
                                match_flags_t flags)
Matthias Braun's avatar
Matthias Braun committed
845
846
847
848
849
850
851
852
853
854
{
	ir_mode *mode = get_irn_mode(node);
	assert(!mode_is_float(mode));

	if (get_mode_modulo_shift(mode) != 32 && get_mode_size_bits(mode) != 64)
		panic("insupported modulo shift used");

	ir_node *in[3];
	int      arity = 0;
	if (flags & match_mode_neutral) {
855
		op1 = be_skip_downconv(op1, true);
Matthias Braun's avatar
Matthias Braun committed
856
		in[arity++] = be_transform_node(op1);
Matthias Braun's avatar
Matthias Braun committed
857
		mode = get_mode_size_bits(mode) > 32 ? mode_gp : mode_Iu;
Matthias Braun's avatar
Matthias Braun committed
858
	} else {
859
		op1 = be_skip_sameconv(op1);
860
861
862

		/* Use 8/16bit operations instead of doing zext/upconv */
		in[arity++] = be_transform_node(op1);
Matthias Braun's avatar
Matthias Braun committed
863
864
865
866
867
868
	}

	/* we can skip any convs for the shift count, as it only uses the lowest
	 * 5/6 bits anyway */
	while (is_Conv(op2) && get_irn_n_edges(op2) == 1) {
		ir_node *const op = get_Conv_op(op2);
869
		if (get_mode_arithmetic(get_irn_mode(op)) != irma_twos_complement)
Matthias Braun's avatar
Matthias Braun committed
870
871
872
873
			break;
		op2 = op;
	}

Matthias Braun's avatar
Matthias Braun committed
874
875
	amd64_shift_attr_t attr;
	memset(&attr, 0, sizeof(attr));
Matthias Braun's avatar
Matthias Braun committed
876
877
878
	const arch_register_req_t **reqs;
	const arch_register_req_t  *out_req0;
	if (is_Const(op2)) {
Matthias Braun's avatar
Matthias Braun committed
879
880
881
		attr.base.op_mode = AMD64_OP_SHIFT_IMM;
		reqs              = reg_reqs;
		out_req0          = &amd64_requirement_gp_same_0;
882
		attr.immediate    = get_Const_long(op2);
Matthias Braun's avatar
Matthias Braun committed
883
	} else {
Matthias Braun's avatar
Matthias Braun committed
884
885
886
887
		attr.base.op_mode = AMD64_OP_SHIFT_REG;
		in[arity++]       = be_transform_node(op2);
		reqs              = reg_rcx_reqs;
		out_req0          = &amd64_requirement_gp_same_0_not_1;
Matthias Braun's avatar
Matthias Braun committed
888
	}
Matthias Braun's avatar
Matthias Braun committed
889
	attr.insn_mode = get_insn_mode_from_mode(mode);
Matthias Braun's avatar
Matthias Braun committed
890

Matthias Braun's avatar
Matthias Braun committed
891
	dbg_info *const dbgi      = get_irn_dbg_info(node);
892
	ir_node  *const new_block = be_transform_nodes_block(node);
893
	ir_node  *const new_node  = func(dbgi, new_block, arity, in, reqs, &attr);
Matthias Braun's avatar
Matthias Braun committed
894
	arch_set_irn_register_req_out(new_node, 0, out_req0);
895
	return be_new_Proj(new_node, pn_res);
896
897
}

898
/**
 * Builds an amd64 lea node that computes the sum of @p op1 and @p op2.
 *
 * If @p op2 matches as a 32bit immediate it is stored in the address
 * immediate and only @p op1 becomes an input; otherwise both operands become
 * inputs used as base and index. The instruction is 32bit for modes of at
 * most 32 bits and 64bit otherwise.
 *
 * @param node  the node being transformed (supplies mode, debug info, block)
 * @param op1   first summand
 * @param op2   second summand
 * @return the new lea node
 */
static ir_node *create_lea_as_add(ir_node *node, ir_node *op1, ir_node *op2)
{
	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_nodes_block(node);
	ir_mode  *const mode      = get_irn_mode(node);

	amd64_insn_mode_t const insn_mode
		= get_mode_size_bits(mode) <= 32 ? INSN_MODE_32 : INSN_MODE_64;

	amd64_addr_t addr;
	memset(&addr, 0, sizeof(addr));

	/* Try the immediate form first; op1 is an input in either case. */
	bool const op2_is_imm
		= match_immediate_32(&addr.immediate, op2, false, true);

	ir_node                    *in[2];
	int                         arity = 0;
	const arch_register_req_t **reqs;

	in[arity++] = be_transform_node(op1);
	if (op2_is_imm) {
		/* base_input stays 0 from the memset above. */
		addr.index_input = NO_INPUT;
		reqs             = reg_reqs;
	} else {
		in[arity++]      = be_transform_node(op2);
		addr.base_input  = 0;
		addr.index_input = 1;
		reqs             = amd64_reg_reg_reqs;
	}

	return new_bd_amd64_lea(dbgi, new_block, arity, in, reqs, insn_mode, addr);
}

Matthias Braun's avatar
Matthias Braun committed
932
933
/**
 * Transforms an Add node.
 *
 * Float additions are built through gen_binop_am() with the adds
 * constructor. Integer additions are built through gen_binop_am() with the
 * add constructor when address matching applies and as a lea otherwise; in
 * the integer case the node is marked via x86_mark_non_am() afterwards.
 */
static ir_node *gen_Add(ir_node *const node)
{
	ir_node *const op1  = get_Add_left(node);
	ir_node *const op2  = get_Add_right(node);
	ir_mode *const mode = get_irn_mode(node);

	if (mode_is_float(mode)) {
		return gen_binop_am(node, op1, op2, new_bd_amd64_adds,
		                    pn_amd64_adds_res, match_commutative | match_am);
	}

	match_flags_t const flags = match_immediate | match_am
	                            | match_mode_neutral | match_commutative;
	ir_node *const block = get_nodes_block(node);

	/* Out-parameters of use_address_matching(); only its verdict is used. */
	ir_node *load;
	ir_node *op;

	ir_node *res;
	if (use_address_matching(mode, flags, block, op1, op2, &load, &op)) {
		res = gen_binop_am(node, op1, op2, new_bd_amd64_add, pn_amd64_add_res,
		                   flags);
	} else {
		res = create_lea_as_add(node, op1, op2);
	}

	x86_mark_non_am(node);
	return res;
}
961

Matthias Braun's avatar
Matthias Braun committed
962
static ir_node *gen_Sub(ir_node *const node)
963
{
Matthias Braun's avatar
Matthias Braun committed
964
965
	ir_node  *const op1     = get_Sub_left(node);
	ir_node  *const op2     = get_Sub_right(node);
966
	ir_mode  *const mode    = get_irn_mode(node);
967
968

	if (mode_is_float(mode)) {
969
970
		return gen_binop_am(node, op1, op2, new_bd_amd64_subs,
		                    pn_amd64_subs_res, match_am);
971
	} else {
972
		/* TODO: do not match AM yet until we have a sub->neg+add rule
973
		 * in amd64_finish */
974
975
		return gen_binop_am(node, op1, op2, new_bd_amd64_sub, pn_amd64_sub_res,
		                    match_immediate);
976
	}