amd64_transform.c 90.3 KB
Newer Older
1
2
/*
 * This file is part of libFirm.
 * Copyright (C) 2012 University of Karlsruhe.
 */

/**
 * @file
 * @brief   code selection (transform FIRM into amd64 FIRM)
 */
Matthias Braun's avatar
Matthias Braun committed
10
#include "debug.h"
Matthias Braun's avatar
Matthias Braun committed
11
#include "panic.h"
Matthias Braun's avatar
Matthias Braun committed
12
13
#include "heights.h"
#include "ircons.h"
14
#include "iredges.h"
Matthias Braun's avatar
Matthias Braun committed
15
#include "irgmod.h"
16
17
#include "irgraph_t.h"
#include "irmode_t.h"
Matthias Braun's avatar
Matthias Braun committed
18
#include "irnode_t.h"
19
#include "iropt_t.h"
20
#include "tv_t.h"
Matthias Braun's avatar
Matthias Braun committed
21
#include "util.h"
22

23
24
#include "benode.h"
#include "betranshlp.h"
25
#include "bearch_amd64_t.h"
26
#include "beirg.h"
Matthias Braun's avatar
Matthias Braun committed
27
#include "besched.h"
28

Matthias Braun's avatar
Matthias Braun committed
29
#include "amd64_new_nodes.h"
30
31
#include "amd64_nodes_attr.h"
#include "amd64_transform.h"
32
#include "amd64_varargs.h"
Matthias Braun's avatar
Matthias Braun committed
33
#include "../ia32/x86_address_mode.h"
34
#include "../ia32/x86_cconv.h"
35
36
37
38
39

#include "gen_amd64_regalloc_if.h"

DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

40
static ir_mode         *mode_gp;
41
static x86_cconv_t     *current_cconv = NULL;
42
43
static pmap            *node_to_stack;
static be_stackorder_t *stackorder;
44

45
46
47
/** we don't have a concept of aliasing registers, so enumerate them
 * manually for the asm nodes. */
const x86_clobber_name_t amd64_additional_clobber_names[] = {
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
	{ "al", REG_RAX }, { "ah", REG_RAX }, { "ax", REG_RAX }, { "eax", REG_RAX },
	{ "bl", REG_RBX }, { "bh", REG_RBX }, { "bx", REG_RBX }, { "ebx", REG_RBX },
	{ "cl", REG_RCX }, { "ch", REG_RCX }, { "cx", REG_RCX }, { "ecx", REG_RCX },
	{ "dl", REG_RDX }, { "dh", REG_RDX }, { "dx", REG_RDX }, { "edx", REG_RDX },
	{ "sil",  REG_RSI }, { "si",   REG_RSI }, { "esi",  REG_RSI },
	{ "dil",  REG_RDI }, { "di",   REG_RDI }, { "edi",  REG_RDI },
	{ "bpl",  REG_RBP }, { "bp",   REG_RBP }, { "ebp",  REG_RBP },
	{ "spl",  REG_RSP }, { "sp",   REG_RSP }, { "esp",  REG_RSP },
	{ "r8b",  REG_R8  }, { "r8w",  REG_R8  }, { "r8d",  REG_R8  },
	{ "r9b",  REG_R9  }, { "r9w",  REG_R9  }, { "r9d",  REG_R9  },
	{ "r10b", REG_R10 }, { "r10w", REG_R10 }, { "r10d", REG_R10 },
	{ "r11b", REG_R11 }, { "r11w", REG_R11 }, { "r11d", REG_R11 },
	{ "r12b", REG_R12 }, { "r12w", REG_R12 }, { "r12d", REG_R12 },
	{ "r13b", REG_R13 }, { "r13w", REG_R13 }, { "r13d", REG_R13 },
	{ "r14b", REG_R14 }, { "r14w", REG_R14 }, { "r14d", REG_R14 },
	{ "r15b", REG_R15 }, { "r15w", REG_R15 }, { "r15d", REG_R15 },
64
65
66
67
	{ NULL, ~0u }
};

#define GP &amd64_reg_classes[CLASS_amd64_gp]
68
const x86_asm_constraint_list_t amd64_asm_constraints = {
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
	['A'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RDX },
	['D'] = { MATCH_REG, GP, 1 << REG_GP_RDI },
	['I'] = { MATCH_IMM, GP, 0 },
	['J'] = { MATCH_IMM, GP, 0 },
	['K'] = { MATCH_IMM, GP, 0 },
	['L'] = { MATCH_IMM, GP, 0 },
	['M'] = { MATCH_IMM, GP, 0 },
	['N'] = { MATCH_IMM, GP, 0 },
	['O'] = { MATCH_IMM, GP, 0 },
	['R'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX | 1 << REG_GP_RSI
		| 1 << REG_GP_RDI | 1 << REG_GP_RBP | 1 << REG_GP_RSP },
	['S'] = { MATCH_REG, GP, 1 << REG_GP_RSI },
	['Q'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX },
	['V'] = { MATCH_MEM, GP, 0 },
	['X'] = { MATCH_ANY, GP, 0 },
	['a'] = { MATCH_REG, GP, 1 << REG_GP_RAX },
	['b'] = { MATCH_REG, GP, 1 << REG_GP_RBX },
	['c'] = { MATCH_REG, GP, 1 << REG_GP_RCX },
	['d'] = { MATCH_REG, GP, 1 << REG_GP_RDX },
	['g'] = { MATCH_ANY, GP, 0 },
	['i'] = { MATCH_IMM, GP, 0 },
	['l'] = { MATCH_REG, GP, 1 << REG_GP_RAX | 1 << REG_GP_RBX
		| 1 << REG_GP_RCX | 1 << REG_GP_RDX | 1 << REG_GP_RSI
		| 1 << REG_GP_RDI | 1 << REG_GP_RBP },
	['m'] = { MATCH_MEM, GP, 0 },
	['n'] = { MATCH_IMM, GP, 0 },
	['o'] = { MATCH_MEM, GP, 0 },
	['p'] = { MATCH_REG, GP, 0 },
	['q'] = { MATCH_REG, GP, 0 },
	['r'] = { MATCH_REG, GP, 0 },
	['x'] = { MATCH_REG, &amd64_reg_classes[CLASS_amd64_xmm], 0 },

	// see comments in ia32_transform.c about unimplemented stuff.
};
#undef GP

Matthias Braun's avatar
Matthias Braun committed
107
108
109
/** Mask with only bit number @p x set. The argument is parenthesized so that
 * compound arguments such as BIT(a | b) are shifted as a whole. */
#define BIT(x)    (1u << (x))

static const arch_register_req_t amd64_requirement_gp_same_0 = {
110
111
112
	.cls               = &amd64_reg_classes[CLASS_amd64_gp],
	.should_be_same    = BIT(0),
	.width             = 1,
Matthias Braun's avatar
Matthias Braun committed
113
114
};

115
static const arch_register_req_t amd64_requirement_xmm_same_0 = {
116
117
118
	.cls               = &amd64_reg_classes[CLASS_amd64_xmm],
	.should_be_same    = BIT(0),
	.width             = 1,
119
120
};

Matthias Braun's avatar
Matthias Braun committed
121
static const arch_register_req_t amd64_requirement_gp_same_0_not_1 = {
122
123
124
125
	.cls               = &amd64_reg_classes[CLASS_amd64_gp],
	.should_be_same    = BIT(0),
	.must_be_different = BIT(1),
	.width             = 1,
Matthias Braun's avatar
Matthias Braun committed
126
127
};

128
static const arch_register_req_t amd64_requirement_xmm_same_0_not_1 = {
129
130
131
132
	.cls               = &amd64_reg_classes[CLASS_amd64_xmm],
	.should_be_same    = BIT(0),
	.must_be_different = BIT(1),
	.width             = 1,
133
134
};

Matthias Braun's avatar
Matthias Braun committed
135
static const arch_register_req_t *mem_reqs[] = {
136
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
137
138
139
};

static const arch_register_req_t *reg_mem_reqs[] = {
140
	&amd64_class_reg_req_gp,
141
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
142
143
};

Tobias Rapp's avatar
Tobias Rapp committed
144
static const arch_register_req_t *rsp_mem_reqs[] = {
145
	&amd64_single_reg_req_gp_rsp,
146
	&arch_memory_requirement,
Tobias Rapp's avatar
Tobias Rapp committed
147
148
};

149
arch_register_req_t const *rsp_reg_mem_reqs[] = {
150
151
	&amd64_single_reg_req_gp_rsp,
	&amd64_class_reg_req_gp,
152
	&arch_memory_requirement,
Tobias Rapp's avatar
Tobias Rapp committed
153
154
};

155
static const arch_register_req_t *xmm_mem_reqs[] = {
156
	&amd64_class_reg_req_xmm,
157
	&arch_memory_requirement,
158
159
};

Matthias Braun's avatar
Matthias Braun committed
160
static const arch_register_req_t *reg_reg_mem_reqs[] = {
161
162
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
163
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
164
165
};

166
arch_register_req_t const *xmm_reg_mem_reqs[] = {
167
168
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_gp,
169
	&arch_memory_requirement,
170
171
};

Matthias Braun's avatar
Matthias Braun committed
172
static const arch_register_req_t *reg_reg_reg_mem_reqs[] = {
173
174
175
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
176
	&arch_memory_requirement,
Matthias Braun's avatar
Matthias Braun committed
177
178
};

179
static const arch_register_req_t *xmm_reg_reg_mem_reqs[] = {
180
181
182
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
183
	&arch_memory_requirement,
184
185
};

Tobias Rapp's avatar
Tobias Rapp committed
186
static const arch_register_req_t *reg_flags_reqs[] = {
187
188
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_flags,
189
190
};

191
arch_register_req_t const *amd64_reg_reg_reqs[] = {
192
193
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
194
195
};

196
static const arch_register_req_t *reg_rax_reqs[] = {
197
	&amd64_class_reg_req_gp,
198
	&amd64_single_reg_req_gp_rax,
199
200
};

201
static const arch_register_req_t *reg_rax_rdx_mem_reqs[] = {
202
	&amd64_class_reg_req_gp,
203
	&amd64_single_reg_req_gp_rax,
204
	&amd64_single_reg_req_gp_rdx,
205
	&arch_memory_requirement,
206
207
};

208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
static const arch_register_req_t *rax_reg_mem_reqs[] = {
	&amd64_single_reg_req_gp_rax,
	&amd64_class_reg_req_gp,
	&arch_memory_requirement,
};

static const arch_register_req_t *reg_rax_reg_mem_reqs[] = {
	&amd64_class_reg_req_gp,
	&amd64_single_reg_req_gp_rax,
	&amd64_class_reg_req_gp,
	&arch_memory_requirement,
};

static const arch_register_req_t *reg_reg_rax_reg_mem_reqs[] = {
	&amd64_class_reg_req_gp,
	&amd64_class_reg_req_gp,
	&amd64_single_reg_req_gp_rax,
	&amd64_class_reg_req_gp,
	&arch_memory_requirement,
};

229
arch_register_req_t const *reg_reqs[] = {
230
	&amd64_class_reg_req_gp,
Matthias Braun's avatar
Matthias Braun committed
231
232
};

233
arch_register_req_t const *amd64_xmm_reqs[] = {
234
	&amd64_class_reg_req_xmm,
235
236
};

Matthias Braun's avatar
Matthias Braun committed
237
static const arch_register_req_t *reg_rcx_reqs[] = {
238
239
	&amd64_class_reg_req_gp,
	&amd64_single_reg_req_gp_rcx,
Matthias Braun's avatar
Matthias Braun committed
240
241
};

242
243
244
static const arch_register_req_t *no_reqs[] = {
};

245
arch_register_req_t const *amd64_xmm_xmm_reqs[] = {
246
247
	&amd64_class_reg_req_xmm,
	&amd64_class_reg_req_xmm,
248
249
};

250
arch_register_req_t const **const gp_am_reqs[] = {
251
252
253
254
255
256
257
258
259
260
261
262
263
	mem_reqs,
	reg_mem_reqs,
	reg_reg_mem_reqs,
	reg_reg_reg_mem_reqs,
};

static arch_register_req_t const **const xmm_am_reqs[] = {
	mem_reqs,
	xmm_mem_reqs,
	xmm_reg_mem_reqs,
	xmm_reg_reg_mem_reqs,
};

Matthias Braun's avatar
Matthias Braun committed
264
265
/**
 * Tells whether values of @p mode are kept in general purpose registers:
 * the mode must use two's complement arithmetic and must not be
 * amd64_mode_xmm.
 */
static inline bool mode_needs_gp_reg(ir_mode *mode)
{
	if (get_mode_arithmetic(mode) != irma_twos_complement)
		return false;
	/* mode_xmm is 128bit int at the moment */
	return mode != amd64_mode_xmm;
}

270
271
/** Looks up the Start Proj of @p irg that belongs to register RSP. */
static ir_node *get_initial_sp(ir_graph *irg)
{
	arch_register_t const *const rsp = &amd64_registers[REG_RSP];
	return be_get_Start_proj(irg, rsp);
}

/** Looks up the Start Proj of @p irg that belongs to register RBP. */
static ir_node *get_initial_fp(ir_graph *irg)
{
	arch_register_t const *const rbp = &amd64_registers[REG_RBP];
	return be_get_Start_proj(irg, rbp);
}

/**
 * Returns the node used as frame base in @p irg: the initial stack pointer
 * when the current calling convention omits the frame pointer, the initial
 * frame pointer otherwise.
 */
static ir_node *get_frame_base(ir_graph *irg)
{
	return current_cconv->omit_fp ? get_initial_sp(irg)
	                              : get_initial_fp(irg);
}
288

289
290
291
static amd64_insn_mode_t get_insn_mode_from_mode(const ir_mode *mode)
{
	switch (get_mode_size_bits(mode)) {
292
293
294
295
296
	case   8: return INSN_MODE_8;
	case  16: return INSN_MODE_16;
	case  32: return INSN_MODE_32;
	case  64: return INSN_MODE_64;
	case 128: return INSN_MODE_128;
297
	}
298
	panic("unexpected mode %+F", mode);
299
300
}

301
/**
 * Returns the entity that holds the constant @p tv. Entities are cached in
 * amd64_constants, keyed by the tarval; on a miss a new private entity with
 * constant linkage is created in the global type, initialized with @p tv
 * and added to the cache.
 */
ir_entity *create_float_const_entity(ir_tarval *const tv)
{
	ir_entity *const cached = pmap_get(ir_entity, amd64_constants, tv);
	if (cached != NULL)
		return cached;

	ir_type   *const type  = get_type_for_mode(get_tarval_mode(tv));
	ir_type   *const owner = get_glob_type();
	ir_entity *const fresh = new_entity(owner, id_unique("C%u"), type);
	set_entity_visibility(fresh, ir_visibility_private);
	add_entity_linkage(fresh, IR_LINKAGE_CONSTANT);
	set_entity_initializer(fresh, create_initializer_tarval(tv));

	pmap_insert(amd64_constants, tv, fresh);
	return fresh;
}

322
/**
 * Fills @p addr so that it addresses @p entity, which must be a defined,
 * private entity with constant linkage. With be_options.pic set the address
 * is RIP relative (X86_IMM_PCREL), otherwise it is absolute (X86_IMM_ADDR)
 * without a base. All remaining fields of @p addr are zeroed.
 */
void init_lconst_addr(amd64_addr_t *addr, ir_entity *entity)
{
	assert(entity_has_definition(entity));
	assert(get_entity_linkage(entity) == IR_LINKAGE_CONSTANT);
	assert(get_entity_visibility(entity) == ir_visibility_private);

	memset(addr, 0, sizeof(*addr));
	addr->immediate.entity = entity;
	addr->index_input      = NO_INPUT;
	if (be_options.pic) {
		addr->immediate.kind = X86_IMM_PCREL;
		addr->base_input     = RIP_INPUT;
	} else {
		addr->immediate.kind = X86_IMM_ADDR;
		addr->base_input     = NO_INPUT;
	}
}

335
static ir_node *create_float_const(dbg_info *dbgi, ir_node *block,
Matthias Braun's avatar
Matthias Braun committed
336
                                   ir_tarval *tv)
337
338
339
{
	ir_graph  *irg     = get_irn_irg(block);
	ir_mode   *tv_mode = get_tarval_mode(tv);
340
	ir_entity *entity  = create_float_const_entity(tv);
341
342
343
344
	ir_node   *nomem   = get_irg_no_mem(irg);

	ir_node *in[] = { nomem };
	amd64_addr_t addr;
345
	init_lconst_addr(&addr, entity);
346

347
	ir_node *load;
348
	unsigned pn_res;
349
	amd64_insn_mode_t insn_mode = get_insn_mode_from_mode(tv_mode);
350
	if (insn_mode == INSN_MODE_128) {
351
		load = new_bd_amd64_movdqa(dbgi, block, ARRAY_SIZE(in), in, mem_reqs, AMD64_OP_ADDR, addr);
352
		pn_res = pn_amd64_movdqa_res;
353
	} else {
354
		load = new_bd_amd64_movs_xmm(dbgi, block, ARRAY_SIZE(in), in, mem_reqs, insn_mode, AMD64_OP_ADDR, addr);
355
		pn_res = pn_amd64_movs_xmm_res;
356
	}
Matthias Braun's avatar
Matthias Braun committed
357
	set_irn_pinned(load, false);
358

359
	return be_new_Proj(load, pn_res);
360
361
362
363
364
}

/**
 * Builds a tarval of @p mode in which only the most significant bit is set.
 * @p mode must be 32, 64 or 128 bits wide; the bit pattern is produced in an
 * integer mode of that width and then bitcast to @p mode.
 */
ir_tarval *create_sign_tv(ir_mode *mode)
{
	unsigned const bits = get_mode_size_bits(mode);
	assert(bits == 32 || bits == 64 || bits == 128);

	ir_mode *int_mode;
	if (bits == 128) {
		int_mode = amd64_mode_xmm;
	} else if (bits == 64) {
		int_mode = mode_Lu;
	} else {
		int_mode = mode_Iu;
	}

	ir_tarval *const msb
		= tarval_shl_unsigned(get_mode_one(int_mode), bits - 1);
	return tarval_bitcast(msb, mode);
}

374
375
/**
 * Transforms a Const node. Values of modes that need a gp register become a
 * mov_imm, 64bit wide only if the value does not fit in 32 unsigned bits.
 * For all other modes a null value becomes xorpd_0 and anything else is
 * loaded via create_float_const().
 */
static ir_node *gen_Const(ir_node *node)
{
	ir_node   *const new_block = be_transform_nodes_block(node);
	dbg_info  *const dbgi      = get_irn_dbg_info(node);
	ir_tarval *const value     = get_Const_tarval(node);

	if (mode_needs_gp_reg(get_irn_mode(node))) {
		uint64_t const bits = get_tarval_uint64(value);
		amd64_imm64_t const imm = {
			.kind   = X86_IMM_VALUE,
			.offset = bits,
		};
		amd64_insn_mode_t const size
			= bits > UINT32_MAX ? INSN_MODE_64 : INSN_MODE_32;
		return new_bd_amd64_mov_imm(dbgi, new_block, size, &imm);
	}

	if (tarval_is_null(value))
		return new_bd_amd64_xorpd_0(dbgi, new_block);
	return create_float_const(dbgi, new_block, value);
}

398
/**
 * Transforms an Address node into a 64bit mov_imm whose immediate is the
 * address (X86_IMM_ADDR) of the node's entity.
 */
static ir_node *gen_Address(ir_node *node)
{
	ir_node  *const new_block = be_transform_nodes_block(node);
	dbg_info *const dbgi      = get_irn_dbg_info(node);

	amd64_imm64_t const address = {
		.kind   = X86_IMM_ADDR,
		.entity = get_Address_entity(node),
	};
	return new_bd_amd64_mov_imm(dbgi, new_block, INSN_MODE_64, &address);
}
Matthias Braun's avatar
Matthias Braun committed
410

411
412
413
414
415
416
/**
 * Transforms a be_Relocation node. An X86_IMM_ADDR relocation becomes a
 * 64bit mov_imm of the entity address; X86_IMM_PCREL and X86_IMM_GOTPCREL
 * become a RIP relative lea without inputs. Any other kind panics.
 */
static ir_node *gen_be_Relocation(ir_node *node)
{
	ir_node             *const new_block = be_transform_nodes_block(node);
	ir_entity           *const entity    = be_get_Relocation_entity(node);
	x86_immediate_kind_t const kind
		= (x86_immediate_kind_t)be_get_Relocation_kind(node);

	if (kind == X86_IMM_ADDR) {
		amd64_imm64_t const imm = {
			.kind   = X86_IMM_ADDR,
			.entity = entity,
		};
		return new_bd_amd64_mov_imm(NULL, new_block, INSN_MODE_64, &imm);
	}

	/* can GOTPCREL happen here? */
	if (kind == X86_IMM_PCREL || kind == X86_IMM_GOTPCREL) {
		amd64_addr_t addr;
		memset(&addr, 0, sizeof(addr));
		addr.base_input       = RIP_INPUT;
		addr.index_input      = NO_INPUT;
		addr.mem_input        = NO_INPUT;
		addr.immediate.kind   = kind;
		addr.immediate.entity = entity;
		return new_bd_amd64_lea(NULL, new_block, 0, NULL, NULL, INSN_MODE_64, addr);
	}

	panic("Unexpected relocation kind");
}

445
446
/**
 * Creates an IncSP node for RSP in @p block, based on @p old_sp, with the
 * given @p offset and @p align, and flags it as modifying the flags.
 */
ir_node *amd64_new_IncSP(ir_node *block, ir_node *old_sp, int offset,
                         unsigned align)
{
	arch_register_t const *const rsp = &amd64_registers[REG_RSP];
	ir_node *const result = be_new_IncSP(rsp, block, old_sp, offset, align);
	arch_add_irn_flags(result, arch_irn_flag_modify_flags);
	return result;
}

454
/** Node constructor taking a binop/address attribute; this is the callback
 * type accepted by gen_binop_am() and gen_binop_xmm(). */
typedef ir_node *(*construct_binop_func)(dbg_info *dbgi, ir_node *block, int arity, ir_node *const *in, arch_register_req_t const **in_reqs, amd64_binop_addr_attr_t const *attr_init);
Matthias Braun's avatar
Matthias Braun committed
455

456
/** Node constructor taking instruction mode, operand mode and address by
 * value; this is the callback type accepted by gen_binop_rax(). */
typedef ir_node *(*construct_rax_binop_func)(dbg_info *dbgi, ir_node *block, int arity, ir_node *const *in, arch_register_req_t const **in_reqs, amd64_insn_mode_t insn_mode, amd64_op_mode_t op_mode, amd64_addr_t addr);
457

Matthias Braun's avatar
Matthias Braun committed
458
459
460
461
462
463
464
465
/** Bit flags that steer how the operands of a binary operation are matched. */
typedef enum match_flags_t {
	match_am           = 1 << 0, /**< a Load operand may be folded in as address mode */
	match_mode_neutral = 1 << 1, /**< down-conversions of the operands are skipped */
	match_immediate    = 1 << 2, /**< the second operand may be matched as immediate */
	match_commutative  = 1 << 3, /**< the first operand may also be the folded Load */
} match_flags_t;

typedef struct amd64_args_t {
Matthias Braun's avatar
Matthias Braun committed
466
467
468
469
	amd64_binop_addr_attr_t     attr;
	ir_node                    *mem_proj;
	ir_node                    *in[4];
	int                         arity;
Matthias Braun's avatar
Matthias Braun committed
470
471
472
	const arch_register_req_t **reqs;
} amd64_args_t;

Matthias Braun's avatar
Matthias Braun committed
473
/**
 * Tries to express @p op as a 32bit immediate.
 *
 * @param imm                    receives the immediate; must be zeroed on
 *                               entry and is written only on success
 * @param op                     node to match, of a mode that needs a gp
 *                               register
 * @param can_match_ip_relative  whether an entity reference is acceptable;
 *                               if so it is matched as X86_IMM_PCREL
 * @param upper32_dont_care      whether a negative value of an unsigned
 *                               mode may be used although it is sign
 *                               extended to 64bit
 * @return true if @p imm was filled in
 */
static bool match_immediate_32(x86_imm32_t *imm, const ir_node *op,
                               bool can_match_ip_relative,
                               bool upper32_dont_care)
{
	assert(mode_needs_gp_reg(get_irn_mode(op)));
	assert(imm->offset == 0 && imm->entity == NULL
	       && imm->kind == X86_IMM_VALUE);

	ir_tarval *tv;
	ir_entity *entity;
	unsigned   reloc_kind;
	if (!be_match_immediate(op, &tv, &entity, &reloc_kind))
		return false;

	int32_t offset = 0;
	if (tv != NULL) {
		if (!tarval_is_long(tv))
			return false;

		/* the value has to survive the round trip through int32_t */
		long const wide = get_tarval_long(tv);
		offset = (int32_t)wide;
		if ((long)offset != wide)
			return false;

		/* the immediate value is sign extended to 64bit, sometimes
		 * this is not what we want. */
		if (offset < 0 && !upper32_dont_care
		    && !mode_is_signed(get_tarval_mode(tv)))
			return false;
	}

	x86_immediate_kind_t kind = (x86_immediate_kind_t)reloc_kind;
	if (entity != NULL) {
		if (!can_match_ip_relative)
			return false;

		switch (kind) {
		case X86_IMM_VALUE:
		case X86_IMM_ADDR:
			kind = X86_IMM_PCREL;
			break;
		case X86_IMM_PCREL:
			break;
		default:
			return false;
		}
	}

	imm->kind   = kind;
	imm->offset = offset;
	imm->entity = entity;
	return true;
}

/* Height information that input_depends_on_load() queries for reachability
 * within one block. */
static ir_heights_t *heights;

522
523
524
525
526
527
528
529
530
/**
 * Tells whether @p input lies in the same block as @p load and the heights
 * query for the pair (input, load) reports reachability within that block.
 */
static bool input_depends_on_load(ir_node *load, ir_node *input)
{
	/* a dependency in another block is ignored for now, as address mode
	 * loads are only matched within one block. */
	if (get_nodes_block(input) != get_nodes_block(load))
		return false;
	return heights_reachable_in_block(heights, input, load);
}

Tobias Rapp's avatar
Tobias Rapp committed
531
532
533
534
535
536
537
538
539
/**
 * If @p mem_proj is not NULL, registers @p node as the transformed version
 * of the node that @p mem_proj projects from.
 */
static void fix_node_mem_proj(ir_node *node, ir_node *mem_proj)
{
	if (mem_proj != NULL) {
		be_set_transformed_node(get_Proj_pred(mem_proj), node);
	}
}

540
/**
 * Checks whether @p node may be folded into its user as an address mode
 * operand.
 *
 * @return the Load behind @p node if @p node is the result Proj of a Load in
 *         @p block, has exactly one user and is not transformed yet;
 *         NULL otherwise
 */
static ir_node *source_am_possible(ir_node *block, ir_node *node)
{
	if (!is_Proj(node) || !is_Load(get_Proj_pred(node)))
		return NULL;

	ir_node *const load = get_Proj_pred(node);
	assert(get_Proj_num(node) == pn_Load_res);

	bool const in_block  = get_nodes_block(load) == block;
	/* make sure we are the only user */
	bool const only_user = get_irn_n_edges(node) == 1;
	if (!in_block || !only_user)
		return NULL;

	/* From ia32_transform.c:751:
	 * in some edge cases with address mode we might reach the load normally
	 * and through some AM sequence, if it is already materialized then we
	 * can't create an AM node from it */
	return be_is_transformed(node) ? NULL : load;
}

/**
 * Tells whether @p op is narrower than 32 bits and its upper bits are not
 * known to be clean.
 */
static bool needs_extension(ir_node *op)
{
	ir_mode *const mode = get_irn_mode(op);
	return get_mode_size_bits(mode) < 32 && !be_upper_bits_clean(op, mode);
}

570
/**
 * Creates an arithmetic right shift of the transformed @p node by the bit
 * size of @p mode minus one and returns its result Proj. The result
 * requirement is amd64_requirement_gp_same_0.
 */
static ir_node *create_sext(ir_node *new_block, ir_node *const node, ir_mode *mode)
{
	amd64_insn_mode_t const size = get_insn_mode_from_mode(mode);
	dbg_info         *const dbgi = get_irn_dbg_info(node);
	ir_node          *in[]       = { be_transform_node(node) };

	amd64_shift_attr_t attr;
	memset(&attr, 0, sizeof(attr));
	attr.insn_mode    = size;
	attr.immediate    = get_mode_size_bits(mode) - 1;
	attr.base.op_mode = AMD64_OP_SHIFT_IMM;

	ir_node *const shift = new_bd_amd64_sar(dbgi, new_block, ARRAY_SIZE(in), in, reg_reqs, &attr);
	arch_set_irn_register_req_out(shift, 0, &amd64_requirement_gp_same_0);
	return be_new_Proj(shift, pn_amd64_sar_res);
}

587
/**
 * Creates an xor_0 node in @p new_block and returns its result Proj.
 * Only the debug info of @p node is used.
 */
static ir_node *create_zext(ir_node *new_block, ir_node *const node)
{
	ir_node *const zero = new_bd_amd64_xor_0(get_irn_dbg_info(node), new_block);
	return be_new_Proj(zero, pn_amd64_xor_0_res);
}

Tobias Rapp's avatar
Tobias Rapp committed
594
595
/**
 * Decides whether one operand of a binary operation can be folded in as an
 * address mode Load.
 *
 * Requires match_am in @p flags and a @p mode that is neither 8 nor 16 bits
 * wide. @p op2 is tried as the Load first; @p op1 is tried only if
 * match_commutative is set. A candidate is rejected if the other operand
 * depends on its Load.
 *
 * @param out_load  receives the Load to fold (written on success only)
 * @param out_op    receives the remaining operand (written on success only)
 * @return true if address matching should be used
 */
static bool use_address_matching(ir_mode *mode, match_flags_t flags,
                                 ir_node *block,
                                 ir_node *op1, ir_node *op2,
                                 ir_node **out_load, ir_node **out_op)
{
	if ((flags & match_am) == 0)
		return false;

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 8 || bits == 16)
		return false;

	/* candidate pairs in order of preference */
	ir_node *const mem_operand[] = { op2, op1 };
	ir_node *const reg_operand[] = { op1, op2 };
	unsigned const n_candidates  = (flags & match_commutative) ? 2 : 1;

	for (unsigned i = 0; i < n_candidates; ++i) {
		ir_node *const load = source_am_possible(block, mem_operand[i]);
		if (load == NULL || input_depends_on_load(load, reg_operand[i]))
			continue;
		*out_load = load;
		*out_op   = reg_operand[i];
		return true;
	}
	return false;
}

624
625
/**
 * Builds an x86 address mode for @p ptr and stores it in @p addr.
 *
 * A base and an index, if present, are transformed and appended to @p in,
 * with *@p arity advanced for each; their positions are recorded in
 * @p addr. Without a base, base_input is RIP_INPUT for an ip-relative
 * address and NO_INPUT otherwise. Immediate and scale are copied over.
 * Panics if the address refers to the va_start parameter entity.
 */
static void perform_address_matching(ir_node *ptr, int *arity,
                                     ir_node **in, amd64_addr_t *addr)
{
	x86_address_t am;
	memset(&am, 0, sizeof(am));
	x86_create_address_mode(&am, ptr, x86_create_am_normal);

	if (am.base == NULL) {
		addr->base_input = am.ip_base ? RIP_INPUT : NO_INPUT;
	} else {
		int const slot   = (*arity)++;
		addr->base_input = slot;
		in[slot]         = be_transform_node(am.base);
	}

	if (am.index == NULL) {
		addr->index_input = NO_INPUT;
	} else {
		int const slot    = (*arity)++;
		addr->index_input = slot;
		in[slot]          = be_transform_node(am.index);
	}

	ir_entity *const entity = am.imm.entity;
	if (entity != NULL && is_parameter_entity(entity)
	    && get_entity_parameter_number(entity) == IR_VA_START_PARAMETER_NUMBER) {
		panic("perform_address_matching: Request for invalid parameter (va_start parameter)");
	}

	addr->log_scale = am.scale;
	addr->immediate = am.imm;
}

Matthias Braun's avatar
Matthias Braun committed
654
655
656
/**
 * Matches the operands of a binary operation and fills @p args with inputs,
 * requirements and attribute for the node constructor.
 *
 * Three forms are tried in this order:
 *  - register + immediate, if match_immediate is set and @p op2 fits,
 *  - register + address, if a Load operand can be folded in,
 *  - register + register otherwise.
 *
 * @param args   result, cleared first
 * @param block  block of the original node
 * @param mode   mode of the operation; determines the instruction size and
 *               whether xmm requirements are used
 * @param flags  matching options
 */
static void match_binop(amd64_args_t *args, ir_node *block,
                        ir_mode *mode, ir_node *op1, ir_node *op2,
                        match_flags_t flags)
{
	memset(args, 0, sizeof(*args));

	bool const is_xmm      = mode_is_float(mode);
	bool const try_imm     = (flags & match_immediate) != 0;
	bool const is_neutral  = (flags & match_mode_neutral) != 0;

	args->attr.base.insn_mode = get_insn_mode_from_mode(mode);

	/* TODO: legalize phase */
	if (is_neutral) {
		op1 = be_skip_downconv(op1, true);
		op2 = be_skip_downconv(op2, true);
	} else {
		/* TODO: extend inputs? */
		(void)needs_extension;
	}

	ir_node *load;
	ir_node *reg_op;
	bool const use_am
		= use_address_matching(mode, flags, block, op1, op2, &load, &reg_op);

	if (try_imm
	    && match_immediate_32(&args->attr.u.immediate, op2, false, is_neutral)) {
		/* fine, we found an immediate */
		assert(!is_xmm && "Can't (yet) match binop with xmm immediate");
		ir_node *const new_op1 = be_transform_node(op1);
		args->attr.base.base.op_mode = AMD64_OP_REG_IMM;
		args->in[args->arity++]      = new_op1;
		args->reqs                   = reg_reqs;
		return;
	}

	if (!use_am) {
		/* simply transform the arguments */
		ir_node *const new_op1 = be_transform_node(op1);
		args->in[args->arity++] = new_op1;
		ir_node *const new_op2 = be_transform_node(op2);
		args->in[args->arity++] = new_op2;

		args->attr.base.base.op_mode = AMD64_OP_REG_REG;
		args->reqs = is_xmm ? amd64_xmm_xmm_reqs : amd64_reg_reg_reqs;
		return;
	}

	/* address mode: register operand first, then the address inputs */
	ir_node *const new_op = be_transform_node(reg_op);
	args->attr.u.reg_input  = args->arity;
	args->in[args->arity++] = new_op;

	amd64_addr_t *const addr = &args->attr.base.addr;
	perform_address_matching(get_Load_ptr(load), &args->arity, args->in, addr);

	/* the tables are indexed by the arity before the memory input */
	arch_register_req_t const **const *const table
		= is_xmm ? xmm_am_reqs : gp_am_reqs;
	args->reqs = table[args->arity];

	ir_node *const new_mem = be_transform_node(get_Load_mem(load));
	addr->mem_input         = args->arity;
	args->in[args->arity++] = new_mem;

	args->mem_proj               = get_Proj_for_pn(load, pn_Load_M);
	args->attr.base.base.op_mode = AMD64_OP_REG_ADDR;
}

static ir_node *gen_binop_am(ir_node *node, ir_node *op1, ir_node *op2,
718
719
                             construct_binop_func func, unsigned pn_res,
                             match_flags_t flags)
Matthias Braun's avatar
Matthias Braun committed
720
721
722
723
{
	ir_node *block = get_nodes_block(node);
	ir_mode *mode  = get_irn_mode(node);
	amd64_args_t args;
Matthias Braun's avatar
Matthias Braun committed
724
	match_binop(&args, block, mode, op1, op2, flags);
Matthias Braun's avatar
Matthias Braun committed
725
726
727

	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
728
	ir_node  *const new_node  = func(dbgi, new_block, args.arity, args.in, args.reqs, &args.attr);
729

Tobias Rapp's avatar
Tobias Rapp committed
730
	fix_node_mem_proj(new_node, args.mem_proj);
Matthias Braun's avatar
Matthias Braun committed
731

732
733
734
735
736
737
738
	if (mode_is_float(mode)) {
		arch_set_irn_register_req_out(new_node, 0,
		                              &amd64_requirement_xmm_same_0);
	} else {
		arch_set_irn_register_req_out(new_node, 0,
		                              &amd64_requirement_gp_same_0);
	}
739
	return be_new_Proj(new_node, pn_res);
Matthias Braun's avatar
Matthias Braun committed
740
741
}

742
743
744
745
746
747
748
749
750
751
752
753
754
/**
 * Transforms a binary operation whose constructor takes instruction mode,
 * operand mode and address directly.
 *
 * Either both operands are passed in registers (requirements reg_rax_reqs,
 * AMD64_OP_REG) or one operand is folded in as a Load (AMD64_OP_ADDR).
 * match_immediate must not be set in @p flags.
 *
 * @return the new node itself, not a Proj
 */
static ir_node *gen_binop_rax(ir_node *node, ir_node *op1, ir_node *op2,
                              construct_rax_binop_func make_node,
                              match_flags_t flags)
{
	assert(! (flags & match_immediate));

	/* the instruction size follows op1 as passed in, i.e. before a
	 * down-conversion is skipped below */
	ir_mode           *const mode = get_irn_mode(op1);
	amd64_insn_mode_t  const size = get_insn_mode_from_mode(mode);

	/* TODO: legalize phase */
	if ((flags & match_mode_neutral) != 0) {
		op1 = be_skip_downconv(op1, true);
		op2 = be_skip_downconv(op2, true);
	} else {
		/* TODO: extend inputs? */
		(void)needs_extension;
	}

	ir_node *const block = get_nodes_block(node);
	amd64_addr_t   addr;
	memset(&addr, 0, sizeof(addr));

	ir_node *load;
	ir_node *reg_op;
	bool const use_am
		= use_address_matching(mode, flags, block, op1, op2, &load, &reg_op);

	ir_node                    *in[4];
	int                         arity    = 0;
	ir_node                    *mem_proj = NULL;
	const arch_register_req_t **reqs;
	amd64_op_mode_t             op_mode;
	if (!use_am) {
		/* simply transform the arguments */
		ir_node *const new_op1 = be_transform_node(op1);
		in[arity++] = new_op1;
		ir_node *const new_op2 = be_transform_node(op2);
		in[arity++] = new_op2;

		op_mode = AMD64_OP_REG;
		reqs    = reg_rax_reqs;
	} else {
		ir_node *const new_op = be_transform_node(reg_op);
		in[arity++] = new_op;

		perform_address_matching(get_Load_ptr(load), &arity, in, &addr);

		/* NOTE(review): the generic gp table is used here, so no input
		 * is tied to rax in this path -- confirm this is intended. */
		reqs = gp_am_reqs[arity];

		ir_node *const new_mem = be_transform_node(get_Load_mem(load));
		addr.mem_input = arity;
		in[arity++]    = new_mem;

		mem_proj = get_Proj_for_pn(load, pn_Load_M);
		op_mode  = AMD64_OP_ADDR;
	}
	assert((size_t)arity <= ARRAY_SIZE(in));

	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
	ir_node  *const result    = make_node(dbgi, new_block, arity, in, reqs, size, op_mode, addr);

	/* a folded Load with a memory Proj is replaced by the new node */
	if (mem_proj != NULL)
		be_set_transformed_node(load, result);

	return result;
}

810
811
812
813
814
815
816
817
/**
 * Transforms a binary operation into an amd64 node working on xmm registers.
 *
 * use_address_matching() decides whether one operand can be taken directly
 * from memory. If so, the Load it reports supplies the address and memory
 * inputs and the remaining operand becomes the register input
 * (AMD64_OP_REG_ADDR). Otherwise both operands are transformed and passed
 * as registers (AMD64_OP_REG_REG).
 *
 * @param node       node being transformed (source of block and debug info)
 * @param op0        first operand; its mode is handed to address matching
 * @param op1        second operand
 * @param make_node  constructor used to create the amd64 node
 * @param flags      match flags forwarded to use_address_matching()
 * @return a Proj on the result of the newly created node
 */
static ir_node *gen_binop_xmm(ir_node *node, ir_node *op0, ir_node *op1,
                              construct_binop_func make_node,
                              match_flags_t flags)
{
	ir_node *block = get_nodes_block(node);
	ir_mode *mode  = get_irn_mode(op0);
	amd64_args_t args;
	memset(&args, 0, sizeof(args));
	args.attr.base.insn_mode = INSN_MODE_64;

	ir_node *load;
	ir_node *op;
	bool use_am = use_address_matching(mode, flags, block, op0, op1, &load,
	                                   &op);

	if (use_am) {
		/* register operand goes first and is remembered in the attribute */
		int reg_input = args.arity++;
		args.attr.u.reg_input = reg_input;
		args.in[reg_input]    = be_transform_node(op);

		/* address inputs are appended by perform_address_matching() */
		amd64_addr_t *addr = &args.attr.base.addr;
		ir_node      *ptr  = get_Load_ptr(load);
		perform_address_matching(ptr, &args.arity, args.in, addr);

		/* requirements are selected by the arity before the memory input
		 * is added */
		args.reqs = xmm_am_reqs[args.arity];

		ir_node *new_mem   = be_transform_node(get_Load_mem(load));
		int mem_input      = args.arity++;
		args.in[mem_input] = new_mem;
		addr->mem_input    = mem_input;

		args.mem_proj      = get_Proj_for_pn(load, pn_Load_M);
		args.attr.base.base.op_mode = AMD64_OP_REG_ADDR;
	} else {
		args.in[args.arity++] = be_transform_node(op0);
		args.in[args.arity++] = be_transform_node(op1);
		args.attr.base.base.op_mode = AMD64_OP_REG_REG;
		args.reqs = amd64_xmm_xmm_reqs;
	}

	dbg_info *const dbgi      = get_irn_dbg_info(node);
	ir_node  *const new_block = be_transform_node(block);
	ir_node  *const new_node  = make_node(dbgi, new_block, args.arity, args.in, args.reqs, &args.attr);

	fix_node_mem_proj(new_node, args.mem_proj);

	arch_set_irn_register_req_out(new_node, 0,
	                              &amd64_requirement_xmm_same_0);
	/* NOTE(review): the result Proj always uses pn_amd64_subs_res, whatever
	 * make_node constructs; presumably every xmm binop shares this result
	 * number -- confirm against the node specification. */
	return be_new_Proj(new_node, pn_amd64_subs_res);
}

861
/**
 * Constructor signature for amd64 shift nodes: takes debug info, the block,
 * the inputs with their register requirements and the initial shift
 * attribute, and returns the new node.
 */
typedef ir_node *(*construct_shift_func)(dbg_info *dbgi, ir_node *block, int arity, ir_node *const *in, arch_register_req_t const **in_reqs, amd64_shift_attr_t const *attr_init);
Matthias Braun's avatar
Matthias Braun committed
862
863

static ir_node *gen_shift_binop(ir_node *node, ir_node *op1, ir_node *op2,
864
865
                                construct_shift_func func, unsigned pn_res,
                                match_flags_t flags)
Matthias Braun's avatar
Matthias Braun committed
866
867
868
869
870
871
872
873
874
875
{
	ir_mode *mode = get_irn_mode(node);
	assert(!mode_is_float(mode));

	if (get_mode_modulo_shift(mode) != 32 && get_mode_size_bits(mode) != 64)
		panic("insupported modulo shift used");

	ir_node *in[3];
	int      arity = 0;
	if (flags & match_mode_neutral) {
876
		op1 = be_skip_downconv(op1, true);
Matthias Braun's avatar
Matthias Braun committed
877
		in[arity++] = be_transform_node(op1);
Matthias Braun's avatar
Matthias Braun committed
878
		mode = get_mode_size_bits(mode) > 32 ? mode_gp : mode_Iu;
Matthias Braun's avatar
Matthias Braun committed
879
	} else {
880
		op1 = be_skip_sameconv(op1);
881
882
883

		/* Use 8/16bit operations instead of doing zext/upconv */
		in[arity++] = be_transform_node(op1);
Matthias Braun's avatar
Matthias Braun committed
884
885
886
887
888
889
	}

	/* we can skip any convs for the shift count, as it only uses the lowest
	 * 5/6 bits anyway */
	while (is_Conv(op2) && get_irn_n_edges(op2) == 1) {
		ir_node *const op = get_Conv_op(op2);
890
		if (get_mode_arithmetic(get_irn_mode(op)) != irma_twos_complement)
Matthias Braun's avatar
Matthias Braun committed
891
892
893
894
			break;
		op2 = op;
	}

Matthias Braun's avatar
Matthias Braun committed
895
896
	amd64_shift_attr_t attr;
	memset(&attr, 0, sizeof(attr));
Matthias Braun's avatar
Matthias Braun committed
897
898
899
	const arch_register_req_t **reqs;
	const arch_register_req_t  *out_req0;
	if (is_Const(op2)) {
Matthias Braun's avatar
Matthias Braun committed
900
901
902
		attr.base.op_mode = AMD64_OP_SHIFT_IMM;
		reqs              = reg_reqs;
		out_req0          = &amd64_requirement_gp_same_0;
903
		attr.immediate    = get_Const_long(op2);
Matthias Braun's avatar
Matthias Braun committed
904
	} else {
Matthias Braun's avatar
Matthias Braun committed
905
906
907
908
		attr.base.op_mode = AMD64_OP_SHIFT_REG;
		in[arity++]       = be_transform_node(op2);
		reqs              = reg_rcx_reqs;
		out_req0          = &amd64_requirement_gp_same_0_not_1;
Matthias Braun's avatar
Matthias Braun committed
909
	}
Matthias Braun's avatar
Matthias Braun committed
910
	attr.insn_mode = get_insn_mode_from_mode(mode);
Matthias Braun's avatar
Matthias Braun committed
911

Matthias Braun's avatar
Matthias Braun committed
912
	dbg_info *const dbgi      = get_irn_dbg_info(node);
913
	ir_node  *const new_block = be_transform_nodes_block(node);
914
	ir_node  *const new_node  = func(dbgi, new_block, arity, in, reqs, &attr);
Matthias Braun's avatar
Matthias Braun committed
915
	arch_set_irn_register_req_out(new_node, 0, out_req0);
916
	return be_new_Proj(new_node, pn_res);
917
918
}

919
/**
 * Creates an amd64 lea node that computes op1 + op2.
 *
 * If @p op2 is accepted by match_immediate_32() it is stored as the
 * immediate of the address and only @p op1 is passed as an input.
 * Otherwise both operands are transformed and used as base (input 0) and
 * index (input 1) of the address.
 *
 * @param node  the node being transformed (provides mode, block, dbg info)
 * @param op1   first summand
 * @param op2   second summand, tried as a 32 bit immediate first
 * @return the new lea node
 */
static ir_node *create_lea_as_add(ir_node *node, ir_node *op1, ir_node *op2)
{
	dbg_info *const dbgi = get_irn_dbg_info(node);
	ir_node  *new_block  = be_transform_nodes_block(node);
	ir_mode *mode        = get_irn_mode(node);

	/* modes of up to 32 bits use the 32 bit instruction, others 64 bit */
	amd64_insn_mode_t insn_mode;
	if (get_mode_size_bits(mode) <= 32)
		insn_mode = INSN_MODE_32;
	else
		insn_mode = INSN_MODE_64;

	const arch_register_req_t **reqs;
	amd64_addr_t addr;
	memset(&addr, 0, sizeof(addr));

	ir_node *in[2];
	int arity = 0;

	/* immediate matching runs before any operand is transformed */
	bool const is_imm = match_immediate_32(&addr.immediate, op2, false, true);

	/* op1 is the first input in either case (base_input stays 0) */
	in[arity++] = be_transform_node(op1);
	if (is_imm) {
		reqs             = reg_reqs;
		addr.index_input = NO_INPUT;
	} else {
		in[arity++]      = be_transform_node(op2);
		addr.base_input  = 0;
		addr.index_input = 1;
		reqs             = amd64_reg_reg_reqs;
	}

	return new_bd_amd64_lea(dbgi, new_block, arity, in, reqs, insn_mode, addr);
}

Matthias Braun's avatar
Matthias Braun committed
953
954
/**
 * Transforms an Add node.
 *
 * Float additions are handed to gen_binop_am() with the adds constructor.
 * For all other modes use_address_matching() is consulted: if it succeeds
 * an amd64 add is built through gen_binop_am(), otherwise the addition is
 * expressed as a lea via create_lea_as_add().
 *
 * @param node  the Add node to transform
 * @return the node replacing @p node in the transformed graph
 */
static ir_node *gen_Add(ir_node *const node)
{
	match_flags_t flags = match_immediate | match_am | match_mode_neutral
	                      | match_commutative;

	ir_node *op1 = get_Add_left(node);
	ir_node *op2 = get_Add_right(node);

	ir_mode *mode  = get_irn_mode(node);
	ir_node *block = get_nodes_block(node);
	ir_node *load, *op;

	if (mode_is_float(mode)) {
		return gen_binop_am(node, op1, op2, new_bd_amd64_adds,
		                    pn_amd64_adds_res, match_commutative | match_am);
	}

	/* load and op are only needed as out-parameters here; the decision
	 * itself selects between add and lea */
	bool use_am = use_address_matching(mode, flags, block, op1, op2, &load, &op);

	ir_node *res;
	if (use_am) {
		res = gen_binop_am(node, op1, op2, new_bd_amd64_add, pn_amd64_add_res,
		                   flags);
	} else {
		res = create_lea_as_add(node, op1, op2);
	}

	x86_mark_non_am(node);
	return res;
}
982

Matthias Braun's avatar
Matthias Braun committed
983
static ir_node *gen_Sub(ir_node *const node)
984
{
Matthias Braun's avatar
Matthias Braun committed
985
986
	ir_node  *const op1     = get_Sub_left(node);
	ir_node  *const op2     = get_Sub_right(node);
987
	ir_mode  *const mode    = get_irn_mode(node);
988
989

	if (mode_is_float(mode)) {
990
991
		return gen_binop_am(node, op1, op2, new_bd_amd64_subs,
		                    pn_amd64_subs_res, match_am);
992
	} else {