ia32_emitter.c 81.9 KB
Newer Older
Christian Würdig's avatar
Christian Würdig committed
1
2
/*
 * This file is part of libFirm.
3
 * Copyright (C) 2012 University of Karlsruhe.
Christian Würdig's avatar
Christian Würdig committed
4
5
 */

6
/**
7
 * @file
Christian Würdig's avatar
Christian Würdig committed
8
9
 * @brief       This file implements the ia32 node emitter.
 * @author      Christian Wuerdig, Matthias Braun
10
11
 *
 * Summary table for x86 floating-point compares:
12
13
 * (remember effect of unordered on x86: ZF=1, PF=1, CF=1)
 *
14
15
16
17
18
 *   pnc_Eq  => !P && E
 *   pnc_Lt  => !P && B
 *   pnc_Le  => !P && BE
 *   pnc_Gt  => A
 *   pnc_Ge  => AE
19
 *   pnc_Lg  => NE
20
21
22
23
24
25
26
 *   pnc_Leg => NP  (ordered)
 *   pnc_Uo  => P
 *   pnc_Ue  => E
 *   pnc_Ul  => B
 *   pnc_Ule => BE
 *   pnc_Ug  => P || A
 *   pnc_Uge => P || AE
27
 *   pnc_Ne  => P || NE
28
 */
Christian Würdig's avatar
Christian Würdig committed
29
#include <limits.h>
30
#include <inttypes.h>
Christian Würdig's avatar
Christian Würdig committed
31

32
#include "beblocksched.h"
Matthias Braun's avatar
Matthias Braun committed
33
#include "util.h"
34
#include "xmalloc.h"
35
36
#include "tv.h"
#include "iredges.h"
Christian Würdig's avatar
Christian Würdig committed
37
38
39
40
#include "debug.h"
#include "irgwalk.h"
#include "irprintf.h"
#include "irop_t.h"
Christian Würdig's avatar
Christian Würdig committed
41
#include "irargs_t.h"
42
#include "irprog_t.h"
43
#include "iredges_t.h"
44
#include "irtools.h"
45
#include "execfreq.h"
Matthias Braun's avatar
Matthias Braun committed
46
#include "panic.h"
47
#include "dbginfo.h"
48
#include "lc_opts.h"
49
#include "ircons.h"
Christian Würdig's avatar
Christian Würdig committed
50

51
52
#include "besched.h"
#include "benode.h"
53
#include "bedwarf.h"
54
55
#include "beemitter.h"
#include "begnuas.h"
56
#include "bestack.h"
57
#include "beutil.h"
Christian Würdig's avatar
Christian Würdig committed
58

59
#include "ia32_emitter.h"
Christian Würdig's avatar
Christian Würdig committed
60
#include "gen_ia32_emitter.h"
Christian Würdig's avatar
Christian Würdig committed
61
#include "gen_ia32_regalloc_if.h"
62
63
#include "ia32_nodes_attr.h"
#include "ia32_new_nodes.h"
64
#include "ia32_architecture.h"
Christian Würdig's avatar
Christian Würdig committed
65
#include "bearch_ia32_t.h"
Christian Würdig's avatar
Christian Würdig committed
66

67
68
DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

/* Label that ia32_emit_entity() subtracts from entity references when
 * position independent code is emitted. */
static char pic_base_label[128];
/* NOTE(review): the following state is not referenced in the visible part of
 * this file; the names suggest exception label numbering and spill/reload
 * marking -- confirm against the users further down. */
static ir_label_t exc_label_id;
static bool mark_spill_reload;

/* NOTE(review): presumably stack frame bookkeeping for the function being
 * emitted; not used in the visible part of this file -- confirm. */
static bool sp_relative;
static int frame_type_size;
static int callframe_offset;
76

77
78
79
/** Return the next block in Block schedule */
static ir_node *get_prev_block_sched(const ir_node *block)
{
80
	return (ir_node*)get_irn_link(block);
81
82
}

83
/** Checks if the current block is a fall-through target. */
84
static bool is_fallthrough(const ir_node *cfgpred)
85
{
Christoph Mallon's avatar
Christoph Mallon committed
86
	if (!is_Proj(cfgpred))
87
88
		return true;
	ir_node *pred = get_Proj_pred(cfgpred);
Christoph Mallon's avatar
Christoph Mallon committed
89
	if (is_ia32_SwitchJmp(pred))
90
91
		return false;
	return true;
92
93
}

94
95
96
97
/**
 * returns non-zero if the given block needs a label
 * because of being a jump-target (and not a fall-through)
 */
98
static bool block_needs_label(const ir_node *block)
99
{
100
	if (get_Block_entity(block) != NULL)
101
		return true;
102

103
104
	int  n_cfgpreds = get_Block_n_cfgpreds(block);
	bool need_label = true;
105
	if (n_cfgpreds == 0) {
106
		need_label = 0;
107
	} else if (n_cfgpreds == 1) {
Christoph Mallon's avatar
Christoph Mallon committed
108
109
		ir_node *cfgpred       = get_Block_cfgpred(block, 0);
		ir_node *cfgpred_block = get_nodes_block(cfgpred);
110
		if (get_prev_block_sched(block) == cfgpred_block
111
		    && is_fallthrough(cfgpred)) {
112
			need_label = 0;
113
114
115
116
117
118
		}
	}

	return need_label;
}

Michael Beck's avatar
Michael Beck committed
119
/**
 * Builds a label name consisting of the assembler's private prefix,
 * @p prefix and a running number.  The number is incremented on every call,
 * so it is not handed out a second time.
 *
 * @param buf     buffer receiving the label
 * @param buflen  size of @p buf in bytes
 * @param prefix  text placed between the private prefix and the number
 * @return @p buf
 */
static char *get_unique_label(char *buf, size_t buflen, const char *prefix)
{
	static unsigned long last_id = 0;

	last_id += 1;
	snprintf(buf, buflen, "%s%s%lu", be_gas_get_private_prefix(), prefix, last_id);
	return buf;
}

129
static const char *get_register_name_8bit_low(const arch_register_t *reg)
130
{
131
132
133
134
135
136
137
	switch (reg->global_index) {
	case REG_EAX: return "al";
	case REG_EBX: return "bl";
	case REG_ECX: return "cl";
	case REG_EDX: return "dl";
	}
	panic("unexpected register");
138
139
}

140
static const char *get_register_name_8bit_high(const arch_register_t *reg)
Michael Beck's avatar
Michael Beck committed
141
{
142
143
144
145
146
147
148
149
	switch (reg->global_index) {
	case REG_EAX: return "ah";
	case REG_EBX: return "bh";
	case REG_ECX: return "ch";
	case REG_EDX: return "dh";
	}
	panic("unexpected register");
}
Michael Beck's avatar
Michael Beck committed
150

151
152
153
154
155
156
157
158
159
160
161
162
163
/**
 * Returns the name of the 16-bit part of @p reg.
 * Panics for registers that are not one of the eight handled below.
 */
static const char *get_register_name_16bit(const arch_register_t *reg)
{
	const char *name = NULL;

	switch (reg->global_index) {
	case REG_EAX: name = "ax"; break;
	case REG_EBX: name = "bx"; break;
	case REG_ECX: name = "cx"; break;
	case REG_EDX: name = "dx"; break;
	case REG_ESI: name = "si"; break;
	case REG_EDI: name = "di"; break;
	case REG_ESP: name = "sp"; break;
	case REG_EBP: name = "bp"; break;
	default:                   break;
	}
	if (name == NULL)
		panic("unexpected register");
	return name;
}

166
167
/**
 * Returns the register name matching the size of @p mode: the low 8-bit name
 * for 8-bit modes, the 16-bit name for 16-bit modes and the full register
 * name otherwise (also when @p mode is NULL).
 */
static const char *get_register_name_mode(const arch_register_t *reg,
                                          ir_mode *mode)
{
	if (mode != NULL) {
		switch (get_mode_size_bits(mode)) {
		case 8:  return get_register_name_8bit_low(reg);
		case 16: return get_register_name_16bit(reg);
		default: break;
		}
	}
	return reg->name;
}

180
181
182
183
184
/**
 * emit a register, possible shortened by a mode
 * @param reg   the register
 * @param mode  the mode of the register or NULL for full register
 */
185
static void emit_register(const arch_register_t *reg, ir_mode *mode)
186
{
187
	const char *name = get_register_name_mode(reg, mode);
188
	be_emit_char('%');
189
	be_emit_string(name);
Christian Würdig's avatar
Christian Würdig committed
190
191
}

192
193
/**
 * Emits a reference to @p entity.
 *
 * TLS entities get an "@NTPOFF" suffix when they have a definition and
 * "@INDNTPOFF" otherwise.  When PIC is enabled, "-<pic base label>" is
 * appended unless @p no_pic_adjust is set or the entity has the code type.
 */
static void ia32_emit_entity(ir_entity *entity, int no_pic_adjust)
{
	be_gas_emit_entity(entity);

	if (is_tls_entity(entity)) {
		if (entity_has_definition(entity)) {
			be_emit_cstring("@NTPOFF");
		} else {
			be_emit_cstring("@INDNTPOFF");
		}
	}

	/* everything below only concerns the PIC base adjustment */
	if (!be_options.pic || no_pic_adjust)
		return;
	if (get_entity_type(entity) == get_code_type())
		return;

	be_emit_char('-');
	be_emit_string(pic_base_label);
}

static void emit_ia32_Immediate_no_prefix(const ir_node *node)
{
	const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(node);

214
215
216
	ir_entity *const entity = attr->entity;
	if (entity != NULL) {
		ia32_emit_entity(entity, attr->no_pic_adjust);
217
		if (attr->offset != 0) {
218
			be_emit_irprintf("%+"PRId32, attr->offset);
219
		}
220
	} else {
221
		be_emit_irprintf("0x%"PRIX32, (uint32_t)attr->offset);
222
223
224
225
226
227
228
229
	}
}

/**
 * Emits an ia32 Immediate node as operand: a '$' followed by the value as
 * printed by emit_ia32_Immediate_no_prefix().
 */
static void emit_ia32_Immediate(const ir_node *node)
{
	be_emit_char('$');
	emit_ia32_Immediate_no_prefix(node);
}
230

Matthias Braun's avatar
Matthias Braun committed
231
/**
 * Emits the instruction size suffix for an integer or reference mode:
 * 'b' (8 bit), 'w' (16 bit), 'l' (32 bit) or "ll" (64 bit).
 * Panics for any other size.
 */
static void ia32_emit_mode_suffix_mode(const ir_mode *mode)
{
	assert(mode_is_int(mode) || mode_is_reference(mode));

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 8) {
		be_emit_char('b');
	} else if (bits == 16) {
		be_emit_char('w');
	} else if (bits == 32) {
		be_emit_char('l');
	} else if (bits == 64) {
		/* the gas documentation names q as suffix, but gcc, objdump and icc
		 * apparently use ll */
		be_emit_cstring("ll");
	} else {
		panic("cannot output mode_suffix for %+F", mode);
	}
}

245
/**
 * Emits the operand size suffix of an x87 instruction with a memory operand.
 * Nothing is emitted for nodes of op type ia32_Normal.  The suffix is derived
 * from the load/store mode of @p node; unsupported sizes cause a panic.
 */
static void ia32_emit_x87_mode_suffix(ir_node const *const node)
{
	/* the suffix is only needed when address mode is used */
	if (get_ia32_op_type(node) == ia32_Normal)
		return;

	ir_mode *const ls_mode = get_ia32_ls_mode(node);
	assert(ls_mode != NULL);

	if (!mode_is_float(ls_mode)) {
		assert(mode_is_int(ls_mode) || mode_is_reference(ls_mode));
		switch (get_mode_size_bits(ls_mode)) {
		case 16: be_emit_char('s');     return;
		case 32: be_emit_char('l');     return;
		/* the gas documentation names q as suffix, but gcc, objdump and icc
		 * apparently use ll */
		case 64: be_emit_cstring("ll"); return;
		default: break;
		}
	} else {
		switch (get_mode_size_bits(ls_mode)) {
		case  32: be_emit_char('s'); return;
		case  64: be_emit_char('l'); return;
		/* the size of long double differs between platforms because of
		 * alignment */
		case  80:
		case  96:
		case 128: be_emit_char('t'); return;
		default:  break;
		}
	}
	panic("cannot output mode_suffix for %+F", ls_mode);
}

277
/**
 * Returns the SSE suffix character for a float mode: 's' for 32 bit and
 * 'd' for 64 bit.  Panics for any other size.
 */
static char get_xmm_mode_suffix(ir_mode *mode)
{
	assert(mode_is_float(mode));

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 32)
		return 's';
	if (bits == 64)
		return 'd';
	panic("invalid XMM mode");
}

287
/**
 * Emits the SSE suffix character matching the load/store mode of @p node.
 */
static void ia32_emit_xmm_mode_suffix(ir_node const *const node)
{
	ir_mode *const ls_mode = get_ia32_ls_mode(node);
	assert(ls_mode != NULL);

	char const suffix = get_xmm_mode_suffix(ls_mode);
	be_emit_char(suffix);
}

Christian Würdig's avatar
Christian Würdig committed
294
/**
295
 * Returns the target block for a control flow node.
Christian Würdig's avatar
Christian Würdig committed
296
 */
297
static ir_node *get_cfop_target_block(const ir_node *irn)
Christoph Mallon's avatar
Christoph Mallon committed
298
{
299
	assert(get_irn_mode(irn) == mode_X);
300
	return (ir_node*)get_irn_link(irn);
301
}
Christian Würdig's avatar
Christian Würdig committed
302

303
304
305
306
307
308
/**
 * Emits the name of the block that the control flow node @p node jumps to.
 */
static void ia32_emit_cfop_target(const ir_node *node)
{
	be_gas_emit_block_name(get_cfop_target_block(node));
}

312
/**
 * Emits the mnemonic suffix of condition code @p cc (e.g. "ae", "ne", "np").
 * The float condition codes share the suffix of their unsigned integer
 * counterpart.  Values without a suffix of their own cause a panic.
 */
void x86_emit_condition_code(x86_condition_code_t cc)
{
	switch (cc) {
	/* equality */
	case x86_cc_float_equal:
	case x86_cc_equal:
		be_emit_cstring("e");
		return;
	case x86_cc_float_not_equal:
	case x86_cc_not_equal:
		be_emit_cstring("ne");
		return;

	/* unsigned and float orderings */
	case x86_cc_float_below:
	case x86_cc_float_unordered_below:
	case x86_cc_below:
		be_emit_cstring("b");
		return;
	case x86_cc_float_below_equal:
	case x86_cc_float_unordered_below_equal:
	case x86_cc_below_equal:
		be_emit_cstring("be");
		return;
	case x86_cc_float_above:
	case x86_cc_float_unordered_above:
	case x86_cc_above:
		be_emit_cstring("a");
		return;
	case x86_cc_float_above_equal:
	case x86_cc_float_unordered_above_equal:
	case x86_cc_above_equal:
		be_emit_cstring("ae");
		return;

	/* signed orderings */
	case x86_cc_less:
		be_emit_cstring("l");
		return;
	case x86_cc_less_equal:
		be_emit_cstring("le");
		return;
	case x86_cc_greater:
		be_emit_cstring("g");
		return;
	case x86_cc_greater_equal:
		be_emit_cstring("ge");
		return;

	/* single flag tests */
	case x86_cc_overflow:
		be_emit_cstring("o");
		return;
	case x86_cc_not_overflow:
		be_emit_cstring("no");
		return;
	case x86_cc_sign:
		be_emit_cstring("s");
		return;
	case x86_cc_not_sign:
		be_emit_cstring("ns");
		return;
	case x86_cc_parity:
		be_emit_cstring("p");
		return;
	case x86_cc_not_parity:
		be_emit_cstring("np");
		return;

	/* these have no suffix of their own */
	case x86_cc_float_parity_cases:
	case x86_cc_additional_float_cases:
		break;
	}
	panic("invalid ia32 condition code");
}

348
typedef enum ia32_emit_mod_t {
349
	EMIT_NONE         = 0,
350
	EMIT_RESPECT_LS   = 1U << 0,
351
	EMIT_ALTERNATE_AM = 1U << 1,
352
353
	EMIT_LONG         = 1U << 2,
	EMIT_HIGH_REG     = 1U << 3,
354
	EMIT_LOW_REG      = 1U << 4,
355
356
	EMIT_16BIT_REG    = 1U << 5,
	EMIT_SHIFT_COMMA  = 1U << 6,
357
} ia32_emit_mod_t;
358
ENUM_BITSET(ia32_emit_mod_t)
359

360
361
362
363
364
365
/**
 * Returns input @p pos of @p node, or NULL if that input is the GP NoReg
 * node.
 */
static ir_node const *get_irn_n_reg(ir_node const *const node, int const pos)
{
	ir_node *const operand = get_irn_n(node, pos);
	if (is_ia32_NoReg_GP(operand))
		return NULL;
	return operand;
}

366
367
368
/**
 * Emits address mode.
 */
369
static void ia32_emit_am(ir_node const *const node)
370
371
{
	/* just to be sure... */
372
	assert(get_ia32_frame_use(node) == IA32_FRAME_USE_NONE || get_ia32_frame_ent(node));
373

374
375
376
	if (get_ia32_am_tls_segment(node))
		be_emit_cstring("%gs:");

377
378
379
	ir_node const *const base = get_irn_n_reg(node, n_ia32_base);
	ir_node const *const idx  = get_irn_n_reg(node, n_ia32_index);

380
	/* emit offset */
381
382
383
	int32_t    const offs = get_ia32_am_offs_int(node);
	ir_entity *const ent  = get_ia32_am_ent(node);
	if (ent) {
384
		const ia32_attr_t *attr = get_ia32_attr_const(node);
385
		ia32_emit_entity(ent, attr->am_sc_no_pic_adjust);
386
		if (offs != 0)
387
			be_emit_irprintf("%+"PRId32, offs);
388
389
390
	} else if (offs != 0 || (!base && !idx)) {
		/* also handle special case if nothing is set */
		be_emit_irprintf("%"PRId32, offs);
391
392
	}

393
	if (base || idx) {
394
395
396
		be_emit_char('(');

		/* emit base */
397
		if (base) {
398
			arch_register_t const *const reg = arch_get_irn_register(base);
399
400
401
402
			emit_register(reg, NULL);
		}

		/* emit index + scale */
403
		if (idx) {
404
			be_emit_char(',');
405
			arch_register_t const *const reg = arch_get_irn_register(idx);
406
407
			emit_register(reg, NULL);

408
			int const scale = get_ia32_am_scale(node);
409
			if (scale > 0)
410
411
412
413
414
415
				be_emit_irprintf(",%d", 1 << scale);
		}
		be_emit_char(')');
	}
}

416
/* Forward declaration: ia32_emitf() calls this for its %P<digit> conversion. */
static x86_condition_code_t determine_final_cc(ir_node const *node, int flags_pos);
417
418

/**
 * Emits one or more assembler lines for @p node, driven by a printf-like
 * format string.  Every line starts with a tab; a '\n' in the format ends the
 * current line and starts a new one.
 *
 * Conversions (each introduced by '%', optionally followed by modifiers):
 *   %%    a literal '%'
 *   %AF   x87 operands: "%st, %reg" or "%reg, %st" for op type ia32_Normal,
 *         the address mode otherwise
 *   %AM   the address mode of the node
 *   %AR   register taken from the arguments (const arch_register_t*) for op
 *         type ia32_Normal, the address mode otherwise
 *   %ASn  like %Sn for op type ia32_Normal, the address mode otherwise
 *   %B    operands of a binary operation: the right operand (immediate,
 *         register or address mode), ", " and the left operand
 *   %Dn   register of output n
 *   %FM   x87 mode suffix
 *   %FP   'p' if the pop flag of the x87 attribute is set
 *   %FR   'r' if the inputs of the x87 node are permuted
 *   %FX   SSE mode suffix
 *   %F0   register of the x87 attribute
 *   %I    the node itself as immediate
 *   %L    label of the control flow target
 *   %M    mode suffix of the load/store mode (32 bit GP mode if unset)
 *   %PX   condition code taken from the arguments (int)
 *   %Pn   condition code derived from the flags at input n
 *   %R    register taken from the arguments (const arch_register_t*)
 *   %Sn   input n, either an immediate or its register
 *   %s    string argument (const char*)
 *   %u    unsigned argument
 *   %d    int argument
 *
 * Modifiers:
 *   *   address mode/register is prefixed with '*', immediate loses its '$'
 *   #   %M: nothing for 32 bit, else 's'/'z' (signed/unsigned) before the
 *       suffix; registers are named according to the load/store mode
 *   l   %u/%d take an (unsigned) long argument
 *   >   use the high 8-bit register name
 *   <   use the low 8-bit register name
 *   ^   use the 16-bit register name
 *   ,   append a ','; an immediate with value 1 and no entity is omitted
 *       entirely
 *
 * An unknown conversion causes a panic.
 */
void ia32_emitf(ir_node const *const node, char const *fmt, ...)
{
	va_list ap;
	va_start(ap, fmt);

	be_emit_char('\t');
	for (;;) {
		const char      *start = fmt;
		ia32_emit_mod_t  mod   = EMIT_NONE;

		/* copy literal text up to the next conversion or line end */
		while (*fmt != '%' && *fmt != '\n' && *fmt != '\0')
			++fmt;
		if (fmt != start) {
			be_emit_string_len(start, fmt - start);
		}

		if (*fmt == '\n') {
			be_emit_char('\n');
			be_emit_write_line();
			be_emit_char('\t');
			++fmt;
			if (*fmt == '\0')
				break;
			continue;
		}

		if (*fmt == '\0')
			break;

		/* skip the '%' and collect the modifiers */
		++fmt;
		for (;;) {
			switch (*fmt) {
			case '*': mod |= EMIT_ALTERNATE_AM; break;
			case '#': mod |= EMIT_RESPECT_LS;   break;
			case 'l': mod |= EMIT_LONG;         break;
			case '>': mod |= EMIT_HIGH_REG;     break;
			case '<': mod |= EMIT_LOW_REG;      break;
			case '^': mod |= EMIT_16BIT_REG;    break;
			case ',': mod |= EMIT_SHIFT_COMMA;  break;
			default:
				goto end_of_mods;
			}
			++fmt;
		}
end_of_mods:

		switch (*fmt++) {
			arch_register_t const *reg;
			ir_node         const *imm;

			case '%':
				be_emit_char('%');
				break;

			case 'A': {
				switch (*fmt++) {
					case 'F':
						if (get_ia32_op_type(node) == ia32_Normal) {
							ia32_x87_attr_t const *const attr    = get_ia32_x87_attr_const(node);
							/* named differently from the parameter to avoid shadowing it */
							char            const *const x87_fmt = attr->res_in_reg ? "%%st, %%%s" : "%%%s, %%st";
							be_emit_irprintf(x87_fmt, attr->reg->name);
							break;
						} else {
							goto emit_AM;
						}

emit_AM:
					case 'M':
						if (mod & EMIT_ALTERNATE_AM)
							be_emit_char('*');
						ia32_emit_am(node);
						break;

					case 'R':
						/* the argument is consumed even if the address mode is emitted */
						reg = va_arg(ap, const arch_register_t*);
						if (get_ia32_op_type(node) == ia32_Normal) {
							goto emit_R;
						} else {
							goto emit_AM;
						}

					case 'S':
						if (get_ia32_op_type(node) == ia32_Normal) {
							goto emit_S;
						} else {
							/* skip the input position, but never step over anything
							 * else (in particular not over the terminating NUL) */
							if (*fmt < '0' || '9' < *fmt)
								goto unknown;
							++fmt;
							goto emit_AM;
						}

					default: goto unknown;
				}
				break;
			}

			case 'B': {
				ir_node const *const src = get_irn_n(node, n_ia32_binary_right);
				if (is_ia32_Immediate(src)) {
					emit_ia32_Immediate(src);
					be_emit_cstring(", ");
					if (get_ia32_op_type(node) == ia32_Normal) {
						goto destination_operand;
					} else {
						ia32_emit_am(node);
					}
				} else {
					if (get_ia32_op_type(node) == ia32_Normal) {
						reg = arch_get_irn_register(src);
						emit_register(reg, get_ia32_ls_mode(node));
					} else {
						ia32_emit_am(node);
					}
					be_emit_cstring(", ");
destination_operand:
					reg = arch_get_irn_register_in(node, n_ia32_binary_left);
					emit_register(reg, get_ia32_ls_mode(node));
				}
				break;
			}

			case 'D':
				if (*fmt < '0' || '9' < *fmt)
					goto unknown;
				reg = arch_get_irn_register_out(node, *fmt++ - '0');
				goto emit_R;

			case 'F':
				if (*fmt == 'M') {
					ia32_emit_x87_mode_suffix(node);
				} else if (*fmt == 'P') {
					ia32_x87_attr_t const *const attr = get_ia32_x87_attr_const(node);
					if (attr->pop)
						be_emit_char('p');
				} else if (*fmt == 'R') {
					/* NOTE: Work around a gas quirk for non-commutative operations if the
					 * destination register is not %st0.  In this case r/non-r is swapped.
					 * %st0 = %st0 - %st1 -> fsub  %st1, %st0 (as expected)
					 * %st0 = %st1 - %st0 -> fsubr %st1, %st0 (as expected)
					 * %st1 = %st0 - %st1 -> fsub  %st0, %st1 (expected: fsubr)
					 * %st1 = %st1 - %st0 -> fsubr %st0, %st1 (expected: fsub)
					 * In fact this corresponds to the encoding of the instruction:
					 * - The r suffix selects whether %st0 is on the left (no r) or on the
					 *   right (r) side of the executed operation.
					 * - The placement of %st0 selects whether the result is written to
					 *   %st0 (right) or the other register (left).
					 * This means that it is sufficient to test whether the operands are
					 * permuted.  In particular it is not necessary to consider whether the
					 * result is to be placed into the explicit register operand. */
					if (get_ia32_x87_attr_const(node)->attr.ins_permuted)
						be_emit_char('r');
				} else if (*fmt == 'X') {
					ia32_emit_xmm_mode_suffix(node);
				} else if (*fmt == '0') {
					be_emit_char('%');
					be_emit_string(get_ia32_x87_attr_const(node)->reg->name);
				} else {
					goto unknown;
				}
				++fmt;
				break;

			case 'I':
				imm = node;
emit_I:
				if (mod & EMIT_SHIFT_COMMA) {
					const ia32_immediate_attr_t *attr
						= get_ia32_immediate_attr_const(imm);
					/* a constant 1 is left out completely in this mode */
					if (attr->entity == NULL && attr->offset == 1)
						break;
				}
				if (!(mod & EMIT_ALTERNATE_AM))
					be_emit_char('$');
				emit_ia32_Immediate_no_prefix(imm);
				if (mod & EMIT_SHIFT_COMMA) {
					be_emit_char(',');
				}
				break;

			case 'L':
				ia32_emit_cfop_target(node);
				break;

			case 'M': {
				ir_mode *mode = get_ia32_ls_mode(node);
				if (!mode)
					mode = ia32_mode_gp;
				if (mod & EMIT_RESPECT_LS) {
					if (get_mode_size_bits(mode) == 32)
						break;
					be_emit_char(mode_is_signed(mode) ? 's' : 'z');
				}
				ia32_emit_mode_suffix_mode(mode);
				break;
			}

			case 'P': {
				x86_condition_code_t cc;
				if (*fmt == 'X') {
					++fmt;
					cc = (x86_condition_code_t)va_arg(ap, int);
				} else if ('0' <= *fmt && *fmt <= '9') {
					cc = determine_final_cc(node, *fmt - '0');
					++fmt;
				} else {
					goto unknown;
				}
				x86_emit_condition_code(cc);
				break;
			}

			case 'R':
				reg = va_arg(ap, const arch_register_t*);
emit_R:
				if (mod & EMIT_ALTERNATE_AM)
					be_emit_char('*');
				const char *name;
				if (mod & EMIT_HIGH_REG) {
					name = get_register_name_8bit_high(reg);
				} else if (mod & EMIT_LOW_REG) {
					name = get_register_name_8bit_low(reg);
				} else if (mod & EMIT_16BIT_REG) {
					name = get_register_name_16bit(reg);
				} else {
					name = mod & EMIT_RESPECT_LS
						 ? get_register_name_mode(reg, get_ia32_ls_mode(node))
						 : reg->name;
				}
				be_emit_char('%');
				be_emit_string(name);
				if (mod & EMIT_SHIFT_COMMA) {
					be_emit_char(',');
				}
				break;

emit_S:
			case 'S': {
				if (*fmt < '0' || '9' < *fmt)
					goto unknown;

				unsigned pos = *fmt++ - '0';
				ir_node const *const src = get_irn_n(node, pos);
				if (is_ia32_Immediate(src)) {
					imm = src;
					goto emit_I;
				} else {
					reg = arch_get_irn_register(src);
					goto emit_R;
				}
			}

			case 's': {
				const char *str = va_arg(ap, const char*);
				be_emit_string(str);
				break;
			}

			case 'u':
				if (mod & EMIT_LONG) {
					unsigned long num = va_arg(ap, unsigned long);
					be_emit_irprintf("%lu", num);
				} else {
					unsigned num = va_arg(ap, unsigned);
					be_emit_irprintf("%u", num);
				}
				break;

			case 'd':
				if (mod & EMIT_LONG) {
					long num = va_arg(ap, long);
					be_emit_irprintf("%ld", num);
				} else {
					int num = va_arg(ap, int);
					be_emit_irprintf("%d", num);
				}
				break;

			default:
unknown:
				panic("unknown format conversion");
		}
	}

	be_emit_finish_line_gas(node);
	va_end(ap);
}

703
704
705
/**
 * walks up a tree of copies/perms/spills/reloads to find the original value
 * that is moved around
706
 */
707
708
static ir_node *find_original_value(ir_node *node)
{
709
710
711
712
713
714
715
716
717
718
719
	if (irn_visited(node))
		return NULL;

	mark_irn_visited(node);
	if (be_is_Copy(node)) {
		return find_original_value(be_get_Copy_op(node));
	} else if (be_is_CopyKeep(node)) {
		return find_original_value(be_get_CopyKeep_op(node));
	} else if (is_Proj(node)) {
		ir_node *pred = get_Proj_pred(node);
		if (be_is_Perm(pred)) {
720
			return find_original_value(get_irn_n(pred, get_Proj_num(node)));
721
		} else if (be_is_MemPerm(pred)) {
722
			return find_original_value(get_irn_n(pred, get_Proj_num(node)));
723
724
		} else if (is_ia32_Load(pred)) {
			return find_original_value(get_irn_n(pred, n_ia32_Load_mem));
Andreas Zwinkau's avatar
Andreas Zwinkau committed
725
726
		} else if (is_ia32_Store(pred)) {
			return find_original_value(get_irn_n(pred, n_ia32_Store_val));
727
728
729
		} else {
			return node;
		}
730
	} else if (is_Phi(node)) {
731
		foreach_irn_in(node, i, in) {
732
733
734
735
736
737
738
			ir_node *res = find_original_value(in);
			if (res != NULL)
				return res;
		}
		return NULL;
	} else {
		return node;
739
740
741
	}
}

742
/**
 * Computes the condition code that has to be emitted for @p node.
 *
 * Starting from the condition code stored in the node, the code is negated if
 * the inputs of the node itself are permuted and inverted if the inputs of
 * the flags producer are permuted.  A Test as flags producer is symmetric, so
 * its permutation is ignored.  For flags produced through Sahf the x87
 * compare behind it is looked up, walking through copies/spills if needed.
 *
 * @param node       node with condition code attribute
 * @param flags_pos  input position of the flags operand
 */
static x86_condition_code_t determine_final_cc(ir_node const *const node, int const flags_pos)
{
	ia32_condcode_attr_t const *const attr = get_ia32_condcode_attr_const(node);
	x86_condition_code_t              cc   = attr->condition_code;
	if (attr->attr.ins_permuted)
		cc = x86_negate_condition_code(cc);

	ir_node *flags = skip_Proj(get_irn_n(node, flags_pos));

	/* Permuted operands of a test instruction do not change the result. */
	if (is_ia32_Test(flags))
		return cc;

	if (is_ia32_Sahf(flags)) {
		flags = get_irn_n(flags, n_ia32_Sahf_val);
		if (!is_ia32_FucomFnstsw(flags) && !is_ia32_FucomppFnstsw(flags) && !is_ia32_FtstFnstsw(flags)) {
			ir_graph *const irg = get_irn_irg(node);
			inc_irg_visited(irg);
			flags = find_original_value(flags);
			/* the search yields NULL if it only runs into visited nodes;
			 * fail loudly instead of dereferencing NULL below */
			if (flags == NULL)
				panic("cannot find flags producer for %+F", node);
			assert(is_ia32_FucomFnstsw(flags) || is_ia32_FucomppFnstsw(flags) || is_ia32_FtstFnstsw(flags));
		}
	}

	ia32_attr_t const *const flags_attr = get_ia32_attr_const(flags);
	if (flags_attr->ins_permuted)
		cc = x86_invert_condition_code(cc);
	return cc;
}

771
772
773
774
775
776
/**
 * Emits the exception label of @p node: the instruction label prefix followed
 * by the exception label id of the node.
 */
static void ia32_emit_exc_label(const ir_node *node)
{
	const char *const prefix = be_gas_insn_label_prefix();

	be_emit_string(prefix);
	be_emit_irprintf("%lu", get_ia32_exc_label_id(node));
}

780
/**
 * Returns true if @p target is scheduled directly after @p block, i.e. if
 * control can reach @p target from @p block without a jump.
 */
static bool fallthrough_possible(const ir_node *block, const ir_node *target)
{
	const ir_node *const before_target = get_prev_block_sched(target);
	return before_target == block;
}

Christian Würdig's avatar
Christian Würdig committed
785
786
787
/**
 * Emits the jump sequence for a conditional jump (cmp + jmp_true + jmp_false)
 */
788
static void emit_ia32_Jcc(const ir_node *node)
789
{
790
	x86_condition_code_t cc = determine_final_cc(node, n_ia32_Jcc_eflags);
Christian Würdig's avatar
Christian Würdig committed
791

792
	/* get both Projs */
793
	ir_node const *proj_true   = get_Proj_for_pn(node, pn_ia32_Jcc_true);
794
	ir_node const *target_true = get_cfop_target_block(proj_true);
795
	ir_node const *proj_false  = get_Proj_for_pn(node, pn_ia32_Jcc_false);
796
797
	ir_node const *block       = get_nodes_block(node);
	if (fallthrough_possible(block, target_true)) {
798
		/* exchange both proj's so the second one can be omitted */
799
800
		const ir_node *t = proj_true;

801
802
		proj_true  = proj_false;
		proj_false = t;
803
		cc         = x86_negate_condition_code(cc);
804
	}
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
	const ir_node *target_false = get_cfop_target_block(proj_false);
	bool           fallthrough  = fallthrough_possible(block, target_false);
	/* if we can't have a fallthrough anyway, put the more likely case first */
	if (!fallthrough) {
		/* We would need execfreq for the concrete edge, but don't have it
		 * available here, so we use the block execfreq :-( */
		double freq_true  = get_block_execfreq(target_true);
		double freq_false = get_block_execfreq(target_false);
		if (freq_false > freq_true) {
			const ir_node *t = proj_true;
			proj_true  = proj_false;
			proj_false = t;
			cc         = x86_negate_condition_code(cc);
		}
	}
820

821
	bool need_parity_label = false;
822
	if (cc & x86_cc_float_parity_cases) {
823
824
		/* Some floating point comparisons require a test of the parity flag,
		 * which indicates that the result is unordered */
825
		if (cc & x86_cc_negated) {
826
			ia32_emitf(proj_true, "jp %L");
827
		} else {
828
829
			/* we need a local label if the false proj is a fallthrough
			 * as the falseblock might have no label emitted then */
830
831
			if (fallthrough) {
				need_parity_label = true;
832
				ia32_emitf(proj_false, "jp 1f");
833
			} else {
834
				ia32_emitf(proj_false, "jp %L");
835
			}
836
		}
837
	}
838
	ia32_emitf(proj_true, "j%PX %L", (int)cc);
Christoph Mallon's avatar
Christoph Mallon committed
839
	if (need_parity_label) {
840
841
		be_emit_cstring("1:\n");
		be_emit_write_line();
842
843
	}

844
	/* the second Proj might be a fallthrough */
845
	if (fallthrough) {
846
		if (be_options.verbose_asm)
847
			ia32_emitf(proj_false, "/* fallthrough to %L */");
848
	} else {
849
		ia32_emitf(proj_false, "jmp %L");
850
	}
Michael Beck's avatar
Michael Beck committed
851
852
}

853
854
855
856
857
858
/**
 * Emits an ia32 Setcc. This is mostly easy but some floating point compares
 * are tricky.
 */
static void emit_ia32_Setcc(const ir_node *node)
{
859
	const arch_register_t *dreg = arch_get_irn_register_out(node, pn_ia32_Setcc_res);
860

861
	x86_condition_code_t const cc = determine_final_cc(node, n_ia32_Setcc_eflags);
862
863
	if (cc & x86_cc_float_parity_cases) {
		if (cc & x86_cc_negated) {
864
865
866
			ia32_emitf(node, "set%PX %<R", (int)cc, dreg);
			ia32_emitf(node, "setp %>R", dreg);
			ia32_emitf(node, "orb %>R, %<R", dreg, dreg);
867
		} else {
868
869
870
			ia32_emitf(node, "set%PX %<R", (int)cc, dreg);
			ia32_emitf(node, "setnp %>R", dreg);
			ia32_emitf(node, "andb %>R, %<R", dreg, dreg);
871
		}
872
	} else {
873
		ia32_emitf(node, "set%PX %#R", (int)cc, dreg);
874
875
876
	}
}

877
/**
878
 * Emits code for a SwitchJmp
879
880
881
 */
static void emit_ia32_SwitchJmp(const ir_node *node)
{
882
	ir_entity             *jump_table = get_ia32_am_ent(node);
Matthias Braun's avatar
Matthias Braun committed
883
	const ir_switch_table *table      = get_ia32_switch_table(node);
Christian Würdig's avatar
Christian Würdig committed
884

885
	ia32_emitf(node, "jmp %*AM");
Matthias Braun's avatar
Matthias Braun committed
886
	be_emit_jump_table(node, table, jump_table, get_cfop_target_block);
Christian Würdig's avatar
Christian Würdig committed
887
888
889
890
891
}

/**
 * Emits code for an unconditional jump.
 */
892
static void emit_ia32_Jmp(const ir_node *node)
893
{
894
	/* we have a block schedule */
895
896
897
	ir_node *block  = get_nodes_block(node);
	ir_node *target = get_cfop_target_block(node);
	if (fallthrough_possible(block, target)) {
898
		if (be_options.verbose_asm)
899
			ia32_emitf(node, "/* fallthrough to %L */");
900
	} else {