ia32_emitter.c 81.6 KB
Newer Older
Christian Würdig's avatar
Christian Würdig committed
1
2
/*
 * This file is part of libFirm.
3
 * Copyright (C) 2012 University of Karlsruhe.
Christian Würdig's avatar
Christian Würdig committed
4
5
 */

6
/**
7
 * @file
Christian Würdig's avatar
Christian Würdig committed
8
9
 * @brief       This file implements the ia32 node emitter.
 * @author      Christian Wuerdig, Matthias Braun
10
11
 *
 * Summary table for x86 floating-point compares:
12
13
 * (remember effect of unordered on x86: ZF=1, PF=1, CF=1)
 *
14
15
16
17
18
 *   pnc_Eq  => !P && E
 *   pnc_Lt  => !P && B
 *   pnc_Le  => !P && BE
 *   pnc_Gt  => A
 *   pnc_Ge  => AE
19
 *   pnc_Lg  => NE
20
21
22
23
24
25
26
 *   pnc_Leg => NP  (ordered)
 *   pnc_Uo  => P
 *   pnc_Ue  => E
 *   pnc_Ul  => B
 *   pnc_Ule => BE
 *   pnc_Ug  => P || A
 *   pnc_Uge => P || AE
27
 *   pnc_Ne  => P || NE
28
 */
29
#include <inttypes.h>
Christian Würdig's avatar
Christian Würdig committed
30

31
32
#include "be_t.h"
#include "bearch_ia32_t.h"
33
#include "beblocksched.h"
34
#include "begnuas.h"
35
#include "besched.h"
36
#include "bestack.h"
37
#include "beutil.h"
38
#include "execfreq.h"
Christian Würdig's avatar
Christian Würdig committed
39
#include "gen_ia32_emitter.h"
Christian Würdig's avatar
Christian Würdig committed
40
#include "gen_ia32_regalloc_if.h"
41
#include "ia32_architecture.h"
42
43
44
45
46
47
#include "ia32_emitter.h"
#include "ia32_new_nodes.h"
#include "irgwalk.h"
#include "irtools.h"
#include "lc_opts.h"
#include "panic.h"
Christian Würdig's avatar
Christian Würdig committed
48

49
50
DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

/*
 * File-scope emitter state.
 * NOTE(review): apart from pic_base_label none of these variables is used in
 * the part of the file reviewed here; confirm their meaning at their users.
 */

/** Label that is subtracted from entity addresses when emitting PIC code. */
static char       pic_base_label[128];
static ir_label_t exc_label_id;
static bool       mark_spill_reload;

static bool       sp_relative;
static int        frame_type_size;
static int        callframe_offset;
58

59
60
61
/** Return the next block in Block schedule */
static ir_node *get_prev_block_sched(const ir_node *block)
{
62
	return (ir_node*)get_irn_link(block);
63
64
}

65
/** Checks if the current block is a fall-through target. */
66
static bool is_fallthrough(const ir_node *cfgpred)
67
{
Christoph Mallon's avatar
Christoph Mallon committed
68
	if (!is_Proj(cfgpred))
69
70
		return true;
	ir_node *pred = get_Proj_pred(cfgpred);
Christoph Mallon's avatar
Christoph Mallon committed
71
	if (is_ia32_SwitchJmp(pred))
72
73
		return false;
	return true;
74
75
}

76
77
78
79
/**
 * returns non-zero if the given block needs a label
 * because of being a jump-target (and not a fall-through)
 */
80
static bool block_needs_label(const ir_node *block)
81
{
82
	if (get_Block_entity(block) != NULL)
83
		return true;
84

85
86
	int  n_cfgpreds = get_Block_n_cfgpreds(block);
	bool need_label = true;
87
	if (n_cfgpreds == 0) {
88
		need_label = 0;
89
	} else if (n_cfgpreds == 1) {
Christoph Mallon's avatar
Christoph Mallon committed
90
91
		ir_node *cfgpred       = get_Block_cfgpred(block, 0);
		ir_node *cfgpred_block = get_nodes_block(cfgpred);
92
		if (get_prev_block_sched(block) == cfgpred_block
93
		    && is_fallthrough(cfgpred)) {
94
			need_label = 0;
95
96
97
98
99
100
		}
	}

	return need_label;
}

Michael Beck's avatar
Michael Beck committed
101
/**
 * Builds a label name of the form <private prefix><prefix><number>.
 *
 * The number comes from a counter that is incremented on every call, so a
 * number is never handed out twice. The first number used is 1.
 *
 * @param buf     buffer receiving the label
 * @param buflen  size of @p buf in bytes
 * @param prefix  text placed between the private prefix and the number
 * @return @p buf
 */
static char *get_unique_label(char *buf, size_t buflen, const char *prefix)
{
	static unsigned long counter = 0;

	const char *const private_prefix = be_gas_get_private_prefix();
	counter += 1;
	snprintf(buf, buflen, "%s%s%lu", private_prefix, prefix, counter);
	return buf;
}

111
static const char *get_register_name_8bit_low(const arch_register_t *reg)
112
{
113
114
115
116
117
118
119
	switch (reg->global_index) {
	case REG_EAX: return "al";
	case REG_EBX: return "bl";
	case REG_ECX: return "cl";
	case REG_EDX: return "dl";
	}
	panic("unexpected register");
120
121
}

122
static const char *get_register_name_8bit_high(const arch_register_t *reg)
Michael Beck's avatar
Michael Beck committed
123
{
124
125
126
127
128
129
130
131
	switch (reg->global_index) {
	case REG_EAX: return "ah";
	case REG_EBX: return "bh";
	case REG_ECX: return "ch";
	case REG_EDX: return "dh";
	}
	panic("unexpected register");
}
Michael Beck's avatar
Michael Beck committed
132

133
134
135
136
137
138
139
140
141
142
143
144
145
/**
 * Returns the name of the 16 bit part of @p reg (ax, bx, cx, dx, si, di, sp
 * or bp). Panics for any other register.
 */
static const char *get_register_name_16bit(const arch_register_t *reg)
{
	const char *name = NULL;

	switch (reg->global_index) {
	case REG_EAX: name = "ax"; break;
	case REG_EBX: name = "bx"; break;
	case REG_ECX: name = "cx"; break;
	case REG_EDX: name = "dx"; break;
	case REG_ESI: name = "si"; break;
	case REG_EDI: name = "di"; break;
	case REG_ESP: name = "sp"; break;
	case REG_EBP: name = "bp"; break;
	}
	if (name == NULL)
		panic("unexpected register");
	return name;
}

148
149
/**
 * Returns the name under which @p reg is addressed for a value of @p mode.
 *
 * @param reg   the register
 * @param mode  mode of the value; NULL selects the full register name
 * @return the low 8 bit name for 8 bit modes, the 16 bit name for 16 bit
 *         modes and the full register name otherwise
 */
static const char *get_register_name_mode(const arch_register_t *reg,
                                          ir_mode *mode)
{
	if (mode != NULL) {
		switch (get_mode_size_bits(mode)) {
		case  8: return get_register_name_8bit_low(reg);
		case 16: return get_register_name_16bit(reg);
		default: break;
		}
	}
	return reg->name;
}

162
163
164
165
166
/**
 * emit a register, possible shortened by a mode
 * @param reg   the register
 * @param mode  the mode of the register or NULL for full register
 */
167
static void emit_register(const arch_register_t *reg, ir_mode *mode)
168
{
169
	const char *name = get_register_name_mode(reg, mode);
170
	be_emit_char('%');
171
	be_emit_string(name);
Christian Würdig's avatar
Christian Würdig committed
172
173
}

174
175
/**
 * Emits a reference to @p entity.
 *
 * TLS entities get a relocation suffix: "@NTPOFF" if the entity has a
 * definition, "@INDNTPOFF" otherwise. When PIC is enabled, "-" and the PIC
 * base label are appended unless @p no_pic_adjust is set or the entity has
 * the code type.
 *
 * @param entity         the entity to reference
 * @param no_pic_adjust  non-zero suppresses the PIC base adjustment
 */
static void ia32_emit_entity(ir_entity *entity, int no_pic_adjust)
{
	be_gas_emit_entity(entity);

	if (is_tls_entity(entity)) {
		if (entity_has_definition(entity)) {
			be_emit_cstring("@NTPOFF");
		} else {
			be_emit_cstring("@INDNTPOFF");
		}
	}

	if (!be_options.pic || no_pic_adjust)
		return;
	if (get_entity_type(entity) == get_code_type())
		return;

	be_emit_char('-');
	be_emit_string(pic_base_label);
}

static void emit_ia32_Immediate_no_prefix(const ir_node *node)
{
	const ia32_immediate_attr_t *attr = get_ia32_immediate_attr_const(node);

196
197
198
	ir_entity *const entity = attr->entity;
	if (entity != NULL) {
		ia32_emit_entity(entity, attr->no_pic_adjust);
199
		if (attr->offset != 0) {
200
			be_emit_irprintf("%+"PRId32, attr->offset);
201
		}
202
	} else {
203
		be_emit_irprintf("0x%"PRIX32, (uint32_t)attr->offset);
204
205
206
207
208
209
210
211
	}
}

/**
 * Emits an ia32 Immediate node as an immediate operand, i.e. '$' followed by
 * its value.
 */
static void emit_ia32_Immediate(const ir_node *node)
{
	be_emit_char('$');
	emit_ia32_Immediate_no_prefix(node);
}
212

Matthias Braun's avatar
Matthias Braun committed
213
/**
 * Emits the instruction size suffix for an integer or reference mode:
 * 'b' for 8, 'w' for 16, 'l' for 32 and "ll" for 64 bits.
 * Panics for any other size.
 */
static void ia32_emit_mode_suffix_mode(const ir_mode *mode)
{
	assert(mode_is_int(mode) || mode_is_reference(mode));

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 8) {
		be_emit_char('b');
	} else if (bits == 16) {
		be_emit_char('w');
	} else if (bits == 32) {
		be_emit_char('l');
	} else if (bits == 64) {
		/* gas docu says q is the suffix but gcc, objdump and icc use ll
		 * apparently */
		be_emit_cstring("ll");
	} else {
		panic("cannot output mode_suffix for %+F", mode);
	}
}

227
/**
 * Emits the operand size suffix of an x87 instruction.
 *
 * Nothing is emitted for nodes of op type ia32_Normal. Otherwise the suffix
 * is derived from the load/store mode of @p node:
 *  - float modes:             32 -> 's', 64 -> 'l', 80/96/128 -> 't'
 *  - integer/reference modes: 16 -> 's', 32 -> 'l', 64 -> "ll"
 * Panics for any other mode.
 */
static void ia32_emit_x87_mode_suffix(ir_node const *const node)
{
	/* the mode only has to be spelled out when address mode is used */
	if (get_ia32_op_type(node) == ia32_Normal)
		return;

	ir_mode *const mode = get_ia32_ls_mode(node);
	assert(mode != NULL);

	if (mode_is_float(mode)) {
		unsigned const bits = get_mode_size_bits(mode);
		if (bits == 32) {
			be_emit_char('s');
			return;
		}
		if (bits == 64) {
			be_emit_char('l');
			return;
		}
		/* long doubles have different sizes due to alignment on different
		 * platforms. */
		if (bits == 80 || bits == 96 || bits == 128) {
			be_emit_char('t');
			return;
		}
	} else {
		assert(mode_is_int(mode) || mode_is_reference(mode));

		unsigned const bits = get_mode_size_bits(mode);
		if (bits == 16) {
			be_emit_char('s');
			return;
		}
		if (bits == 32) {
			be_emit_char('l');
			return;
		}
		if (bits == 64) {
			/* gas docu says q is the suffix but gcc, objdump and icc use ll
			 * apparently */
			be_emit_cstring("ll");
			return;
		}
	}
	panic("cannot output mode_suffix for %+F", mode);
}

259
/**
 * Returns the suffix character for an XMM operation on float mode @p mode:
 * 's' for 32 bit and 'd' for 64 bit. Panics for any other size.
 */
static char get_xmm_mode_suffix(ir_mode *mode)
{
	assert(mode_is_float(mode));

	unsigned const bits = get_mode_size_bits(mode);
	if (bits == 32)
		return 's';
	if (bits == 64)
		return 'd';
	panic("invalid XMM mode");
}

269
/**
 * Emits the XMM mode suffix that belongs to the load/store mode of @p node.
 */
static void ia32_emit_xmm_mode_suffix(ir_node const *const node)
{
	ir_mode *const ls_mode = get_ia32_ls_mode(node);
	assert(ls_mode != NULL);

	char const suffix = get_xmm_mode_suffix(ls_mode);
	be_emit_char(suffix);
}

Christian Würdig's avatar
Christian Würdig committed
276
/**
277
 * Returns the target block for a control flow node.
Christian Würdig's avatar
Christian Würdig committed
278
 */
279
static ir_node *get_cfop_target_block(const ir_node *irn)
Christoph Mallon's avatar
Christoph Mallon committed
280
{
281
	assert(get_irn_mode(irn) == mode_X);
282
	return (ir_node*)get_irn_link(irn);
283
}
Christian Würdig's avatar
Christian Würdig committed
284

285
286
287
288
289
290
/**
 * Emits the name of the block that control flow node @p node jumps to.
 */
static void ia32_emit_cfop_target(const ir_node *node)
{
	be_gas_emit_block_name(get_cfop_target_block(node));
}

294
/**
 * Emits the mnemonic suffix of a condition code (e.g. "e", "ae", "np").
 *
 * The float and float-unordered variants of a comparison share the suffix of
 * the corresponding unsigned integer condition. Panics if @p cc is not one of
 * the concrete condition codes.
 */
void x86_emit_condition_code(x86_condition_code_t cc)
{
	const char *suffix = NULL;

	switch (cc) {
	case x86_cc_overflow:      suffix = "o";  break;
	case x86_cc_not_overflow:  suffix = "no"; break;
	case x86_cc_float_below:
	case x86_cc_float_unordered_below:
	case x86_cc_below:         suffix = "b";  break;
	case x86_cc_float_above_equal:
	case x86_cc_float_unordered_above_equal:
	case x86_cc_above_equal:   suffix = "ae"; break;
	case x86_cc_float_equal:
	case x86_cc_equal:         suffix = "e";  break;
	case x86_cc_float_not_equal:
	case x86_cc_not_equal:     suffix = "ne"; break;
	case x86_cc_float_below_equal:
	case x86_cc_float_unordered_below_equal:
	case x86_cc_below_equal:   suffix = "be"; break;
	case x86_cc_float_above:
	case x86_cc_float_unordered_above:
	case x86_cc_above:         suffix = "a";  break;
	case x86_cc_sign:          suffix = "s";  break;
	case x86_cc_not_sign:      suffix = "ns"; break;
	case x86_cc_parity:        suffix = "p";  break;
	case x86_cc_not_parity:    suffix = "np"; break;
	case x86_cc_less:          suffix = "l";  break;
	case x86_cc_greater_equal: suffix = "ge"; break;
	case x86_cc_less_equal:    suffix = "le"; break;
	case x86_cc_greater:       suffix = "g";  break;
	case x86_cc_float_parity_cases:
	case x86_cc_additional_float_cases:
		/* these are not condition codes that can be emitted */
		break;
	}

	if (suffix == NULL)
		panic("invalid ia32 condition code");
	be_emit_string(suffix);
}

330
typedef enum ia32_emit_mod_t {
331
	EMIT_NONE         = 0,
332
	EMIT_RESPECT_LS   = 1U << 0,
333
	EMIT_ALTERNATE_AM = 1U << 1,
334
335
	EMIT_LONG         = 1U << 2,
	EMIT_HIGH_REG     = 1U << 3,
336
	EMIT_LOW_REG      = 1U << 4,
337
338
	EMIT_16BIT_REG    = 1U << 5,
	EMIT_SHIFT_COMMA  = 1U << 6,
339
} ia32_emit_mod_t;
340
ENUM_BITSET(ia32_emit_mod_t)
341

342
343
344
345
346
347
/**
 * Returns input @p pos of @p node, or NULL if that input is the ia32 NoReg_GP
 * node (i.e. no register is used there).
 */
static ir_node const *get_irn_n_reg(ir_node const *const node, int const pos)
{
	ir_node *const operand = get_irn_n(node, pos);
	if (is_ia32_NoReg_GP(operand))
		return NULL;
	return operand;
}

348
349
350
/**
 * Emits address mode.
 */
351
static void ia32_emit_am(ir_node const *const node)
352
353
{
	/* just to be sure... */
354
	assert(get_ia32_frame_use(node) == IA32_FRAME_USE_NONE || get_ia32_frame_ent(node));
355

356
357
358
	if (get_ia32_am_tls_segment(node))
		be_emit_cstring("%gs:");

359
360
361
	ir_node const *const base = get_irn_n_reg(node, n_ia32_base);
	ir_node const *const idx  = get_irn_n_reg(node, n_ia32_index);

362
	/* emit offset */
363
364
365
	int32_t    const offs = get_ia32_am_offs_int(node);
	ir_entity *const ent  = get_ia32_am_ent(node);
	if (ent) {
366
		const ia32_attr_t *attr = get_ia32_attr_const(node);
367
		ia32_emit_entity(ent, attr->am_sc_no_pic_adjust);
368
		if (offs != 0)
369
			be_emit_irprintf("%+"PRId32, offs);
370
371
372
	} else if (offs != 0 || (!base && !idx)) {
		/* also handle special case if nothing is set */
		be_emit_irprintf("%"PRId32, offs);
373
374
	}

375
	if (base || idx) {
376
377
378
		be_emit_char('(');

		/* emit base */
379
		if (base) {
380
			arch_register_t const *const reg = arch_get_irn_register(base);
381
382
383
384
			emit_register(reg, NULL);
		}

		/* emit index + scale */
385
		if (idx) {
386
			be_emit_char(',');
387
			arch_register_t const *const reg = arch_get_irn_register(idx);
388
389
			emit_register(reg, NULL);

390
			int const scale = get_ia32_am_scale(node);
391
			if (scale > 0)
392
393
394
395
396
397
				be_emit_irprintf(",%d", 1 << scale);
		}
		be_emit_char(')');
	}
}

398
static x86_condition_code_t determine_final_cc(ir_node const *node, int flags_pos);
399
400

/**
 * Emits assembler text for @p node according to a printf-like format string.
 *
 * Every line starts with a tab. A '\n' in the format finishes the current
 * line and starts a new one. A conversion has the form
 * '%' [modifiers] conversion.
 *
 * Modifiers (see ia32_emit_mod_t):
 *   *  alternate address mode      #  respect load/store mode
 *   l  long argument               >  high 8 bit register name
 *   <  low 8 bit register name     ^  16 bit register name
 *   ,  append ',' (an immediate 1 is omitted completely)
 *
 * Conversions:
 *   %%   a literal '%'
 *   %AF  x87 register pair for ia32_Normal nodes, else the address mode
 *   %AM  the address mode
 *   %AR  takes a register argument; emits it for ia32_Normal nodes, else the
 *        address mode
 *   %ASn input n for ia32_Normal nodes, else the address mode
 *   %B   right binary operand (immediate, register or address mode), ", ",
 *        left binary operand register; for an immediate with address mode
 *        the address mode takes the place of the left register
 *   %Dn  output register n
 *   %FM  x87 mode suffix          %FP  'p' if the x87 node pops
 *   %FR  'r' if the x87 operands are permuted
 *   %FX  XMM mode suffix          %F0  register of the x87 attribute
 *   %I   @p node itself as immediate
 *   %L   control flow target label
 *   %M   mode suffix of the load/store mode (32 bit GP mode if none is set)
 *   %PX  condition code, passed as int argument
 *   %Pn  condition code determined from flags input n
 *   %R   register, passed as arch_register_t const* argument
 *   %Sn  input n, either an immediate or a register
 *   %s   string argument
 *   %u / %d  unsigned / int argument (unsigned long / long with 'l')
 *
 * Panics on an unknown conversion.
 */
void ia32_emitf(ir_node const *const node, char const *fmt, ...)
{
	va_list ap;
	va_start(ap, fmt);

	be_emit_char('\t');
	for (;;) {
		const char            *start = fmt;
		ia32_emit_mod_t        mod   = EMIT_NONE;
		/* operands shared between the conversions via the emit_R/emit_I
		 * labels below */
		arch_register_t const *reg;
		ir_node         const *imm;

		/* copy literal text verbatim */
		while (*fmt != '%' && *fmt != '\n' && *fmt != '\0')
			++fmt;
		if (fmt != start) {
			be_emit_string_len(start, fmt - start);
		}

		if (*fmt == '\n') {
			be_emit_char('\n');
			be_emit_write_line();
			be_emit_char('\t');
			++fmt;
			if (*fmt == '\0')
				break;
			continue;
		}

		if (*fmt == '\0')
			break;

		/* skip the '%' and collect the modifiers */
		++fmt;
		for (;;) {
			switch (*fmt) {
			case '*': mod |= EMIT_ALTERNATE_AM; break;
			case '#': mod |= EMIT_RESPECT_LS;   break;
			case 'l': mod |= EMIT_LONG;         break;
			case '>': mod |= EMIT_HIGH_REG;     break;
			case '<': mod |= EMIT_LOW_REG;      break;
			case '^': mod |= EMIT_16BIT_REG;    break;
			case ',': mod |= EMIT_SHIFT_COMMA;  break;
			default:
				goto end_of_mods;
			}
			++fmt;
		}
end_of_mods:

		switch (*fmt++) {
			case '%':
				be_emit_char('%');
				break;

			case 'A': {
				switch (*fmt++) {
					case 'F':
						if (get_ia32_op_type(node) == ia32_Normal) {
							ia32_x87_attr_t const *const attr = get_ia32_x87_attr_const(node);
							if (attr->res_in_reg) {
								be_emit_irprintf("%%st, %%%s", attr->reg->name);
							} else {
								be_emit_irprintf("%%%s, %%st", attr->reg->name);
							}
							break;
						} else {
							goto emit_AM;
						}

emit_AM:
					case 'M':
						if (mod & EMIT_ALTERNATE_AM)
							be_emit_char('*');
						ia32_emit_am(node);
						break;

					case 'R':
						/* the register argument is consumed in both cases */
						reg = va_arg(ap, const arch_register_t*);
						if (get_ia32_op_type(node) == ia32_Normal) {
							goto emit_R;
						} else {
							goto emit_AM;
						}

					case 'S':
						if (get_ia32_op_type(node) == ia32_Normal) {
							goto emit_S;
						} else {
							/* skip the input number, it is not needed */
							++fmt;
							goto emit_AM;
						}

					default: goto unknown;
				}
				break;
			}

			case 'B': {
				ir_node const *const src = get_irn_n(node, n_ia32_binary_right);
				if (is_ia32_Immediate(src)) {
					emit_ia32_Immediate(src);
					be_emit_cstring(", ");
					if (get_ia32_op_type(node) == ia32_Normal) {
						goto destination_operand;
					} else {
						ia32_emit_am(node);
					}
				} else {
					if (get_ia32_op_type(node) == ia32_Normal) {
						reg = arch_get_irn_register(src);
						emit_register(reg, get_ia32_ls_mode(node));
					} else {
						ia32_emit_am(node);
					}
					be_emit_cstring(", ");
destination_operand:
					reg = arch_get_irn_register_in(node, n_ia32_binary_left);
					emit_register(reg, get_ia32_ls_mode(node));
				}
				break;
			}

			case 'D':
				if (*fmt < '0' || '9' < *fmt)
					goto unknown;
				reg = arch_get_irn_register_out(node, *fmt++ - '0');
				goto emit_R;

			case 'F':
				if (*fmt == 'M') {
					ia32_emit_x87_mode_suffix(node);
				} else if (*fmt == 'P') {
					ia32_x87_attr_t const *const attr = get_ia32_x87_attr_const(node);
					if (attr->pop)
						be_emit_char('p');
				} else if (*fmt == 'R') {
					/* NOTE: Work around a gas quirk for non-commutative operations if the
					 * destination register is not %st0.  In this case r/non-r is swapped.
					 * %st0 = %st0 - %st1 -> fsub  %st1, %st0 (as expected)
					 * %st0 = %st1 - %st0 -> fsubr %st1, %st0 (as expected)
					 * %st1 = %st0 - %st1 -> fsub  %st0, %st1 (expected: fsubr)
					 * %st1 = %st1 - %st0 -> fsubr %st0, %st1 (expected: fsub)
					 * In fact this corresponds to the encoding of the instruction:
					 * - The r suffix selects whether %st0 is on the left (no r) or on the
					 *   right (r) side of the executed operation.
					 * - The placement of %st0 selects whether the result is written to
					 *   %st0 (right) or the other register (left).
					 * This means that it is sufficient to test whether the operands are
					 * permuted.  In particular it is not necessary to consider whether the
					 * result is to be placed into the explicit register operand. */
					if (get_ia32_x87_attr_const(node)->attr.ins_permuted)
						be_emit_char('r');
				} else if (*fmt == 'X') {
					ia32_emit_xmm_mode_suffix(node);
				} else if (*fmt == '0') {
					be_emit_char('%');
					be_emit_string(get_ia32_x87_attr_const(node)->reg->name);
				} else {
					goto unknown;
				}
				++fmt;
				break;

			case 'I':
				imm = node;
emit_I:
				if (mod & EMIT_SHIFT_COMMA) {
					const ia32_immediate_attr_t *attr
						= get_ia32_immediate_attr_const(imm);
					/* a constant 1 is left out together with its comma */
					if (attr->entity == NULL && attr->offset == 1)
						break;
				}
				if (!(mod & EMIT_ALTERNATE_AM))
					be_emit_char('$');
				emit_ia32_Immediate_no_prefix(imm);
				if (mod & EMIT_SHIFT_COMMA) {
					be_emit_char(',');
				}
				break;

			case 'L':
				ia32_emit_cfop_target(node);
				break;

			case 'M': {
				ir_mode *mode = get_ia32_ls_mode(node);
				if (!mode)
					mode = ia32_mode_gp;
				if (mod & EMIT_RESPECT_LS) {
					/* 32 bit needs no suffix at all; smaller modes get a
					 * sign/zero marker in front of the size suffix */
					if (get_mode_size_bits(mode) == 32)
						break;
					be_emit_char(mode_is_signed(mode) ? 's' : 'z');
				}
				ia32_emit_mode_suffix_mode(mode);
				break;
			}

			case 'P': {
				x86_condition_code_t cc;
				if (*fmt == 'X') {
					++fmt;
					cc = (x86_condition_code_t)va_arg(ap, int);
				} else if ('0' <= *fmt && *fmt <= '9') {
					cc = determine_final_cc(node, *fmt - '0');
					++fmt;
				} else {
					goto unknown;
				}
				x86_emit_condition_code(cc);
				break;
			}

			case 'R':
				reg = va_arg(ap, const arch_register_t*);
emit_R:
				if (mod & EMIT_ALTERNATE_AM)
					be_emit_char('*');
				const char *name;
				if (mod & EMIT_HIGH_REG) {
					name = get_register_name_8bit_high(reg);
				} else if (mod & EMIT_LOW_REG) {
					name = get_register_name_8bit_low(reg);
				} else if (mod & EMIT_16BIT_REG) {
					name = get_register_name_16bit(reg);
				} else {
					name = mod & EMIT_RESPECT_LS
						 ? get_register_name_mode(reg, get_ia32_ls_mode(node))
						 : reg->name;
				}
				be_emit_char('%');
				be_emit_string(name);
				if (mod & EMIT_SHIFT_COMMA) {
					be_emit_char(',');
				}
				break;

emit_S:
			case 'S': {
				if (*fmt < '0' || '9' < *fmt)
					goto unknown;

				unsigned pos = *fmt++ - '0';
				ir_node const *const src = get_irn_n(node, pos);
				if (is_ia32_Immediate(src)) {
					imm = src;
					goto emit_I;
				} else {
					reg = arch_get_irn_register(src);
					goto emit_R;
				}
			}

			case 's': {
				const char *str = va_arg(ap, const char*);
				be_emit_string(str);
				break;
			}

			case 'u':
				if (mod & EMIT_LONG) {
					unsigned long num = va_arg(ap, unsigned long);
					be_emit_irprintf("%lu", num);
				} else {
					unsigned num = va_arg(ap, unsigned);
					be_emit_irprintf("%u", num);
				}
				break;

			case 'd':
				if (mod & EMIT_LONG) {
					long num = va_arg(ap, long);
					be_emit_irprintf("%ld", num);
				} else {
					int num = va_arg(ap, int);
					be_emit_irprintf("%d", num);
				}
				break;

			default:
unknown:
				panic("unknown format conversion");
		}
	}

	be_emit_finish_line_gas(node);
	va_end(ap);
}

685
686
687
/**
 * walks up a tree of copies/perms/spills/reloads to find the original value
 * that is moved around
688
 */
689
690
static ir_node *find_original_value(ir_node *node)
{
691
692
693
694
695
696
697
698
699
700
701
	if (irn_visited(node))
		return NULL;

	mark_irn_visited(node);
	if (be_is_Copy(node)) {
		return find_original_value(be_get_Copy_op(node));
	} else if (be_is_CopyKeep(node)) {
		return find_original_value(be_get_CopyKeep_op(node));
	} else if (is_Proj(node)) {
		ir_node *pred = get_Proj_pred(node);
		if (be_is_Perm(pred)) {
702
			return find_original_value(get_irn_n(pred, get_Proj_num(node)));
703
		} else if (be_is_MemPerm(pred)) {
704
			return find_original_value(get_irn_n(pred, get_Proj_num(node)));
705
706
		} else if (is_ia32_Load(pred)) {
			return find_original_value(get_irn_n(pred, n_ia32_Load_mem));
Andreas Zwinkau's avatar
Andreas Zwinkau committed
707
708
		} else if (is_ia32_Store(pred)) {
			return find_original_value(get_irn_n(pred, n_ia32_Store_val));
709
710
711
		} else {
			return node;
		}
712
	} else if (is_Phi(node)) {
713
		foreach_irn_in(node, i, in) {
714
715
716
717
718
719
720
			ir_node *res = find_original_value(in);
			if (res != NULL)
				return res;
		}
		return NULL;
	} else {
		return node;
721
722
723
	}
}

724
/**
 * Determines the condition code that has to be emitted for @p node.
 *
 * Starts with the condition code stored in the node (negated if the node's
 * inputs are permuted) and inverts it if the operands of the instruction
 * producing the flags are permuted. For flags coming from a Sahf the x87
 * compare feeding it is looked up, if necessary through copies, spills and
 * reloads.
 *
 * @param node       node with a condcode attribute
 * @param flags_pos  input number of the flags operand of @p node
 */
static x86_condition_code_t determine_final_cc(ir_node const *const node, int const flags_pos)
{
	ia32_condcode_attr_t const *const attr = get_ia32_condcode_attr_const(node);
	x86_condition_code_t              cc   = attr->condition_code;
	if (attr->attr.ins_permuted)
		cc = x86_negate_condition_code(cc);

	ir_node *flags = skip_Proj(get_irn_n(node, flags_pos));

	/* Permuted operands of a test instruction do not change the result. */
	if (is_ia32_Test(flags))
		return cc;

	if (is_ia32_Sahf(flags)) {
		flags = get_irn_n(flags, n_ia32_Sahf_val);
		if (!is_ia32_FucomFnstsw(flags) && !is_ia32_FucomppFnstsw(flags) && !is_ia32_FtstFnstsw(flags)) {
			ir_graph *const irg = get_irn_irg(node);
			inc_irg_visited(irg);
			flags = find_original_value(flags);
			/* find_original_value() may give up; fail with a message instead
			 * of handing NULL to the node accessors below */
			if (flags == NULL)
				panic("cannot find the compare producing the flags of a Sahf");
			assert(is_ia32_FucomFnstsw(flags) || is_ia32_FucomppFnstsw(flags) || is_ia32_FtstFnstsw(flags));
		}
	}

	ia32_attr_t const *const flags_attr = get_ia32_attr_const(flags);
	if (flags_attr->ins_permuted)
		cc = x86_invert_condition_code(cc);
	return cc;
}

753
754
755
756
757
758
/**
 * Emits the exception label of @p node: the instruction label prefix followed
 * by the node's exception label id.
 */
static void ia32_emit_exc_label(const ir_node *node)
{
	const char *const prefix = be_gas_insn_label_prefix();

	be_emit_string(prefix);
	be_emit_irprintf("%lu", get_ia32_exc_label_id(node));
}

762
static bool fallthrough_possible(const ir_node *block, const ir_node *target)
763
{
764
	return get_prev_block_sched(target) == block;
765
766
}

Christian Würdig's avatar
Christian Würdig committed
767
768
769
/**
 * Emits the jump sequence for a conditional jump (cmp + jmp_true + jmp_false)
 */
770
static void emit_ia32_Jcc(const ir_node *node)
771
{
772
	x86_condition_code_t cc = determine_final_cc(node, n_ia32_Jcc_eflags);
Christian Würdig's avatar
Christian Würdig committed
773

774
	/* get both Projs */
775
	ir_node const *proj_true   = get_Proj_for_pn(node, pn_ia32_Jcc_true);
776
	ir_node const *target_true = get_cfop_target_block(proj_true);
777
	ir_node const *proj_false  = get_Proj_for_pn(node, pn_ia32_Jcc_false);
778
779
	ir_node const *block       = get_nodes_block(node);
	if (fallthrough_possible(block, target_true)) {
780
		/* exchange both proj's so the second one can be omitted */
781
782
		const ir_node *t = proj_true;

783
784
		proj_true  = proj_false;
		proj_false = t;
785
		cc         = x86_negate_condition_code(cc);
786
	}
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
	const ir_node *target_false = get_cfop_target_block(proj_false);
	bool           fallthrough  = fallthrough_possible(block, target_false);
	/* if we can't have a fallthrough anyway, put the more likely case first */
	if (!fallthrough) {
		/* We would need execfreq for the concrete edge, but don't have it
		 * available here, so we use the block execfreq :-( */
		double freq_true  = get_block_execfreq(target_true);
		double freq_false = get_block_execfreq(target_false);
		if (freq_false > freq_true) {
			const ir_node *t = proj_true;
			proj_true  = proj_false;
			proj_false = t;
			cc         = x86_negate_condition_code(cc);
		}
	}
802

803
	bool need_parity_label = false;
804
	if (cc & x86_cc_float_parity_cases) {
805
806
		/* Some floating point comparisons require a test of the parity flag,
		 * which indicates that the result is unordered */
807
		if (cc & x86_cc_negated) {
808
			ia32_emitf(proj_true, "jp %L");
809
		} else {
810
811
			/* we need a local label if the false proj is a fallthrough
			 * as the falseblock might have no label emitted then */
812
813
			if (fallthrough) {
				need_parity_label = true;
814
				ia32_emitf(proj_false, "jp 1f");
815
			} else {
816
				ia32_emitf(proj_false, "jp %L");
817
			}
818
		}
819
	}
820
	ia32_emitf(proj_true, "j%PX %L", (int)cc);
Christoph Mallon's avatar
Christoph Mallon committed
821
	if (need_parity_label) {
822
823
		be_emit_cstring("1:\n");
		be_emit_write_line();
824
825
	}

826
	/* the second Proj might be a fallthrough */
827
	if (fallthrough) {
828
		if (be_options.verbose_asm)
829
			ia32_emitf(proj_false, "/* fallthrough to %L */");
830
	} else {
831
		ia32_emitf(proj_false, "jmp %L");
832
	}
Michael Beck's avatar
Michael Beck committed
833
834
}

835
836
837
838
839
840
/**
 * Emits an ia32 Setcc. This is mostly easy but some floating point compares
 * are tricky.
 */
static void emit_ia32_Setcc(const ir_node *node)
{
841
	const arch_register_t *dreg = arch_get_irn_register_out(node, pn_ia32_Setcc_res);
842

843
	x86_condition_code_t const cc = determine_final_cc(node, n_ia32_Setcc_eflags);
844
845
	if (cc & x86_cc_float_parity_cases) {
		if (cc & x86_cc_negated) {
846
847
848
			ia32_emitf(node, "set%PX %<R", (int)cc, dreg);
			ia32_emitf(node, "setp %>R", dreg);
			ia32_emitf(node, "orb %>R, %<R", dreg, dreg);
849
		} else {
850
851
852
			ia32_emitf(node, "set%PX %<R", (int)cc, dreg);
			ia32_emitf(node, "setnp %>R", dreg);
			ia32_emitf(node, "andb %>R, %<R", dreg, dreg);
853
		}
854
	} else {
855
		ia32_emitf(node, "set%PX %#R", (int)cc, dreg);
856
857
858
	}
}

859
/**
860
 * Emits code for a SwitchJmp
861
862
863
 */
static void emit_ia32_SwitchJmp(const ir_node *node)
{
864
	ir_entity             *jump_table = get_ia32_am_ent(node);
Matthias Braun's avatar
Matthias Braun committed
865
	const ir_switch_table *table      = get_ia32_switch_table(node);
Christian Würdig's avatar
Christian Würdig committed
866

867
	ia32_emitf(node, "jmp %*AM");
Matthias Braun's avatar
Matthias Braun committed
868
	be_emit_jump_table(node, table, jump_table, get_cfop_target_block);
Christian Würdig's avatar
Christian Würdig committed
869
870
871
872
873
}

/**
 * Emits code for a unconditional jump.
 */
874
static void emit_ia32_Jmp(const ir_node *node)
875
{
876
	/* we have a block schedule */
877
878
879
	ir_node *block  = get_nodes_block(node);
	ir_node *target = get_cfop_target_block(node);
	if (fallthrough_possible(block, target)) {
880
		if (be_options.verbose_asm)
881
			ia32_emitf(node, "/* fallthrough to %L */");
882
	} else {
883
		ia32_emitf(node, "jmp %L");
Christian Würdig's avatar
Christian Würdig committed
884
885
886
	}
}

887
888
889
890
891
892
893
894
895
/**
 * Emits a register operand of an inline assembler statement.
 *
 * @param reg       the register
 * @param modifier  operand modifier: '\0' derives the name from @p mode,
 *                  'b' low 8 bit name, 'h' high 8 bit name, 'w' 16 bit name,
 *                  'k' full register name; anything else panics
 * @param mode      mode of the operand, only used without modifier
 */
static void emit_ia32_asm_register(const arch_register_t *reg, char modifier,
                                   ir_mode *mode)
{
	const char *name;

	if (modifier == '\0') {
		name = get_register_name_mode(reg, mode);
	} else if (modifier == 'b') {
		name = get_register_name_8bit_low(reg);
	} else if (modifier == 'h') {
		name = get_register_name_8bit_high(reg);
	} else if (modifier == 'w') {
		name = get_register_name_16bit(reg);
	} else if (modifier == 'k') {
		name = reg->name;
	} else {
		panic("invalid asm op modifier");
	}

	be_emit_char('%');
	be_emit_string(name);
}

904
905
906
/**
 * Emits code for an ASM pseudo op.
 */
907
static void emit_ia32_Asm(const ir_node *node)
908
{
909
910
	const ia32_asm_attr_t *attr = get_ia32_asm_attr_const(node);
	x86_emit_asm(node, &attr->asmattr, emit_ia32_asm_register);