beblocksched.c 19.7 KB
Newer Older
Christian Würdig's avatar
Christian Würdig committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
/*
 * Copyright (C) 1995-2007 University of Karlsruhe.  All right reserved.
 *
 * This file is part of libFirm.
 *
 * This file may be distributed and/or modified under the terms of the
 * GNU General Public License version 2 as published by the Free Software
 * Foundation and appearing in the file LICENSE.GPL included in the
 * packaging of this file.
 *
 * Licensees holding valid libFirm Professional Edition licenses may use
 * this file in accordance with the libFirm Commercial License.
 * Agreement provided with the Software.
 *
 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE.
 */

Christian Würdig's avatar
Christian Würdig committed
20
21
22
23
24
25
/**
 * @file
 * @brief       Block-scheduling strategies.
 * @author      Matthias Braun, Christoph Mallon
 * @date        27.09.2006
 * @version     $Id$
26
27
28
29
30
31
32
33
34
35
 *
 * The greedy (and ILP) algorithms here work by assuming that we want to
 * change as many jumps to fallthroughs as possible (executed jumps actually,
 * so we have to look at the execution frequencies). The algorithms do this by
 * collecting the execution frequencies of all branches (which is easily
 * possible when all critical edges are split) and then removing critical edges
 * where possible, as we neither need nor want them anymore. The algorithms
 * then try to change as many edges to fallthroughs as possible; this is done
 * by setting next and prev pointers on blocks. The greedy algorithm sorts the
 * edges by execution frequency and tries to transform them to fallthroughs in
 * this order.
36
37
 */
#ifdef HAVE_CONFIG_H
38
#include "config.h"
Matthias Braun's avatar
Matthias Braun committed
39
#endif
40
41
42
43
44
45
46
47
48
49

#include "beblocksched.h"

#include <stdlib.h>

#include "array.h"
#include "pdeq.h"

#include "iredges.h"
#include "irgwalk.h"
Michael Beck's avatar
Michael Beck committed
50
#include "irnode_t.h"
51
52
53
#include "irgraph_t.h"
#include "irloop.h"
#include "irprintf.h"
Michael Beck's avatar
Michael Beck committed
54
#include "execfreq.h"
55
#include "irdump_t.h"
56
57
#include "irtools.h"
#include "debug.h"
58
#include "beirgmod.h"
59
60
#include "bemodule.h"
#include "be.h"
61

62
63
64
65
#include <libcore/lc_opts.h>
#include <libcore/lc_opts_enum.h>
#include <libcore/lc_timing.h>

66
67
68
#ifdef WITH_ILP
#include <lpp/lpp.h>
#include <lpp/lpp_net.h>
Christian Würdig's avatar
Christian Würdig committed
69
#endif /* WITH_ILP */
70

Matthias Braun's avatar
Matthias Braun committed
71
72
/** Debug module handle used by the DBG() calls in this file; registered in be_init_blocksched(). */
DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)

73
74
75
76
77
78
79
80
81
82
83
84
typedef enum _blocksched_algos_t {
	BLOCKSCHED_NAIV, BLOCKSCHED_EXTBB, BLOCKSCHED_GREEDY, BLOCKSCHED_ILP
} blocksched_algos_t;

static int algo = BLOCKSCHED_GREEDY;

static const lc_opt_enum_int_items_t blockschedalgo_items[] = {
	{ "naiv",	BLOCKSCHED_NAIV },
	{ "extbb",	BLOCKSCHED_EXTBB },
	{ "greedy", BLOCKSCHED_GREEDY },
#ifdef WITH_ILP
	{ "ilp",    BLOCKSCHED_ILP },
Christian Würdig's avatar
Christian Würdig committed
85
#endif /* WITH_ILP */
86
87
88
89
90
91
92
93
	{ NULL,     0 }
};

static lc_opt_enum_int_var_t algo_var = {
	&algo, blockschedalgo_items
};

static const lc_opt_table_entry_t be_blocksched_options[] = {
Christian Würdig's avatar
Christian Würdig committed
94
	LC_OPT_ENT_ENUM_INT ("algo", "the block scheduling algorithm", &algo_var),
95
	LC_OPT_LAST
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
};

/*
 *   ____                   _
 *  / ___|_ __ ___  ___  __| |_   _
 * | |  _| '__/ _ \/ _ \/ _` | | | |
 * | |_| | | |  __/  __/ (_| | |_| |
 *  \____|_|  \___|\___|\__,_|\__, |
 *                            |___/
 */

/**
 * Per-block schedule entry, stored in the irn link of its block.
 * Entries are chained through next/prev into runs of blocks that are
 * placed directly behind each other in the final schedule.
 */
typedef struct _blocksched_entry_t {
	ir_node *block;                     /**< the block this entry describes */
	struct _blocksched_entry_t *next;   /**< entry placed directly after this one, or NULL */
	struct _blocksched_entry_t *prev;   /**< entry placed directly before this one, or NULL */
} blocksched_entry_t;

typedef struct _edge_t {
114
115
116
	ir_node *block;             /**< source block */
	int     pos;                /**< number of cfg predecessor (target) */
	double  execfreq;           /**< the frequency */
117
	int     highest_execfreq;   /**< flag that indicates whether this edge is the edge with the highest
118
119
120
121
							   	     execfreq pointing away from this block */
} edge_t;

typedef struct _blocksched_env_t {
122
	ir_graph       *irg;
123
	struct obstack *obst;
124
125
126
127
	ir_exec_freq   *execfreqs;
	edge_t         *edges;
	pdeq           *worklist;
	int            blockcount;
128
129
} blocksched_env_t;

130
131
132
133
/**
 * Collect cfg frequencies of all edges between blocks.
 * Also determines edge with highest frequency.
 */
134
135
static void collect_egde_frequency(ir_node *block, void *data)
{
136
	blocksched_env_t   *env = data;
137
138
	int                arity;
	edge_t             edge;
139
140
	blocksched_entry_t *entry;

141
	entry        = obstack_alloc(env->obst, sizeof(entry[0]));
142
	entry->block = block;
143
144
	entry->next  = NULL;
	entry->prev  = NULL;
145
146
	set_irn_link(block, entry);

147
	arity = get_Block_n_cfgpreds(block);
148

149
150
151
152
153
	if (arity == 0) {
		assert(block == get_irg_start_block(env->irg));
		/* must be the start block, nothing to do here */
		return;
	} else if (arity == 1) {
154
155
156
		edge.block            = block;
		edge.pos              = 0;
		edge.execfreq         = get_block_execfreq(env->execfreqs, block);
157
158
159
		edge.highest_execfreq = 1;
		ARR_APP1(edge_t, env->edges, edge);
	} else {
160
		int    i;
161
		double highest_execfreq = -1.0;
162
		int    highest_edge_num = -1;
163
164

		edge.block = block;
165
166
		for (i = 0; i < arity; ++i) {
			double  execfreq;
167
			ir_node *pred_block = get_Block_cfgpred_block(block, i);
168

169
170
			execfreq = get_block_execfreq(env->execfreqs, pred_block);

171
172
			edge.pos              = i;
			edge.execfreq         = execfreq;
173
174
			edge.highest_execfreq = 0;
			ARR_APP1(edge_t, env->edges, edge);
175
176

			if (execfreq > highest_execfreq) {
177
178
179
180
181
				highest_execfreq = execfreq;
				highest_edge_num = ARR_LEN(env->edges) - 1;
			}
		}

182
183
		if(highest_edge_num >= 0)
			env->edges[highest_edge_num].highest_execfreq = 1;
184
185
186
187
188
189
190
	}
}

static int cmp_edges(const void *d1, const void *d2)
{
	const edge_t *e1 = d1;
	const edge_t *e2 = d2;
191
192

	return QSORT_CMP(e2->execfreq, e1->execfreq);
193
194
195
196
197
198
199
}

/**
 * Walks env->edges in array order twice and links the schedule entries of
 * the two blocks of an edge (pred->next = block, block->prev = pred) when
 * both ends are still unlinked.
 *
 * The first pass only considers edges flagged as highest_execfreq whose
 * predecessor block has exactly one block successor (plain jumps). The
 * second pass considers all remaining edges except backedges.
 */
static void coalesce_blocks(blocksched_env_t *env)
{
	const int n_edges = ARR_LEN(env->edges);
	int       idx;

	/* run1: only look at jumps */
	for (idx = 0; idx < n_edges; ++idx) {
		const edge_t       *e      = &env->edges[idx];
		ir_node            *target = e->block;
		ir_node            *source;
		blocksched_entry_t *target_entry;
		blocksched_entry_t *source_entry;

		/* only check the edge with the highest frequency, and skip
		 * blocks that might have been removed already */
		if (!e->highest_execfreq || is_Bad(get_Block_cfgpred(target, 0)))
			continue;

		source       = get_Block_cfgpred_block(target, e->pos);
		target_entry = get_irn_link(target);
		source_entry = get_irn_link(source);

		/* is one of the blocks already attached to another block? */
		if (source_entry->next != NULL || target_entry->prev != NULL)
			continue;

		/* only coalesce jumps: the source must not have a second successor */
		if (get_block_succ_next(source, get_block_succ_first(source)) != NULL)
			continue;

		/* schedule the 2 blocks behind each other */
		DBG((dbg, LEVEL_1, "Coalesce (Jump) %+F -> %+F (%.3g)\n",
		           source_entry->block, target_entry->block, e->execfreq));
		source_entry->next = target_entry;
		target_entry->prev = source_entry;
	}

	/* run2: remaining edges */
	for (idx = 0; idx < n_edges; ++idx) {
		const edge_t       *e      = &env->edges[idx];
		ir_node            *target = e->block;
		ir_node            *source;
		blocksched_entry_t *target_entry;
		blocksched_entry_t *source_entry;

		/* the block might have been removed already... */
		if (is_Bad(get_Block_cfgpred(target, 0)))
			continue;

		/* we can't do fallthroughs in backedges */
		if (is_backedge(target, e->pos))
			continue;

		source       = get_Block_cfgpred_block(target, e->pos);
		target_entry = get_irn_link(target);
		source_entry = get_irn_link(source);

		/* is one of the blocks already attached to another block? */
		if (source_entry->next != NULL || target_entry->prev != NULL)
			continue;

		/* schedule the 2 blocks behind each other */
		DBG((dbg, LEVEL_1, "Coalesce (CondJump) %+F -> %+F (%.3g)\n",
		           source_entry->block, target_entry->block, e->execfreq));
		source_entry->next = target_entry;
		target_entry->prev = source_entry;
	}
}

/**
 * Completes the schedule chain beginning at @p entry.
 *
 * For every block reached it marks the block visited, counts it in
 * env->blockcount and queues the heads of the chains of its unvisited
 * successors in env->worklist. If the entry already has a next entry the
 * walk simply follows it. Otherwise the unvisited successor without a
 * prev entry and with the highest execution frequency is appended; if there
 * is none, the next unvisited block is taken from the worklist. The walk
 * ends on an already visited block or when the worklist runs empty.
 *
 * @param entry  the entry to continue the schedule from
 * @param env    the scheduler environment (worklist, execfreqs, blockcount)
 */
static void pick_block_successor(blocksched_entry_t *entry, blocksched_env_t *env)
{
	/* every iteration handles one block and then advances to the entry
	 * scheduled directly behind it */
	for (;;) {
		ir_node            *block     = entry->block;
		ir_node            *best_succ = NULL;
		double             best_freq  = -1;
		blocksched_entry_t *next_entry;
		const ir_edge_t    *edge;

		if (irn_visited(block))
			return;

		env->blockcount++;
		mark_irn_visited(block);

		DBG((dbg, LEVEL_1, "Pick succ of %+F\n", block));

		/* put all successors into the worklist */
		foreach_block_succ(block, edge) {
			ir_node            *succ_block = get_edge_src_irn(edge);
			blocksched_entry_t *chain_head;

			if (irn_visited(succ_block))
				continue;

			/* we only need to put the first of a series of already
			 * connected blocks into the worklist */
			chain_head = get_irn_link(succ_block);
			while (chain_head->prev != NULL) {
				/* walked around a cycle back to the start: cut it open */
				if (chain_head->prev->block == succ_block) {
					chain_head->prev->next = NULL;
					chain_head->prev       = NULL;
					break;
				}
				chain_head = chain_head->prev;
			}

			if (irn_visited(chain_head->block))
				continue;

			DBG((dbg, LEVEL_1, "Put %+F into worklist\n", chain_head->block));
			pdeq_putr(env->worklist, chain_head->block);
		}

		/* a successor was already fixed (e.g. by coalescing): follow it */
		if (entry->next != NULL) {
			entry = entry->next;
			continue;
		}

		DBG((dbg, LEVEL_1, "deciding...\n"));

		/* no successor yet: pick the successor block with the highest
		 * execution frequency which has no predecessor yet */
		foreach_block_succ(block, edge) {
			ir_node            *succ_block = get_edge_src_irn(edge);
			blocksched_entry_t *succ_entry;
			double             execfreq;

			if (irn_visited(succ_block))
				continue;

			succ_entry = get_irn_link(succ_block);
			if (succ_entry->prev != NULL)
				continue;

			execfreq = get_block_execfreq(env->execfreqs, succ_block);
			if (execfreq > best_freq) {
				best_freq = execfreq;
				best_succ = succ_block;
			}
		}

		if (best_succ == NULL) {
			DBG((dbg, LEVEL_1, "pick from worklist\n"));

			do {
				if (pdeq_empty(env->worklist)) {
					DBG((dbg, LEVEL_1, "worklist empty\n"));
					return;
				}
				best_succ = pdeq_getl(env->worklist);
			} while (irn_visited(best_succ));
		}

		next_entry       = get_irn_link(best_succ);
		entry->next      = next_entry;
		next_entry->prev = entry;

		entry = next_entry;
	}
}

/**
 * Builds the complete schedule chain starting at the start block of
 * env->irg. A fresh visited counter and a temporary worklist are set up
 * for pick_block_successor() and torn down again afterwards.
 *
 * @return the schedule entry of the start block, i.e. the head of the chain
 */
static blocksched_entry_t *finish_block_schedule(blocksched_env_t *env)
{
	ir_graph           *irg  = env->irg;
	blocksched_entry_t *head = get_irn_link(get_irg_start_block(irg));

	set_using_visited(irg);
	inc_irg_visited(irg);

	env->worklist = new_pdeq();
	pick_block_successor(head, env);
	/* every queued block must have been consumed by now */
	assert(pdeq_empty(env->worklist));
	del_pdeq(env->worklist);

	clear_using_visited(irg);

	return head;
}

376
377
378
379
380
/**
 * Flattens the schedule chain starting at @p first into an array.
 *
 * @param env    unused
 * @param first  head of the schedule chain
 * @param count  number of entries in the chain; asserted to match exactly
 * @param obst   obstack the array is allocated on (via NEW_ARR_D)
 * @return the array holding the blocks in chain order
 */
static ir_node **create_blocksched_array(blocksched_env_t *env, blocksched_entry_t *first,
										int count, struct obstack* obst)
{
	ir_node            **blocks;
	blocksched_entry_t *cur    = first;
	int                n_done  = 0;

	(void) env;

	blocks = NEW_ARR_D(ir_node *, obst, count);
	DBG((dbg, LEVEL_1, "Blockschedule:\n"));

	while (cur != NULL) {
		assert(n_done < count);
		blocks[n_done] = cur->block;
		++n_done;
		DBG((dbg, LEVEL_1, "\t%+F\n", cur->block));
		cur = cur->next;
	}
	assert(n_done == count);

	return blocks;
}

/**
 * Computes a block schedule with the greedy strategy. When the selected
 * algorithm is BLOCKSCHED_NAIV the coalescing step is skipped.
 *
 * @param irg        the graph to schedule
 * @param execfreqs  execution frequencies of the blocks
 * @return the scheduled blocks as an array allocated on get_irg_obstack(irg)
 */
static ir_node **create_block_schedule_greedy(ir_graph *irg, ir_exec_freq *execfreqs)
{
	struct obstack     scratch;
	blocksched_env_t   env;
	blocksched_entry_t *head;
	ir_node            **schedule;

	/* the schedule entries only live until the array has been built */
	obstack_init(&scratch);

	env.irg        = irg;
	env.obst       = &scratch;
	env.execfreqs  = execfreqs;
	env.edges      = NEW_ARR_F(edge_t, 0);
	env.worklist   = NULL;
	env.blockcount = 0;

	/* collect edge execution frequencies */
	irg_block_walk_graph(irg, collect_egde_frequency, NULL, &env);

	/* sort interblock edges by execution frequency */
	qsort(env.edges, ARR_LEN(env.edges), sizeof(env.edges[0]), cmp_edges);

	(void)be_remove_empty_blocks(irg);

	if (algo != BLOCKSCHED_NAIV)
		coalesce_blocks(&env);

	head     = finish_block_schedule(&env);
	schedule = create_blocksched_array(&env, head, env.blockcount, get_irg_obstack(irg));

	DEL_ARR_F(env.edges);
	obstack_free(&scratch, NULL);

	return schedule;
}

/*
 *  ___ _     ____
 * |_ _| |   |  _ \
 *  | || |   | |_) |
 *  | || |___|  __/
 * |___|_____|_|
 *
 */

#ifdef WITH_ILP
typedef struct _ilp_edge_t {
444
445
446
	ir_node *block;   /**< source block */
	int     pos;      /**< number of cfg predecessor (target) */
	int     ilpvar;
447
448
449
450
} ilp_edge_t;

typedef struct _blocksched_ilp_env_t {
	blocksched_env_t env;
451
452
	ilp_edge_t       *ilpedges;
	lpp_t            *lpp;
453
454
455
456
457
458
459
460
461
462
463
464
} blocksched_ilp_env_t;

/**
 * Schedule entry used by the ILP scheduler. The first three members repeat
 * those of blocksched_entry_t in the same order; the entries are stored in
 * the irn link and also read through blocksched_entry_t pointers (see
 * coalesce_blocks_ilp()), so the common prefix has to stay in sync.
 */
typedef struct _blocksched_ilp_entry_t {
	ir_node *block;                     /**< the block this entry describes */
	struct _blocksched_entry_t *next;   /**< entry placed directly after this one, or NULL */
	struct _blocksched_entry_t *prev;   /**< entry placed directly before this one, or NULL */

	int out_cst;                        /**< constraint over the edges leaving the block, as returned by lpp_add_cst_uniq() */
} blocksched_ilp_entry_t;

/**
 * Appends an edge to env->ilpedges and creates a binary ILP variable named
 * "edge<index>" for it, with @p execfreq passed on to lpp_add_var_default().
 *
 * @param block     block whose cfg input the edge enters
 * @param pos       index of the cfg predecessor the edge comes from
 * @param execfreq  frequency handed to the ILP variable
 * @param env       the ILP scheduler environment
 * @return the index of the new edge inside env->ilpedges
 */
static int add_ilp_edge(ir_node *block, int pos, double execfreq, blocksched_ilp_env_t *env)
{
	const int  idx = ARR_LEN(env->ilpedges);
	char       varname[64];
	ilp_edge_t new_edge;

	snprintf(varname, sizeof(varname), "edge%d", idx);

	new_edge.block  = block;
	new_edge.pos    = pos;
	new_edge.ilpvar = lpp_add_var_default(env->lpp, varname, lpp_binary, execfreq, 1.0);

	ARR_APP1(ilp_edge_t, env->ilpedges, new_edge);
	return idx;
}

/**
 * Block walker callback of the ILP scheduler: creates the schedule entry of
 * @p block together with its "block_out_constr_<nr>" constraint, and adds
 * one ILP edge per cfg predecessor.
 *
 * A block with a single predecessor gets one edge carrying the block's own
 * execution frequency. Otherwise a "block_in_constr_<nr>" constraint is
 * created and every incoming edge (carrying the predecessor block's
 * frequency) is added to it with factor 1.0. The start block gets an entry
 * and an out constraint but no edges.
 *
 * @param block  the block currently visited by the walker
 * @param data   the blocksched_ilp_env_t of the running scheduler
 */
static void collect_egde_frequency_ilp(ir_node *block, void *data)
{
	blocksched_ilp_env_t   *env        = data;
	ir_graph               *irg        = env->env.irg;
	ir_node                *startblock = get_irg_start_block(irg);
	int                    arity;
	lpp_cst_t              cst;
	char                   name[64];
	int                    out_count;
	blocksched_ilp_entry_t *entry;

	snprintf(name, sizeof(name), "block_out_constr_%ld", get_irn_node_nr(block));
	out_count = get_irn_n_edges_kind(block, EDGE_KIND_BLOCK);

	entry          = obstack_alloc(env->env.obst, sizeof(entry[0]));
	entry->block   = block;
	entry->next    = NULL;
	entry->prev    = NULL;
	entry->out_cst = lpp_add_cst_uniq(env->lpp, name, lpp_greater, out_count - 1);
	set_irn_link(block, entry);

	if (block == startblock)
		return;

	arity = get_irn_arity(block);
	if (arity == 1) {
		double execfreq = get_block_execfreq(env->env.execfreqs, block);
		add_ilp_edge(block, 0, execfreq, env);
	} else {
		int i;

		snprintf(name, sizeof(name), "block_in_constr_%ld", get_irn_node_nr(block));
		cst = lpp_add_cst_uniq(env->lpp, name, lpp_greater, arity - 1);

		for (i = 0; i < arity; ++i) {
			ir_node    *pred_block = get_Block_cfgpred_block(block, i);
			double     execfreq    = get_block_execfreq(env->env.execfreqs, pred_block);
			int        edgenum     = add_ilp_edge(block, i, execfreq, env);
			/* look the edge up only after add_ilp_edge(): appending may
			 * move the flexible array */
			ilp_edge_t *edge       = &env->ilpedges[edgenum];

			lpp_set_factor_fast(env->lpp, cst, edge->ilpvar, 1.0);
		}
	}
}


/**
 * Completes the ILP, solves it and applies the solution to the schedule
 * entries.
 *
 * First every edge variable is added with factor 1.0 to the out constraint
 * of the edge's predecessor block. After solving, every edge whose variable
 * is 0 in the solution (is_jump == 0) links the entries of its two blocks
 * as fallthrough (pred->next = block, block->prev = pred).
 *
 * @param env  the ILP scheduler environment
 */
static void coalesce_blocks_ilp(blocksched_ilp_env_t *env)
{
	int  i;
	int  edge_count = ARR_LEN(env->ilpedges);

	/* complete out constraints */
	for (i = 0; i < edge_count; ++i) {
		const ilp_edge_t       *edge  = &env->ilpedges[i];
		ir_node                *block = edge->block;
		ir_node                *pred;
		blocksched_ilp_entry_t *entry;

		/* the block might have been removed already... */
		if (is_Bad(get_Block_cfgpred(block, 0)))
			continue;

		pred  = get_Block_cfgpred_block(block, edge->pos);
		entry = get_irn_link(pred);

		DBG((dbg, LEVEL_1, "Adding out cst to %+F from %+F,%d\n",
				  pred, block, edge->pos));
		lpp_set_factor_fast(env->lpp, entry->out_cst, edge->ilpvar, 1.0);
	}

#if 0
	{
		FILE *f;
		char fname[256];
		lpp_dump(env->lpp, "lpp.out");
		snprintf(fname, sizeof(fname), "lpp_%s.plain", get_irg_dump_name(env->env.irg));
		f = fopen(fname, "w");
		lpp_dump_plain(env->lpp, f);
		fclose(f);
	}
#endif

	/* TODO: the solver host and solver name are hard-coded here; they
	 * should come from the backend options (ilp_server / ilp_solver) */
	lpp_solve_net(env->lpp, "i44pc52", "cplex");
	assert(lpp_is_sol_valid(env->lpp));

	/* Apply results to edges */
	for (i = 0; i < edge_count; ++i) {
		const ilp_edge_t   *edge  = &env->ilpedges[i];
		ir_node            *block = edge->block;
		ir_node            *pred;
		int                is_jump;
		blocksched_entry_t *entry;
		blocksched_entry_t *pred_entry;

		/* the block might have been removed already... */
		if (is_Bad(get_Block_cfgpred(block, 0)))
			continue;

		/* The variable is binary, but solvers report floating point
		 * values: round with a 0.5 threshold instead of truncating, so
		 * that e.g. 0.999999 is not misread as 0. */
		is_jump = lpp_get_var_sol(env->lpp, edge->ilpvar) > 0.5;
		if (is_jump)
			continue;

		pred       = get_Block_cfgpred_block(block, edge->pos);
		entry      = get_irn_link(block);
		pred_entry = get_irn_link(pred);

		assert(entry->prev == NULL && pred_entry->next == NULL);
		entry->prev      = pred_entry;
		pred_entry->next = entry;
	}
}

/**
 * Computes a block schedule by formulating the fallthrough selection as an
 * ILP ("blockschedule", minimizing, time limit 20, log to stdout).
 *
 * @param irg        the graph to schedule
 * @param execfreqs  execution frequencies of the blocks
 * @return the scheduled blocks as an array allocated on get_irg_obstack(irg)
 */
static ir_node **create_block_schedule_ilp(ir_graph *irg, ir_exec_freq *execfreqs)
{
	struct obstack       scratch;
	blocksched_ilp_env_t ilp_env;
	blocksched_entry_t   *head;
	ir_node              **schedule;

	/* the schedule entries only live until the array has been built */
	obstack_init(&scratch);

	ilp_env.env.irg        = irg;
	ilp_env.env.obst       = &scratch;
	ilp_env.env.execfreqs  = execfreqs;
	ilp_env.env.worklist   = NULL;
	ilp_env.env.blockcount = 0;
	ilp_env.ilpedges       = NEW_ARR_F(ilp_edge_t, 0);

	ilp_env.lpp = new_lpp("blockschedule", lpp_minimize);
	lpp_set_time_limit(ilp_env.lpp, 20);
	lpp_set_log(ilp_env.lpp, stdout);

	/* create the entries, variables and constraints for all blocks */
	irg_block_walk_graph(irg, collect_egde_frequency_ilp, NULL, &ilp_env);

	(void)be_remove_empty_blocks(irg);
	coalesce_blocks_ilp(&ilp_env);

	head     = finish_block_schedule(&ilp_env.env);
	schedule = create_blocksched_array(&ilp_env.env, head, ilp_env.env.blockcount, get_irg_obstack(irg));

	DEL_ARR_F(ilp_env.ilpedges);
	free_lpp(ilp_env.lpp);
	obstack_free(&scratch, NULL);

	return schedule;
}
Christian Würdig's avatar
Christian Würdig committed
631
#endif /* WITH_ILP */
632
633
634
635
636
637
638
639
640
641
642
643

/*
 *  _____      _   ____  ____
 * | ____|_  _| |_| __ )| __ )
 * |  _| \ \/ / __|  _ \|  _ \
 * | |___ >  <| |_| |_) | |_) |
 * |_____/_/\_\\__|____/|____/
 *
 */

/** A simple forward single linked list. */
typedef struct {
644
645
	ir_node  *start;   /**< start of the list */
	ir_node  *end;     /**< last block in the list */
646
647
648
649
	unsigned n_blks;  /**< number of blocks in the list */
} anchor;

/**
 * Appends @p block to @p list. The previous tail (if any) gets its irn
 * link set to the new block; the link of the new block itself is not
 * touched.
 */
static void add_block(anchor *list, ir_node *block) {
	if (list->start != NULL) {
		/* chain the new block behind the current tail */
		set_irn_link(list->end, block);
	} else {
		/* first block: it is the head as well */
		list->start = block;
	}

	list->end = block;
	list->n_blks++;
}

/**
 * Appends all blocks of the extended basic block of @p leader_block to
 * @p list and then recurses into the extended basic blocks of the block
 * successors: first those of the last block, then those of the other
 * blocks in index order. Already visited extended basic blocks are skipped.
 */
static void create_block_list(ir_node *leader_block, anchor *list) {
	ir_extblk       *extbb = get_Block_extbb(leader_block);
	ir_node         *blk   = NULL;
	const ir_edge_t *edge;
	int             n_blocks;
	int             idx;

	if (extbb_visited(extbb))
		return;
	mark_extbb_visited(extbb);

	n_blocks = get_extbb_n_blocks(extbb);
	for (idx = 0; idx < n_blocks; ++idx) {
		blk = get_extbb_block(extbb, idx);
		add_block(list, blk);
	}

	/* an extended basic block is expected to contain at least one block */
	assert(blk != NULL);

	/* pick successor extbbs: blk is the last block of the extbb here */
	foreach_block_succ(blk, edge) {
		create_block_list(get_edge_src_irn(edge), list);
	}

	/* now the successors of all blocks but the last one */
	for (idx = 0; idx < n_blocks - 1; ++idx) {
		blk = get_extbb_block(extbb, idx);

		foreach_block_succ(blk, edge) {
			create_block_list(get_edge_src_irn(edge), list);
		}
	}
}

/* defined outside of this file */
void compute_extbb_execfreqs(ir_graph *irg, ir_exec_freq *execfreqs);

/**
 * Calculates a block schedule based on extended basic blocks.
 *
 * The extended basic blocks are (re)computed from the execution
 * frequencies, the blocks are collected into a list chained through their
 * irn links (starting at the start block of the irg) and the list is then
 * copied into an array.
 *
 * @param irg        the graph to schedule
 * @param execfreqs  execution frequencies of the blocks
 * @return the scheduled blocks as an array allocated on irg->obst
 */
static ir_node **create_extbb_block_schedule(ir_graph *irg, ir_exec_freq *execfreqs)
{
	anchor list;
	ir_node **blk_list, *b;
	unsigned i;

	/* schedule extended basic blocks */
	compute_extbb_execfreqs(irg, execfreqs);

	list.start  = NULL;
	list.end    = NULL;
	list.n_blks = 0;

	set_using_irn_link(irg);
	set_using_visited(irg);
	inc_irg_block_visited(irg);

	create_block_list(get_irg_start_block(irg), &list);

	/** create an array, so we can go forward and backward */
	blk_list = NEW_ARR_D(ir_node *, irg->obst,list.n_blks);

	/* add_block() never resets the irn link of the tail block, so that link
	 * may still hold an old value: bound the walk by the number of collected
	 * blocks instead of relying on a NULL link alone */
	for (i = 0, b = list.start; b != NULL && i < list.n_blks; ++i) {
		blk_list[i] = b;
		b = get_irn_link(b);
	}

	clear_using_irn_link(irg);
	clear_using_visited(irg);

	return blk_list;
}

/*
 *  __  __       _
 * |  \/  | __ _(_)_ __
 * | |\/| |/ _` | | '_ \
 * | |  | | (_| | | | | |
 * |_|  |_|\__,_|_|_| |_|
 *
 */
742
void be_init_blocksched(void)
743
{
744
745
	lc_opt_entry_t *be_grp = lc_opt_get_grp(firm_opt_get_root(), "be");
	lc_opt_entry_t *blocksched_grp = lc_opt_get_grp(be_grp, "blocksched");
746
747

	lc_opt_add_table(blocksched_grp, be_blocksched_options);
748

Matthias Braun's avatar
Matthias Braun committed
749
	FIRM_DBG_REGISTER(dbg, "firm.be.blocksched");
750
}
751
752

BE_REGISTER_MODULE_CONSTRUCTOR(be_init_blocksched);
753
754
755
756
757
758
759
760
761
762
763
764

/**
 * Creates a block schedule for @p irg with the algorithm selected through
 * the "algo" option. The naive and the greedy variant share one
 * implementation; the ILP variant is only available when built WITH_ILP.
 *
 * @param irg        the graph to schedule
 * @param execfreqs  execution frequencies of the blocks
 * @return the array of scheduled blocks
 */
ir_node **be_create_block_schedule(ir_graph *irg, ir_exec_freq *execfreqs)
{
	if (algo == BLOCKSCHED_GREEDY || algo == BLOCKSCHED_NAIV)
		return create_block_schedule_greedy(irg, execfreqs);

	if (algo == BLOCKSCHED_EXTBB)
		return create_extbb_block_schedule(irg, execfreqs);

#ifdef WITH_ILP
	if (algo == BLOCKSCHED_ILP)
		return create_block_schedule_ilp(irg, execfreqs);
#endif /* WITH_ILP */

	assert(0 && "unknown blocksched algo");
	return NULL;
}