nsz Git - libfirm/blob - ir/be/beblocksched.c

   1 /*
   2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
   3  *
   4  * This file is part of libFirm.
   5  *
   6  * This file may be distributed and/or modified under the terms of the
   7  * GNU General Public License version 2 as published by the Free Software
   8  * Foundation and appearing in the file LICENSE.GPL included in the
   9  * packaging of this file.
  10  *
  11  * Licensees holding valid libFirm Professional Edition licenses may use
  12  * this file in accordance with the libFirm Commercial License.
  13  * Agreement provided with the Software.
  14  *
  15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  17  * PURPOSE.
  18  */
  19
  20 /**
  21  * @file
  22  * @brief       Block-scheduling strategies.
  23  * @author      Matthias Braun, Christoph Mallon
  24  * @date        27.09.2006
  25  * @version     $Id$
  26  *
 * The greedy (and ILP) algorithms here work on the assumption that we want
 * to turn as many jumps into fallthroughs as possible (executed jumps,
 * actually, so we have to look at the execution frequencies). The algorithms
 * do this by collecting the execution frequencies of all branches (which is
 * easily possible when all critical edges are split) and then removing
 * critical edges where possible, as we neither need nor want them anymore.
 * The algorithms then try to change as many edges to fallthroughs as possible;
 * this is done by setting next and prev pointers on blocks. The greedy
 * algorithm sorts the edges by execution frequency and tries to transform
 * them into fallthroughs in this order.
  36  */
  37 #include "config.h"
  38
  39 #include "beblocksched.h"
  40
  41 #include <stdlib.h>
  42
  43 #include "array.h"
  44 #include "pdeq.h"
  45
  46 #include "iredges.h"
  47 #include "irgwalk.h"
  48 #include "irnode_t.h"
  49 #include "irgraph_t.h"
  50 #include "irloop.h"
  51 #include "irprintf.h"
  52 #include "execfreq.h"
  53 #include "irdump_t.h"
  54 #include "irtools.h"
  55 #include "debug.h"
  56 #include "beirgmod.h"
  57 #include "bemodule.h"
  58 #include "be.h"
  59 #include "error.h"
  60
  61 #include "lc_opts.h"
  62 #include "lc_opts_enum.h"
  63
  64 #ifdef WITH_ILP
  65 #include <lpp/lpp.h>
  66 #include <lpp/lpp_net.h>
  67 #endif /* WITH_ILP */
  68
  69 DEBUG_ONLY(static firm_dbg_module_t *dbg = NULL;)
  70
  71 typedef enum _blocksched_algos_t {
  72         BLOCKSCHED_NAIV, BLOCKSCHED_EXTBB, BLOCKSCHED_GREEDY, BLOCKSCHED_ILP
  73 } blocksched_algos_t;
  74
  75 static int algo = BLOCKSCHED_GREEDY;
  76
  77 static const lc_opt_enum_int_items_t blockschedalgo_items[] = {
  78         { "naiv",       BLOCKSCHED_NAIV },
  79         { "extbb",      BLOCKSCHED_EXTBB },
  80         { "greedy", BLOCKSCHED_GREEDY },
  81 #ifdef WITH_ILP
  82         { "ilp",    BLOCKSCHED_ILP },
  83 #endif /* WITH_ILP */
  84         { NULL,     0 }
  85 };
  86
  87 static lc_opt_enum_int_var_t algo_var = {
  88         &algo, blockschedalgo_items
  89 };
  90
  91 static const lc_opt_table_entry_t be_blocksched_options[] = {
  92         LC_OPT_ENT_ENUM_INT ("algo", "the block scheduling algorithm", &algo_var),
  93         LC_OPT_LAST
  94 };
  95
  96 /*
  97  *   ____                   _
  98  *  / ___|_ __ ___  ___  __| |_   _
  99  * | |  _| '__/ _ \/ _ \/ _` | | | |
 100  * | |_| | | |  __/  __/ (_| | |_| |
 101  *  \____|_|  \___|\___|\__,_|\__, |
 102  *                            |___/
 103  */
 104
 105 typedef struct _blocksched_entry_t {
 106         ir_node *block;
 107         struct _blocksched_entry_t *next;
 108         struct _blocksched_entry_t *prev;
 109 } blocksched_entry_t;
 110
 111 typedef struct _edge_t {
 112         ir_node *block;             /**< source block */
 113         int     pos;                /**< number of cfg predecessor (target) */
 114         double  execfreq;           /**< the frequency */
 115         int     highest_execfreq;   /**< flag that indicates whether this edge is the edge with the highest
 116                                          execfreq pointing away from this block */
 117 } edge_t;
 118
 119 typedef struct _blocksched_env_t {
 120         ir_graph       *irg;
 121         struct obstack *obst;
 122         ir_exec_freq   *execfreqs;
 123         edge_t         *edges;
 124         pdeq           *worklist;
 125         int            blockcount;
 126 } blocksched_env_t;
 127
 128 /**
 129  * Collect cfg frequencies of all edges between blocks.
 130  * Also determines edge with highest frequency.
 131  */
 132 static void collect_egde_frequency(ir_node *block, void *data)
 133 {
 134         blocksched_env_t   *env = data;
 135         int                arity;
 136         edge_t             edge;
 137         blocksched_entry_t *entry;
 138
 139         entry        = obstack_alloc(env->obst, sizeof(entry[0]));
 140         entry->block = block;
 141         entry->next  = NULL;
 142         entry->prev  = NULL;
 143         set_irn_link(block, entry);
 144
 145         arity = get_Block_n_cfgpreds(block);
 146
 147         if (arity == 0) {
 148                 assert(block == get_irg_start_block(env->irg)
 149                                 || block == get_irg_end_block(env->irg));
 150                 /* must be the start block (or end-block for endless loops), nothing to
 151                  * do here */
 152                 return;
 153         } else if (arity == 1) {
 154                 edge.block            = block;
 155                 edge.pos              = 0;
 156                 edge.execfreq         = get_block_execfreq(env->execfreqs, block);
 157                 edge.highest_execfreq = 1;
 158                 ARR_APP1(edge_t, env->edges, edge);
 159         } else {
 160                 int    i;
 161                 double highest_execfreq = -1.0;
 162                 int    highest_edge_num = -1;
 163
 164                 edge.block = block;
 165                 for (i = 0; i < arity; ++i) {
 166                         double  execfreq;
 167                         ir_node *pred_block = get_Block_cfgpred_block(block, i);
 168
 169                         execfreq = get_block_execfreq(env->execfreqs, pred_block);
 170
 171                         edge.pos              = i;
 172                         edge.execfreq         = execfreq;
 173                         edge.highest_execfreq = 0;
 174                         ARR_APP1(edge_t, env->edges, edge);
 175
 176                         if (execfreq > highest_execfreq) {
 177                                 highest_execfreq = execfreq;
 178                                 highest_edge_num = ARR_LEN(env->edges) - 1;
 179                         }
 180                 }
 181
 182                 if(highest_edge_num >= 0)
 183                         env->edges[highest_edge_num].highest_execfreq = 1;
 184         }
 185 }
 186
 187 static int cmp_edges(const void *d1, const void *d2)
 188 {
 189         const edge_t *e1 = d1;
 190         const edge_t *e2 = d2;
 191
 192         return QSORT_CMP(e2->execfreq, e1->execfreq);
 193 }
 194
 195 static void coalesce_blocks(blocksched_env_t *env)
 196 {
 197         int i;
 198         int edge_count = ARR_LEN(env->edges);
 199
 200         /* run1: only look at jumps */
 201         for (i = 0; i < edge_count; ++i) {
 202                 const edge_t *edge  = &env->edges[i];
 203                 ir_node      *block = edge->block;
 204                 int           pos   = edge->pos;
 205                 ir_node      *pred_block;
 206                 blocksched_entry_t *entry, *pred_entry;
 207
 208                 /* only check edge with highest frequency */
 209                 if (! edge->highest_execfreq)
 210                         continue;
 211
 212                 /* the block might have been removed already... */
 213                 if (is_Bad(get_Block_cfgpred(block, 0)))
 214                         continue;
 215
 216                 pred_block = get_Block_cfgpred_block(block, pos);
 217                 entry      = get_irn_link(block);
 218                 pred_entry = get_irn_link(pred_block);
 219
 220                 if (pred_entry->next != NULL || entry->prev != NULL)
 221                         continue;
 222
 223                 /* only coalesce jumps */
 224                 if (get_block_succ_next(pred_block, get_block_succ_first(pred_block)) != NULL)
 225                         continue;
 226
 227                 /* schedule the 2 blocks behind each other */
 228                 DBG((dbg, LEVEL_1, "Coalesce (Jump) %+F -> %+F (%.3g)\n",
 229                            pred_entry->block, entry->block, edge->execfreq));
 230                 pred_entry->next = entry;
 231                 entry->prev      = pred_entry;
 232         }
 233
 234         /* run2: remaining edges */
 235         for (i = 0; i < edge_count; ++i) {
 236                 const edge_t *edge  = &env->edges[i];
 237                 ir_node      *block = edge->block;
 238                 int           pos   = edge->pos;
 239                 ir_node      *pred_block;
 240                 blocksched_entry_t *entry, *pred_entry;
 241
 242                 /* the block might have been removed already... */
 243                 if (is_Bad(get_Block_cfgpred(block, 0)))
 244                         continue;
 245
 246                 /* we can't do fallthroughs in backedges */
 247                 if (is_backedge(block, pos))
 248                         continue;
 249
 250                 pred_block = get_Block_cfgpred_block(block, pos);
 251                 entry      = get_irn_link(block);
 252                 pred_entry = get_irn_link(pred_block);
 253
 254                 /* is 1 of the blocks already attached to another block? */
 255                 if (pred_entry->next != NULL || entry->prev != NULL)
 256                         continue;
 257
 258                 /* schedule the 2 blocks behind each other */
 259                 DBG((dbg, LEVEL_1, "Coalesce (CondJump) %+F -> %+F (%.3g)\n",
 260                            pred_entry->block, entry->block, edge->execfreq));
 261                 pred_entry->next = entry;
 262                 entry->prev      = pred_entry;
 263         }
 264 }
 265
 266 static void pick_block_successor(blocksched_entry_t *entry, blocksched_env_t *env)
 267 {
 268         ir_node            *block = entry->block;
 269         ir_node            *succ  = NULL;
 270         blocksched_entry_t *succ_entry;
 271         const ir_edge_t    *edge;
 272         double             best_succ_execfreq;
 273
 274         if (irn_visited_else_mark(block))
 275                 return;
 276
 277         env->blockcount++;
 278
 279         DBG((dbg, LEVEL_1, "Pick succ of %+F\n", block));
 280
 281         /* put all successors into the worklist */
 282         foreach_block_succ(block, edge) {
 283                 ir_node *succ_block = get_edge_src_irn(edge);
 284
 285                 if (irn_visited(succ_block))
 286                         continue;
 287
 288                 /* we only need to put the first of a series of already connected
 289                  * blocks into the worklist */
 290                 succ_entry = get_irn_link(succ_block);
 291                 while (succ_entry->prev != NULL) {
 292                         /* break cycles... */
 293                         if (succ_entry->prev->block == succ_block) {
 294                                 succ_entry->prev->next = NULL;
 295                                 succ_entry->prev       = NULL;
 296                                 break;
 297                         }
 298                         succ_entry = succ_entry->prev;
 299                 };
 300
 301                 if (irn_visited(succ_entry->block))
 302                         continue;
 303
 304                 DBG((dbg, LEVEL_1, "Put %+F into worklist\n", succ_entry->block));
 305                 pdeq_putr(env->worklist, succ_entry->block);
 306         }
 307
 308         if (entry->next != NULL) {
 309                 pick_block_successor(entry->next, env);
 310                 return;
 311         }
 312
 313         DBG((dbg, LEVEL_1, "deciding...\n"));
 314         best_succ_execfreq = -1;
 315
 316         /* no successor yet: pick the successor block with the highest execution
 317          * frequency which has no predecessor yet */
 318
 319         foreach_block_succ(block, edge) {
 320                 ir_node *succ_block = get_edge_src_irn(edge);
 321                 double  execfreq;
 322
 323                 if (irn_visited(succ_block))
 324                         continue;
 325
 326                 succ_entry = get_irn_link(succ_block);
 327                 if (succ_entry->prev != NULL)
 328                         continue;
 329
 330                 execfreq = get_block_execfreq(env->execfreqs, succ_block);
 331                 if (execfreq > best_succ_execfreq) {
 332                         best_succ_execfreq = execfreq;
 333                         succ = succ_block;
 334                 }
 335         }
 336
 337         if (succ == NULL) {
 338                 DBG((dbg, LEVEL_1, "pick from worklist\n"));
 339
 340                 do {
 341                         if (pdeq_empty(env->worklist)) {
 342                                 DBG((dbg, LEVEL_1, "worklist empty\n"));
 343                                 return;
 344                         }
 345                         succ = pdeq_getl(env->worklist);
 346                 } while (irn_visited(succ));
 347         }
 348
 349         succ_entry       = get_irn_link(succ);
 350         entry->next      = succ_entry;
 351         succ_entry->prev = entry;
 352
 353         pick_block_successor(succ_entry, env);
 354 }
 355
 356 static blocksched_entry_t *finish_block_schedule(blocksched_env_t *env)
 357 {
 358         ir_graph           *irg        = env->irg;
 359         ir_node            *startblock = get_irg_start_block(irg);
 360         blocksched_entry_t *entry      = get_irn_link(startblock);
 361
 362         ir_reserve_resources(irg, IR_RESOURCE_IRN_VISITED);
 363         inc_irg_visited(irg);
 364
 365         env->worklist = new_pdeq();
 366         pick_block_successor(entry, env);
 367         assert(pdeq_empty(env->worklist));
 368         del_pdeq(env->worklist);
 369
 370         ir_free_resources(irg, IR_RESOURCE_IRN_VISITED);
 371
 372         return entry;
 373 }
 374
 375 static ir_node **create_blocksched_array(blocksched_env_t *env, blocksched_entry_t *first,
 376                                                                                 int count, struct obstack* obst)
 377 {
 378         int                i = 0;
 379         ir_node            **block_list;
 380         blocksched_entry_t *entry;
 381         (void) env;
 382
 383         block_list = NEW_ARR_D(ir_node *, obst, count);
 384         DBG((dbg, LEVEL_1, "Blockschedule:\n"));
 385
 386         for (entry = first; entry != NULL; entry = entry->next) {
 387                 assert(i < count);
 388                 block_list[i++] = entry->block;
 389                 DBG((dbg, LEVEL_1, "\t%+F\n", entry->block));
 390         }
 391         assert(i == count);
 392
 393         return block_list;
 394 }
 395
 396 static ir_node **create_block_schedule_greedy(ir_graph *irg, ir_exec_freq *execfreqs)
 397 {
 398         blocksched_env_t   env;
 399         struct obstack     obst;
 400         blocksched_entry_t *start_entry;
 401         ir_node            **block_list;
 402
 403         obstack_init(&obst);
 404
 405         env.irg        = irg;
 406         env.obst       = &obst;
 407         env.execfreqs  = execfreqs;
 408         env.edges      = NEW_ARR_F(edge_t, 0);
 409         env.worklist   = NULL;
 410         env.blockcount = 0;
 411
 412         // collect edge execution frequencies
 413         irg_block_walk_graph(irg, collect_egde_frequency, NULL, &env);
 414
 415         // sort interblock edges by execution frequency
 416         qsort(env.edges, ARR_LEN(env.edges), sizeof(env.edges[0]), cmp_edges);
 417
 418         (void)be_remove_empty_blocks(irg);
 419
 420         if (algo != BLOCKSCHED_NAIV)
 421                 coalesce_blocks(&env);
 422
 423         start_entry = finish_block_schedule(&env);
 424         block_list  = create_blocksched_array(&env, start_entry, env.blockcount, get_irg_obstack(irg));
 425
 426         DEL_ARR_F(env.edges);
 427         obstack_free(&obst, NULL);
 428
 429         return block_list;
 430 }
 431
 432 /*
 433  *  ___ _     ____
 434  * |_ _| |   |  _ \
 435  *  | || |   | |_) |
 436  *  | || |___|  __/
 437  * |___|_____|_|
 438  *
 439  */
 440
 441 #ifdef WITH_ILP
 442 typedef struct _ilp_edge_t {
 443         ir_node *block;   /**< source block */
 444         int     pos;      /**< number of cfg predecessor (target) */
 445         int     ilpvar;
 446 } ilp_edge_t;
 447
 448 typedef struct _blocksched_ilp_env_t {
 449         blocksched_env_t env;
 450         ilp_edge_t       *ilpedges;
 451         lpp_t            *lpp;
 452 } blocksched_ilp_env_t;
 453
 454 typedef struct _blocksched_ilp_entry_t {
 455         ir_node *block;
 456         struct _blocksched_entry_t *next;
 457         struct _blocksched_entry_t *prev;
 458
 459         int out_cst;
 460 } blocksched_ilp_entry_t;
 461
 462 static int add_ilp_edge(ir_node *block, int pos, double execfreq, blocksched_ilp_env_t *env)
 463 {
 464         char       name[64];
 465         ilp_edge_t edge;
 466         int        edgeidx = ARR_LEN(env->ilpedges);
 467
 468         snprintf(name, sizeof(name), "edge%d", edgeidx);
 469
 470         edge.block  = block;
 471         edge.pos    = pos;
 472         edge.ilpvar = lpp_add_var_default(env->lpp, name, lpp_binary, execfreq, 1.0);
 473
 474         ARR_APP1(ilp_edge_t, env->ilpedges, edge);
 475         return edgeidx;
 476 }
 477
 478 static void collect_egde_frequency_ilp(ir_node *block, void *data)
 479 {
 480         blocksched_ilp_env_t *env        = data;
 481         ir_graph             *irg        = env->env.irg;
 482         ir_node              *startblock = get_irg_start_block(irg);
 483         int                  arity;
 484         lpp_cst_t            cst;
 485         char                 name[64];
 486         int                  out_count;
 487         blocksched_ilp_entry_t *entry;
 488
 489         snprintf(name, sizeof(name), "block_out_constr_%ld", get_irn_node_nr(block));
 490         out_count = get_irn_n_edges_kind(block, EDGE_KIND_BLOCK);
 491
 492         entry          = obstack_alloc(env->env.obst, sizeof(entry[0]));
 493         entry->block   = block;
 494         entry->next    = NULL;
 495         entry->prev    = NULL;
 496         entry->out_cst = lpp_add_cst_uniq(env->lpp, name, lpp_greater, out_count - 1);
 497         set_irn_link(block, entry);
 498
 499         if (block == startblock)
 500                 return;
 501
 502         arity = get_irn_arity(block);
 503         if (arity == 1) {
 504                 double execfreq = get_block_execfreq(env->env.execfreqs, block);
 505                 add_ilp_edge(block, 0, execfreq, env);
 506         }
 507         else {
 508                 int i;
 509
 510                 snprintf(name, sizeof(name), "block_in_constr_%ld", get_irn_node_nr(block));
 511                 cst = lpp_add_cst_uniq(env->lpp, name, lpp_greater, arity - 1);
 512
 513                 for (i = 0; i < arity; ++i) {
 514                         double     execfreq;
 515                         int        edgenum;
 516                         ilp_edge_t *edge;
 517                         ir_node    *pred_block = get_Block_cfgpred_block(block, i);
 518
 519                         execfreq = get_block_execfreq(env->env.execfreqs, pred_block);
 520                         edgenum  = add_ilp_edge(block, i, execfreq, env);
 521                         edge     = &env->ilpedges[edgenum];
 522                         lpp_set_factor_fast(env->lpp, cst, edge->ilpvar, 1.0);
 523                 }
 524         }
 525 }
 526
 527
 528 static void coalesce_blocks_ilp(blocksched_ilp_env_t *env)
 529 {
 530         int  i;
 531         int  edge_count = ARR_LEN(env->ilpedges);
 532
 533         /* complete out constraints */
 534         for(i = 0; i < edge_count; ++i) {
 535                 const ilp_edge_t *edge  = &env->ilpedges[i];
 536                 ir_node          *block = edge->block;
 537                 ir_node          *pred;
 538                 blocksched_ilp_entry_t *entry;
 539
 540                 /* the block might have been removed already... */
 541                 if (is_Bad(get_Block_cfgpred(block, 0)))
 542                         continue;
 543
 544                 pred  = get_Block_cfgpred_block(block, edge->pos);
 545                 entry = get_irn_link(pred);
 546
 547                 DBG((dbg, LEVEL_1, "Adding out cst to %+F from %+F,%d\n",
 548                                   pred, block, edge->pos));
 549                 lpp_set_factor_fast(env->lpp, entry->out_cst, edge->ilpvar, 1.0);
 550         }
 551
 552 #if 0
 553         {
 554                 FILE *f;
 555                 char fname[256];
 556                 lpp_dump(env->lpp, "lpp.out");
 557                 snprintf(fname, sizeof(fname), "lpp_%s.plain", get_irg_dump_name(env->env.irg));
 558                 f = fopen(fname, "w");
 559                 lpp_dump_plain(env->lpp, f);
 560                 fclose(f);
 561         }
 562 #endif
 563
 564         //lpp_solve_net(env->lpp, main_env->options->ilp_server, main_env->options->ilp_solver);
 565         lpp_solve_net(env->lpp, "i44pc52", "cplex");
 566         assert(lpp_is_sol_valid(env->lpp));
 567
 568         /* Apply results to edges */
 569         for (i = 0; i < edge_count; ++i) {
 570                 const ilp_edge_t   *edge  = &env->ilpedges[i];
 571                 ir_node            *block = edge->block;
 572                 ir_node            *pred;
 573                 int                is_jump;
 574                 blocksched_entry_t *entry;
 575                 blocksched_entry_t *pred_entry;
 576
 577                 /* the block might have been removed already... */
 578                 if (is_Bad(get_Block_cfgpred(block, 0)))
 579                         continue;
 580
 581                 is_jump = (int)lpp_get_var_sol(env->lpp, edge->ilpvar);
 582                 if (is_jump)
 583                         continue;
 584
 585                 pred       = get_Block_cfgpred_block(block, edge->pos);
 586                 entry      = get_irn_link(block);
 587                 pred_entry = get_irn_link(pred);
 588
 589                 assert(entry->prev == NULL && pred_entry->next == NULL);
 590                 entry->prev      = pred_entry;
 591                 pred_entry->next = entry;
 592         }
 593 }
 594
 595 static ir_node **create_block_schedule_ilp(ir_graph *irg, ir_exec_freq *execfreqs)
 596 {
 597         blocksched_ilp_env_t env;
 598         struct obstack       obst;
 599         blocksched_entry_t   *start_entry;
 600         ir_node              **block_list;
 601
 602         obstack_init(&obst);
 603
 604         env.env.irg        = irg;
 605         env.env.obst       = &obst;
 606         env.env.execfreqs  = execfreqs;
 607         env.env.worklist   = NULL;
 608         env.env.blockcount = 0;
 609         env.ilpedges       = NEW_ARR_F(ilp_edge_t, 0);
 610
 611         env.lpp = new_lpp("blockschedule", lpp_minimize);
 612         lpp_set_time_limit(env.lpp, 20);
 613         lpp_set_log(env.lpp, stdout);
 614
 615         irg_block_walk_graph(irg, collect_egde_frequency_ilp, NULL, &env);
 616
 617         (void)be_remove_empty_blocks(irg);
 618         coalesce_blocks_ilp(&env);
 619
 620         start_entry = finish_block_schedule(&env.env);
 621         block_list  = create_blocksched_array(&env.env, start_entry, env.env.blockcount, get_irg_obstack(irg));
 622
 623         DEL_ARR_F(env.ilpedges);
 624         free_lpp(env.lpp);
 625         obstack_free(&obst, NULL);
 626
 627         return block_list;
 628 }
 629 #endif /* WITH_ILP */
 630
 631 /*
 632  *  _____      _   ____  ____
 633  * | ____|_  _| |_| __ )| __ )
 634  * |  _| \ \/ / __|  _ \|  _ \
 635  * | |___ >  <| |_| |_) | |_) |
 636  * |_____/_/\_\\__|____/|____/
 637  *
 638  */
 639
 640 /** A simple forward single linked list. */
 641 typedef struct {
 642         ir_node  *start;   /**< start of the list */
 643         ir_node  *end;     /**< last block in the list */
 644         unsigned n_blks;  /**< number of blocks in the list */
 645 } anchor;
 646
 647 static void add_block(anchor *list, ir_node *block) {
 648         if (list->start == NULL) {
 649                 list->start = block;
 650                 list->end   = block;
 651         } else {
 652                 set_irn_link(list->end, block);
 653                 list->end = block;
 654         }
 655
 656         list->n_blks++;
 657 }
 658
 659 static void create_block_list(ir_node *leader_block, anchor *list) {
 660         int             i;
 661         const ir_edge_t *edge;
 662         ir_node         *block = NULL;
 663         ir_extblk       *extbb = get_Block_extbb(leader_block);
 664
 665         if (extbb_visited(extbb))
 666                 return;
 667         mark_extbb_visited(extbb);
 668
 669         for (i = 0; i < get_extbb_n_blocks(extbb); ++i) {
 670                 block = get_extbb_block(extbb, i);
 671                 add_block(list, block);
 672         }
 673
 674         assert(block != NULL);
 675
 676         /* pick successor extbbs */
 677         foreach_block_succ(block, edge) {
 678                 ir_node *succ = get_edge_src_irn(edge);
 679                 create_block_list(succ, list);
 680         }
 681
 682         for (i = 0; i < get_extbb_n_blocks(extbb) - 1; ++i) {
 683                 block = get_extbb_block(extbb, i);
 684
 685                 foreach_block_succ(block, edge) {
 686                         ir_node *succ = get_edge_src_irn(edge);
 687                         create_block_list(succ, list);
 688                 }
 689         }
 690 }
 691
 692 void compute_extbb_execfreqs(ir_graph *irg, ir_exec_freq *execfreqs);
 693
 694 /*
 695  * Calculates a block schedule. The schedule is stored as a linked
 696  * list starting at the start_block of the irg.
 697  */
 698 static ir_node **create_extbb_block_schedule(ir_graph *irg, ir_exec_freq *execfreqs)
 699 {
 700         anchor list;
 701         ir_node **blk_list, *b, *n;
 702         unsigned i;
 703
 704         /* schedule extended basic blocks */
 705         compute_extbb_execfreqs(irg, execfreqs);
 706         //compute_extbb(irg);
 707
 708         list.start  = NULL;
 709         list.end    = NULL;
 710         list.n_blks = 0;
 711
 712         ir_reserve_resources(irg, IR_RESOURCE_IRN_VISITED | IR_RESOURCE_IRN_LINK);
 713         inc_irg_block_visited(irg);
 714
 715         create_block_list(get_irg_start_block(irg), &list);
 716
 717         /** create an array, so we can go forward and backward */
 718         blk_list = NEW_ARR_D(ir_node *, irg->obst,list.n_blks);
 719
 720         for (i = 0, b = list.start; b; b = n, ++i) {
 721                 n = get_irn_link(b);
 722                 blk_list[i] = b;
 723         }
 724
 725         ir_free_resources(irg, IR_RESOURCE_IRN_VISITED | IR_RESOURCE_IRN_LINK);
 726
 727         return blk_list;
 728 }
 729
 730 /*
 731  *  __  __       _
 732  * |  \/  | __ _(_)_ __
 733  * | |\/| |/ _` | | '_ \
 734  * | |  | | (_| | | | | |
 735  * |_|  |_|\__,_|_|_| |_|
 736  *
 737  */
 738 void be_init_blocksched(void)
 739 {
 740         lc_opt_entry_t *be_grp = lc_opt_get_grp(firm_opt_get_root(), "be");
 741         lc_opt_entry_t *blocksched_grp = lc_opt_get_grp(be_grp, "blocksched");
 742
 743         lc_opt_add_table(blocksched_grp, be_blocksched_options);
 744
 745         FIRM_DBG_REGISTER(dbg, "firm.be.blocksched");
 746 }
 747
 748 BE_REGISTER_MODULE_CONSTRUCTOR(be_init_blocksched);
 749
 750 ir_node **be_create_block_schedule(ir_graph *irg, ir_exec_freq *execfreqs)
 751 {
 752         switch(algo) {
 753         case BLOCKSCHED_GREEDY:
 754         case BLOCKSCHED_NAIV:
 755                 return create_block_schedule_greedy(irg, execfreqs);
 756         case BLOCKSCHED_EXTBB:
 757                 return create_extbb_block_schedule(irg, execfreqs);
 758 #ifdef WITH_ILP
 759         case BLOCKSCHED_ILP:
 760                 return create_block_schedule_ilp(irg, execfreqs);
 761 #endif /* WITH_ILP */
 762         }
 763
 764         panic("unknown blocksched algo");
 765         return NULL;
 766 }