f65db2cf808c24b527fd69be9555b9cf24ef3465
[libfirm] / heuristical_co.c
1 /*
2  * Copyright (C) 1995-2008 University of Karlsruhe.  All right reserved.
3  *
4  * This file is part of libFirm.
5  *
6  * This file may be distributed and/or modified under the terms of the
7  * GNU General Public License version 2 as published by the Free Software
8  * Foundation and appearing in the file LICENSE.GPL included in the
9  * packaging of this file.
10  *
11  * Licensees holding valid libFirm Professional Edition licenses may use
12  * this file in accordance with the libFirm Commercial License.
13  * Agreement provided with the Software.
14  *
15  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
17  * PURPOSE.
18  */
19
20 /**
21  * @file
22  * @brief   Heuristic PBQP solver for SSA-based register allocation.
23  * @date    18.09.2009
24  * @author  Thomas Bersch
25  * @version $Id$
26  */
27 #include "config.h"
28
29 #include "adt/array.h"
30 #include "assert.h"
31 #include "error.h"
32
33 #include "bucket.h"
34 #include "heuristical_co.h"
35 #include "optimal.h"
36 #if     KAPS_DUMP
37 #include "html_dumper.h"
38 #endif
39 #include "kaps.h"
40 #include "matrix.h"
41 #include "pbqp_edge.h"
42 #include "pbqp_edge_t.h"
43 #include "pbqp_node.h"
44 #include "pbqp_node_t.h"
45 #include "vector.h"
46
47 #include "plist.h"
48 #include "timing.h"
49
50 static void merge_into_RN_node(pbqp *pbqp, plist_t *rpeo)
51 {
52         pbqp_node   *node         = NULL;
53
54         assert(pbqp);
55
56         /* We want to reduce the first node in reverse perfect elimination order. */
57         do {
58                 /* get first element from reverse perfect elimination order */
59                 node = plist_first(rpeo)->data;
60                 /* remove element from reverse perfect elimination order */
61                 plist_erase(rpeo, plist_first(rpeo));
62                 /* insert node at the end of rpeo so the rpeo already exits after pbqp solving */
63                 plist_insert_back(rpeo, node);
64         } while(node_is_reduced(node));
65
66         assert(node);
67         assert(pbqp_node_get_degree(node) > 2);
68
69 #if     KAPS_DUMP
70         if (pbqp->dump_file) {
71                 char     txt[100];
72                 sprintf(txt, "RN-Reduction of Node n%d", node->index);
73                 dump_section(pbqp->dump_file, 2, txt);
74                 pbqp_dump_graph(pbqp);
75         }
76 #endif
77         /* Check whether we can merge a neighbor into the current node. */
78         apply_RM(pbqp, node);
79 }
80
81 static void apply_RN_co(pbqp *pbqp)
82 {
83         pbqp_node   *node      = NULL;
84         unsigned     min_index = 0;
85
86         assert(pbqp);
87
88         node        = merged_node;
89         merged_node = NULL;
90         assert(node);
91
92         if (node_is_reduced(node))
93                 return;
94
95         min_index = get_local_minimal_alternative(pbqp, node);
96
97 #if     KAPS_DUMP
98         if (pbqp->dump_file) {
99                 fprintf(pbqp->dump_file, "node n%d is set to %d<br><br>\n",
100                                         node->index, min_index);
101         }
102 #endif
103
104 #if KAPS_STATISTIC
105                 FILE *fh = fopen("solutions.pb", "a");
106                 fprintf(fh, "[%u]", min_index);
107                 fclose(fh);
108                 pbqp->num_rn++;
109 #endif
110
111         /* Now that we found the local minimum set all other costs to infinity. */
112         select_alternative(node, min_index);
113 }
114
115 static void apply_heuristic_reductions_co(pbqp *pbqp, plist_t *rpeo)
116 {
117         #if KAPS_TIMING
118                 /* create timers */
119                 ir_timer_t *t_edge = ir_timer_new();
120                 ir_timer_t *t_r1   = ir_timer_new();
121                 ir_timer_t *t_r2   = ir_timer_new();
122                 ir_timer_t *t_rn   = ir_timer_new();
123         #endif
124
125         for (;;) {
126                 if (edge_bucket_get_length(edge_bucket) > 0) {
127                         #if KAPS_TIMING
128                                 ir_timer_start(t_edge);
129                         #endif
130
131                         apply_edge(pbqp);
132
133                         #if KAPS_TIMING
134                                 ir_timer_stop(t_edge);
135                         #endif
136                 } else if (node_bucket_get_length(node_buckets[1]) > 0) {
137                         #if KAPS_TIMING
138                                 ir_timer_start(t_r1);
139                         #endif
140
141                         apply_RI(pbqp);
142
143                         #if KAPS_TIMING
144                                 ir_timer_stop(t_r1);
145                         #endif
146                 } else if (node_bucket_get_length(node_buckets[2]) > 0) {
147                         #if KAPS_TIMING
148                                 ir_timer_start(t_r2);
149                         #endif
150
151                         apply_RII(pbqp);
152
153                         #if KAPS_TIMING
154                                 ir_timer_stop(t_r2);
155                         #endif
156                 } else if (merged_node != NULL) {
157                         #if KAPS_TIMING
158                                 ir_timer_start(t_rn);
159                         #endif
160
161                         apply_RN_co(pbqp);
162
163                         #if KAPS_TIMING
164                                 ir_timer_stop(t_rn);
165                         #endif
166                 } else if (node_bucket_get_length(node_buckets[3]) > 0) {
167                         #if KAPS_TIMING
168                                 ir_timer_start(t_rn);
169                         #endif
170
171                         merge_into_RN_node(pbqp, rpeo);
172
173                         #if KAPS_TIMING
174                                 ir_timer_stop(t_rn);
175                         #endif
176                 } else {
177                         #if KAPS_TIMING
178                                 printf("PBQP RE reductions:           %10.3lf msec\n", (double)ir_timer_elapsed_usec(t_edge) / 1000.0);
179                                 printf("PBQP R1 reductions:           %10.3lf msec\n", (double)ir_timer_elapsed_usec(t_r1) / 1000.0);
180                                 printf("PBQP R2 reductions:           %10.3lf msec\n", (double)ir_timer_elapsed_usec(t_r2) / 1000.0);
181                                 printf("PBQP RN reductions:           %10.3lf msec\n", (double)ir_timer_elapsed_usec(t_rn) / 1000.0);
182                         #endif
183
184                         return;
185                 }
186         }
187 }
188
189 void solve_pbqp_heuristical_co(pbqp *pbqp, plist_t *rpeo)
190 {
191         /* Reduce nodes degree ... */
192         initial_simplify_edges(pbqp);
193
194         /* ... and put node into bucket representing their degree. */
195         fill_node_buckets(pbqp);
196
197         #if KAPS_STATISTIC
198                 FILE *fh = fopen("solutions.pb", "a");
199                 fprintf(fh, "Solution");
200                 fclose(fh);
201         #endif
202
203         apply_heuristic_reductions_co(pbqp, rpeo);
204
205         pbqp->solution = determine_solution(pbqp);
206
207         #if KAPS_STATISTIC
208                 fh = fopen("solutions.pb", "a");
209                 #if KAPS_USE_UNSIGNED
210                         fprintf(fh, ": %u RE:%u R0:%u R1:%u R2:%u RM:%u RN/BF:%u\n", pbqp->solution,
211                                         pbqp->num_edges, pbqp->num_r0, pbqp->num_r1, pbqp->num_r2,
212                                         pbqp->num_rm, pbqp->num_rn);
213                 #else
214                         fprintf(fh, ": %lld RE:%u R0:%u R1:%u R2:%u RM:%u RN/BF:%u\n", pbqp->solution,
215                                         pbqp->num_edges, pbqp->num_r0, pbqp->num_r1, pbqp->num_r2,
216                 #endif
217                 fclose(fh);
218         #endif
219
220         /* Solve reduced nodes. */
221         back_propagate(pbqp);
222
223         free_buckets();
224 }