2 * Copyright (C) 1995-2008 University of Karlsruhe. All right reserved.
4 * This file is part of libFirm.
6 * This file may be distributed and/or modified under the terms of the
7 * GNU General Public License version 2 as published by the Free Software
8 * Foundation and appearing in the file LICENSE.GPL included in the
9 * packaging of this file.
11 * Licensees holding valid libFirm Professional Edition licenses may use
12 * this file in accordance with the libFirm Commercial License.
13 * Agreement provided with the Software.
15 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
16 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * @brief Optimal reductions and helper functions.
24 * @author Sebastian Buchwald
29 #include "adt/array.h"
35 #include "html_dumper.h"
40 #include "pbqp_edge.h"
41 #include "pbqp_edge_t.h"
42 #include "pbqp_node.h"
43 #include "pbqp_node_t.h"
49 pbqp_edge **edge_bucket;
50 pbqp_node **node_buckets[4];
51 pbqp_node **reduced_bucket = NULL;
52 static int buckets_filled = 0;
54 static void insert_into_edge_bucket(pbqp_edge *edge)
56 if (edge_bucket_contains(edge_bucket, edge)) {
57 /* Edge is already inserted. */
61 edge_bucket_insert(&edge_bucket, edge);
64 static void init_buckets(void)
68 edge_bucket_init(&edge_bucket);
69 node_bucket_init(&reduced_bucket);
71 for (i = 0; i < 4; ++i) {
72 node_bucket_init(&node_buckets[i]);
76 void free_buckets(void)
80 for (i = 0; i < 4; ++i) {
81 node_bucket_free(&node_buckets[i]);
84 edge_bucket_free(&edge_bucket);
85 node_bucket_free(&reduced_bucket);
90 void fill_node_buckets(pbqp *pbqp)
96 node_len = pbqp->num_nodes;
99 ir_timer_t *t_fill_buckets = ir_timer_register("be_pbqp_fill_buckets", "PBQP Fill Nodes into buckets");
100 ir_timer_reset_and_start(t_fill_buckets);
103 for (node_index = 0; node_index < node_len; ++node_index) {
105 pbqp_node *node = get_node(pbqp, node_index);
109 degree = pbqp_node_get_degree(node);
111 /* We have only one bucket for nodes with arity >= 3. */
116 node_bucket_insert(&node_buckets[degree], node);
122 ir_timer_stop(t_fill_buckets);
123 printf("%-20s: %8.3lf msec\n", ir_timer_get_description(t_fill_buckets), (double)ir_timer_elapsed_usec(t_fill_buckets) / 1000.0);
127 static void normalize_towards_source(pbqp_edge *edge)
140 src_node = edge->src;
141 tgt_node = edge->tgt;
145 src_vec = src_node->costs;
146 tgt_vec = tgt_node->costs;
150 src_len = src_vec->len;
151 tgt_len = tgt_vec->len;
158 /* Normalize towards source node. */
159 for (src_index = 0; src_index < src_len; ++src_index) {
160 num min = pbqp_matrix_get_row_min(mat, src_index, tgt_vec);
163 if (src_vec->entries[src_index].data == INF_COSTS) {
164 pbqp_matrix_set_row_value(mat, src_index, 0);
166 pbqp_matrix_sub_row_value(mat, src_index, tgt_vec, min);
168 src_vec->entries[src_index].data = pbqp_add(
169 src_vec->entries[src_index].data, min);
171 if (min == INF_COSTS) {
173 unsigned edge_len = pbqp_node_get_degree(src_node);
175 for (edge_index = 0; edge_index < edge_len; ++edge_index) {
176 pbqp_edge *edge_candidate = src_node->edges[edge_index];
177 if (edge_candidate != edge) {
178 insert_into_edge_bucket(edge_candidate);
186 static void normalize_towards_target(pbqp_edge *edge)
199 src_node = edge->src;
200 tgt_node = edge->tgt;
204 src_vec = src_node->costs;
205 tgt_vec = tgt_node->costs;
209 src_len = src_vec->len;
210 tgt_len = tgt_vec->len;
217 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
218 num min = pbqp_matrix_get_col_min(mat, tgt_index, src_vec);
221 if (tgt_vec->entries[tgt_index].data == INF_COSTS) {
222 pbqp_matrix_set_col_value(mat, tgt_index, 0);
224 pbqp_matrix_sub_col_value(mat, tgt_index, src_vec, min);
226 tgt_vec->entries[tgt_index].data = pbqp_add(
227 tgt_vec->entries[tgt_index].data, min);
229 if (min == INF_COSTS) {
231 unsigned edge_len = pbqp_node_get_degree(tgt_node);
233 for (edge_index = 0; edge_index < edge_len; ++edge_index) {
234 pbqp_edge *edge_candidate = tgt_node->edges[edge_index];
235 if (edge_candidate != edge) {
236 insert_into_edge_bucket(edge_candidate);
245 * Tries to apply RM for the source node of the given edge.
247 * Checks whether the source node of edge can be merged into the target node of
248 * edge, and performs the merge, if possible.
250 static void merge_source_into_target(pbqp *pbqp, pbqp_edge *edge)
268 src_node = edge->src;
269 tgt_node = edge->tgt;
273 src_vec = src_node->costs;
274 tgt_vec = tgt_node->costs;
278 src_len = src_vec->len;
279 tgt_len = tgt_vec->len;
281 /* Matrizes are normalized. */
288 mapping = NEW_ARR_F(unsigned, src_len);
290 /* Check that each column has at most one zero entry. */
291 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
292 unsigned onlyOneZero = 0;
293 if (tgt_vec->entries[tgt_index].data == INF_COSTS)
296 for (src_index = 0; src_index < src_len; ++src_index) {
297 if (src_vec->entries[src_index].data == INF_COSTS)
300 if (mat->entries[src_index * tgt_len + tgt_index] == INF_COSTS)
303 /* Matrix entry is finite. */
310 mapping[tgt_index] = src_index;
314 /* We know that we can merge the source node into the target node. */
315 edge_len = pbqp_node_get_degree(src_node);
321 /* Reconnect the source's edges with the target node. */
322 for (edge_index = 0; edge_index < edge_len; ++edge_index) {
323 pbqp_edge *old_edge = src_node->edges[edge_index];
324 pbqp_matrix *old_matrix;
325 pbqp_matrix *new_matrix;
326 pbqp_node *other_node;
328 unsigned other_index;
333 if (old_edge == edge)
336 old_matrix = old_edge->costs;
339 if (old_edge->tgt == src_node) {
340 other_node = edge->src;
341 other_len = old_matrix->rows;
344 other_node = edge->tgt;
345 other_len = old_matrix->cols;
349 new_matrix = pbqp_matrix_alloc(pbqp, tgt_len, other_len);
351 /* Source node selects the column of the old_matrix. */
352 if (old_edge->tgt == src_node) {
353 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
354 unsigned old_index = mapping[tgt_index];
355 for (other_index = 0; other_index < other_len; ++other_index) {
356 new_matrix->entries[tgt_index*other_len+other_index] = old_matrix->entries[other_index*src_len+old_index];
360 /* Source node selects the row of the old_matrix. */
362 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
363 unsigned old_index = mapping[tgt_index];
364 for (other_index = 0; other_index < other_len; ++other_index) {
365 new_matrix->entries[tgt_index*other_len+other_index] = old_matrix->entries[old_index*other_len+other_index];
370 add_edge_costs(pbqp, tgt_node->index, other_node->index, new_matrix);
372 disconnect_edge(src_node, old_edge);
373 disconnect_edge(other_node, old_edge);
376 /* Reduce the remaining source node via RI. */
381 void reorder_node(pbqp_node *node)
383 unsigned degree = pbqp_node_get_degree(node);
384 /* Assume node lost one incident edge. */
385 unsigned old_degree = degree + 1;
387 if (!buckets_filled) return;
389 /* Same bucket as before */
390 if (degree > 2) return;
392 if (!node_bucket_contains(node_buckets[old_degree], node)) {
393 /* Old arity is new arity, so we have nothing to do. */
394 assert(node_bucket_contains(node_buckets[degree], node));
398 /* Delete node from old bucket... */
399 node_bucket_remove(&node_buckets[old_degree], node);
401 /* ..and add to new one. */
402 node_bucket_insert(&node_buckets[degree], node);
406 void check_melting_possibility(pbqp *pbqp, pbqp_edge *edge)
421 src_node = edge->src;
422 tgt_node = edge->tgt;
426 src_vec = src_node->costs;
427 tgt_vec = tgt_node->costs;
431 src_len = src_vec->len;
432 tgt_len = tgt_vec->len;
439 if (src_len == 1 && tgt_len == 1) {
440 //panic("Something is wrong");
444 for (src_index = 0; src_index < src_len; ++src_index) {
446 if (src_vec->entries[src_index].data == INF_COSTS) {
449 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
450 if (tgt_vec->entries[tgt_index].data == INF_COSTS) {
453 if (mat->entries[src_index * tgt_len + tgt_index] == 0) {
462 if (mat->entries[src_index * tgt_len + tgt_index] == INF_COSTS) {
468 allRowsOk &= onlyOneZero;
472 for (tgt_index = 0; tgt_index < tgt_len; ++tgt_index) {
474 if (tgt_vec->entries[tgt_index].data == INF_COSTS) {
477 for (src_index = 0; src_index < src_len; ++src_index) {
478 if (src_vec->entries[src_index].data == INF_COSTS) {
481 if (mat->entries[src_index * tgt_len + tgt_index] == 0) {
490 if (mat->entries[src_index * tgt_len + tgt_index] == INF_COSTS) {
496 allColsOk &= onlyOneZero;
499 if (allRowsOk || allColsOk) {
505 void simplify_edge(pbqp *pbqp, pbqp_edge *edge)
518 src_node = edge->src;
519 tgt_node = edge->tgt;
523 /* If edge are already deleted, we have nothing to do. */
524 if (!is_connected(src_node, edge) || !is_connected(tgt_node, edge))
528 if (pbqp->dump_file) {
530 sprintf(txt, "Simplification of Edge n%d-n%d", src_node->index, tgt_node->index);
531 dump_section(pbqp->dump_file, 3, txt);
535 src_vec = src_node->costs;
536 tgt_vec = tgt_node->costs;
540 src_len = src_vec->len;
541 tgt_len = tgt_vec->len;
549 if (pbqp->dump_file) {
550 fputs("Input:<br>\n", pbqp->dump_file);
551 dump_simplifyedge(pbqp, edge);
555 normalize_towards_source(edge);
556 normalize_towards_target(edge);
559 if (pbqp->dump_file) {
560 fputs("<br>\nOutput:<br>\n", pbqp->dump_file);
561 dump_simplifyedge(pbqp, edge);
565 if (pbqp_matrix_is_zero(mat, src_vec, tgt_vec)) {
567 if (pbqp->dump_file) {
568 fputs("edge has been eliminated<br>\n", pbqp->dump_file);
577 reorder_node(src_node);
578 reorder_node(tgt_node);
582 void initial_simplify_edges(pbqp *pbqp)
590 ir_timer_t *t_int_simpl = ir_timer_register("be_pbqp_init_simp", "PBQP Initial simplify edges");
591 ir_timer_reset_and_start(t_int_simpl);
595 if (pbqp->dump_file) {
596 pbqp_dump_input(pbqp);
597 dump_section(pbqp->dump_file, 1, "2. Simplification of Cost Matrices");
601 node_len = pbqp->num_nodes;
605 /* First simplify all edges. */
606 for (node_index = 0; node_index < node_len; ++node_index) {
608 pbqp_node *node = get_node(pbqp, node_index);
615 edge_len = pbqp_node_get_degree(node);
617 for (edge_index = 0; edge_index < edge_len; ++edge_index) {
618 pbqp_edge *edge = edges[edge_index];
620 /* Simplify only once per edge. */
621 if (node != edge->src) continue;
623 simplify_edge(pbqp, edge);
628 ir_timer_stop(t_int_simpl);
629 printf("%-20s: %8.3lf msec\n", ir_timer_get_description(t_int_simpl), (double)ir_timer_elapsed_usec(t_int_simpl) / 1000.0);
633 num determine_solution(pbqp *pbqp)
640 ir_timer_t *t_det_solution = ir_timer_register("be_det_solution", "PBQP Determine Solution");
641 ir_timer_reset_and_start(t_det_solution);
651 file = pbqp->dump_file;
654 dump_section(file, 1, "4. Determine Solution/Minimum");
655 dump_section(file, 2, "4.1. Trivial Solution");
659 /* Solve trivial nodes and calculate solution. */
660 node_len = node_bucket_get_length(node_buckets[0]);
663 pbqp->num_r0 = node_len;
666 for (node_index = 0; node_index < node_len; ++node_index) {
667 pbqp_node *node = node_buckets[0][node_index];
670 node->solution = vector_get_min_index(node->costs);
671 solution = pbqp_add(solution,
672 node->costs->entries[node->solution].data);
676 fprintf(file, "node n%d is set to %d<br>\n", node->index, node->solution);
677 dump_node(file, node);
684 dump_section(file, 2, "Minimum");
685 #if KAPS_USE_UNSIGNED
686 fprintf(file, "Minimum is equal to %u.", solution);
688 fprintf(file, "Minimum is equal to %lld.", solution);
694 ir_timer_stop(t_det_solution);
695 printf("%-20s: %8.3lf msec\n", ir_timer_get_description(t_det_solution), (double)ir_timer_elapsed_usec(t_det_solution) / 1000.0);
701 static void back_propagate_RI(pbqp *pbqp, pbqp_node *node)
712 edge = node->edges[0];
714 is_src = edge->src == node;
721 node->solution = pbqp_matrix_get_col_min_index(mat, other->solution, vec);
726 node->solution = pbqp_matrix_get_row_min_index(mat, other->solution, vec);
730 if (pbqp->dump_file) {
731 fprintf(pbqp->dump_file, "node n%d is set to %d<br>\n", node->index, node->solution);
736 static void back_propagate_RII(pbqp *pbqp, pbqp_node *node)
738 pbqp_edge *src_edge = node->edges[0];
739 pbqp_edge *tgt_edge = node->edges[1];
740 int src_is_src = src_edge->src == node;
741 int tgt_is_src = tgt_edge->src == node;
742 pbqp_matrix *src_mat;
743 pbqp_matrix *tgt_mat;
754 src_node = src_edge->tgt;
756 src_node = src_edge->src;
760 tgt_node = tgt_edge->tgt;
762 tgt_node = tgt_edge->src;
765 /* Swap nodes if necessary. */
766 if (tgt_node->index < src_node->index) {
778 src_is_src = src_edge->src == node;
779 tgt_is_src = tgt_edge->src == node;
782 src_mat = src_edge->costs;
783 tgt_mat = tgt_edge->costs;
785 node_vec = node->costs;
787 row_index = src_node->solution;
788 col_index = tgt_node->solution;
790 vec = vector_copy(pbqp, node_vec);
793 vector_add_matrix_col(vec, src_mat, row_index);
795 vector_add_matrix_row(vec, src_mat, row_index);
799 vector_add_matrix_col(vec, tgt_mat, col_index);
801 vector_add_matrix_row(vec, tgt_mat, col_index);
804 node->solution = vector_get_min_index(vec);
807 if (pbqp->dump_file) {
808 fprintf(pbqp->dump_file, "node n%d is set to %d<br>\n", node->index, node->solution);
812 obstack_free(&pbqp->obstack, vec);
815 void back_propagate(pbqp *pbqp)
818 unsigned node_len = node_bucket_get_length(reduced_bucket);
823 if (pbqp->dump_file) {
824 dump_section(pbqp->dump_file, 2, "Back Propagation");
828 for (node_index = node_len; node_index > 0; --node_index) {
829 pbqp_node *node = reduced_bucket[node_index - 1];
831 switch (pbqp_node_get_degree(node)) {
833 back_propagate_RI(pbqp, node);
836 back_propagate_RII(pbqp, node);
839 panic("Only nodes with degree one or two should be in this bucket");
845 void apply_edge(pbqp *pbqp)
847 pbqp_edge *edge = edge_bucket_pop(&edge_bucket);
849 simplify_edge(pbqp, edge);
852 void apply_RI(pbqp *pbqp)
854 pbqp_node *node = node_bucket_pop(&node_buckets[1]);
855 pbqp_edge *edge = node->edges[0];
856 pbqp_matrix *mat = edge->costs;
857 int is_src = edge->src == node;
858 pbqp_node *other_node;
861 assert(pbqp_node_get_degree(node) == 1);
864 other_node = edge->tgt;
866 other_node = edge->src;
870 if (pbqp->dump_file) {
872 sprintf(txt, "RI-Reduction of Node n%d", node->index);
873 dump_section(pbqp->dump_file, 2, txt);
874 pbqp_dump_graph(pbqp);
875 fputs("<br>\nBefore reduction:<br>\n", pbqp->dump_file);
876 dump_node(pbqp->dump_file, node);
877 dump_node(pbqp->dump_file, other_node);
878 dump_edge(pbqp->dump_file, edge);
883 pbqp_matrix_add_to_all_cols(mat, node->costs);
884 normalize_towards_target(edge);
886 pbqp_matrix_add_to_all_rows(mat, node->costs);
887 normalize_towards_source(edge);
889 disconnect_edge(other_node, edge);
892 if (pbqp->dump_file) {
893 fputs("<br>\nAfter reduction:<br>\n", pbqp->dump_file);
894 dump_node(pbqp->dump_file, other_node);
898 reorder_node(other_node);
904 /* Add node to back propagation list. */
905 node_bucket_insert(&reduced_bucket, node);
908 void apply_RII(pbqp *pbqp)
910 pbqp_node *node = node_bucket_pop(&node_buckets[2]);
911 pbqp_edge *src_edge = node->edges[0];
912 pbqp_edge *tgt_edge = node->edges[1];
913 int src_is_src = src_edge->src == node;
914 int tgt_is_src = tgt_edge->src == node;
915 pbqp_matrix *src_mat;
916 pbqp_matrix *tgt_mat;
931 assert(pbqp_node_get_degree(node) == 2);
934 src_node = src_edge->tgt;
936 src_node = src_edge->src;
940 tgt_node = tgt_edge->tgt;
942 tgt_node = tgt_edge->src;
945 /* Swap nodes if necessary. */
946 if (tgt_node->index < src_node->index) {
958 src_is_src = src_edge->src == node;
959 tgt_is_src = tgt_edge->src == node;
963 if (pbqp->dump_file) {
965 sprintf(txt, "RII-Reduction of Node n%d", node->index);
966 dump_section(pbqp->dump_file, 2, txt);
967 pbqp_dump_graph(pbqp);
968 fputs("<br>\nBefore reduction:<br>\n", pbqp->dump_file);
969 dump_node(pbqp->dump_file, src_node);
970 dump_edge(pbqp->dump_file, src_edge);
971 dump_node(pbqp->dump_file, node);
972 dump_edge(pbqp->dump_file, tgt_edge);
973 dump_node(pbqp->dump_file, tgt_node);
977 src_mat = src_edge->costs;
978 tgt_mat = tgt_edge->costs;
980 src_vec = src_node->costs;
981 tgt_vec = tgt_node->costs;
982 node_vec = node->costs;
984 row_len = src_vec->len;
985 col_len = tgt_vec->len;
986 node_len = node_vec->len;
988 mat = pbqp_matrix_alloc(pbqp, row_len, col_len);
990 for (row_index = 0; row_index < row_len; ++row_index) {
991 for (col_index = 0; col_index < col_len; ++col_index) {
992 vec = vector_copy(pbqp, node_vec);
995 vector_add_matrix_col(vec, src_mat, row_index);
997 vector_add_matrix_row(vec, src_mat, row_index);
1001 vector_add_matrix_col(vec, tgt_mat, col_index);
1003 vector_add_matrix_row(vec, tgt_mat, col_index);
1006 mat->entries[row_index * col_len + col_index] = vector_get_min(vec);
1008 obstack_free(&pbqp->obstack, vec);
1012 pbqp_edge *edge = get_edge(pbqp, src_node->index, tgt_node->index);
1014 /* Disconnect node. */
1015 disconnect_edge(src_node, src_edge);
1016 disconnect_edge(tgt_node, tgt_edge);
1022 /* Add node to back propagation list. */
1023 node_bucket_insert(&reduced_bucket, node);
1026 edge = alloc_edge(pbqp, src_node->index, tgt_node->index, mat);
1029 pbqp_matrix_add(edge->costs, mat);
1031 /* Free local matrix. */
1032 obstack_free(&pbqp->obstack, mat);
1034 reorder_node(src_node);
1035 reorder_node(tgt_node);
1039 if (pbqp->dump_file) {
1040 fputs("<br>\nAfter reduction:<br>\n", pbqp->dump_file);
1041 dump_edge(pbqp->dump_file, edge);
1045 /* Edge has changed so we simplify it. */
1046 simplify_edge(pbqp, edge);
1049 void select_alternative(pbqp_node *node, unsigned selected_index)
1051 unsigned edge_index;
1052 unsigned node_index;
1055 unsigned max_degree = pbqp_node_get_degree(node);
1058 node->solution = selected_index;
1059 node_vec = node->costs;
1060 node_len = node_vec->len;
1061 assert(selected_index < node_len);
1063 /* Set all other costs to infinity. */
1064 for (node_index = 0; node_index < node_len; ++node_index) {
1065 if (node_index != selected_index) {
1066 node_vec->entries[node_index].data = INF_COSTS;
1070 /* Add all incident edges to edge bucket, since they are now independent. */
1071 for (edge_index = 0; edge_index < max_degree; ++edge_index) {
1072 insert_into_edge_bucket(node->edges[edge_index]);
1076 pbqp_node *get_node_with_max_degree(void)
1078 pbqp_node **bucket = node_buckets[3];
1079 unsigned bucket_len = node_bucket_get_length(bucket);
1080 unsigned bucket_index;
1081 unsigned max_degree = 0;
1082 pbqp_node *result = NULL;
1084 for (bucket_index = 0; bucket_index < bucket_len; ++bucket_index) {
1085 pbqp_node *candidate = bucket[bucket_index];
1086 unsigned degree = pbqp_node_get_degree(candidate);
1088 if (degree > max_degree) {
1090 max_degree = degree;
1097 unsigned get_local_minimal_alternative(pbqp *pbqp, pbqp_node *node)
1103 unsigned edge_index;
1104 unsigned max_degree;
1105 unsigned node_index;
1107 unsigned min_index = 0;
1108 num min = INF_COSTS;
1113 node_vec = node->costs;
1114 node_len = node_vec->len;
1115 max_degree = pbqp_node_get_degree(node);
1117 for (node_index = 0; node_index < node_len; ++node_index) {
1118 num value = node_vec->entries[node_index].data;
1120 for (edge_index = 0; edge_index < max_degree; ++edge_index) {
1121 edge = node->edges[edge_index];
1123 is_src = edge->src == node;
1126 vec = vector_copy(pbqp, edge->tgt->costs);
1127 vector_add_matrix_row(vec, mat, node_index);
1129 vec = vector_copy(pbqp, edge->src->costs);
1130 vector_add_matrix_col(vec, mat, node_index);
1133 value = pbqp_add(value, vector_get_min(vec));
1135 obstack_free(&pbqp->obstack, vec);
1140 min_index = node_index;
1147 int node_is_reduced(pbqp_node *node)
1149 if (!reduced_bucket) return 0;
1151 if (pbqp_node_get_degree(node) == 0) return 1;
1153 return node_bucket_contains(reduced_bucket, node);