must use Lg, not Ne to check for !=
[libfirm] / ir / opt / boolopt.c
1 #include <assert.h>
2 #include <string.h>
3
4 #include "adt/obst.h"
5 #include "ircons.h"
6 #include "irgmod.h"
7 #include "irgwalk.h"
8 #include "irprintf.h"
9 #include "irnode_t.h"
10 #include "tv.h"
11
/**
 * Two comparisons of the same value against two different constants,
 * ordered by the constants: the *_lo members belong to the comparison with
 * the smaller constant, the *_hi members to the one with the larger constant.
 * Filled in by find_cond_pair().
 */
typedef struct cond_pair {
        ir_node *cmp_lo;   /* Cmp node comparing against the smaller constant */
        ir_node *cmp_hi;   /* Cmp node comparing against the larger constant */
        pn_Cmp   pnc_lo;   /* relation selected by proj_lo */
        pn_Cmp   pnc_hi;   /* relation selected by proj_hi */
        ir_node *proj_lo;  /* Proj on cmp_lo */
        ir_node *proj_hi;  /* Proj on cmp_hi */
        tarval  *tv_lo;    /* the smaller constant */
        tarval  *tv_hi;    /* the larger constant */
} cond_pair;
22
23 static int find_cond_pair(ir_node *const l, ir_node *const r, cond_pair *const res)
24 {
25         if (is_Proj(l) && is_Proj(r)) {
26                 ir_node *const lo = get_Proj_pred(l);
27                 ir_node *const ro = get_Proj_pred(r);
28
29                 if (is_Cmp(lo) && is_Cmp(ro)) {
30                         ir_node *const lol = get_Cmp_left(lo);
31                         ir_node *const lor = get_Cmp_right(lo);
32                         ir_node *const rol = get_Cmp_left(ro);
33                         ir_node *const ror = get_Cmp_right(ro);
34
35                         if(is_Const(lor) && is_Const_null(lor) && is_Const(ror) && is_Const_null(ror) && get_Proj_proj(l) == pn_Cmp_Lg && get_Proj_proj(r) == pn_Cmp_Lg) {
36                                 ir_fprintf(stderr, "found zero zero\n");
37                         }
38
39                         /* TODO float */
40                         /* The constants shall be unequal.  Local optimisations handle the
41                          * equal case */
42                         if (lol == rol && mode_is_int(get_irn_mode(lol)) && lor != ror && is_Const(lor) && is_Const(ror)) {
43                                 tarval *const tv_l  = get_Const_tarval(lor);
44                                 tarval *const tv_r  = get_Const_tarval(ror);
45                                 pn_Cmp  const pnc_l = get_Proj_proj(l);
46                                 pn_Cmp  const pnc_r = get_Proj_proj(r);
47                                 pn_Cmp  const rel   = tarval_cmp(tv_l, tv_r);
48
49                                 assert(rel != pn_Cmp_Eq);
50
51                                 if (rel == pn_Cmp_Lt) {
52                                         res->cmp_lo  = lo;
53                                         res->cmp_hi  = ro;
54                                         res->pnc_lo  = pnc_l;
55                                         res->pnc_hi  = pnc_r;
56                                         res->proj_lo = l;
57                                         res->proj_hi = r;
58                                         res->tv_lo   = tv_l;
59                                         res->tv_hi   = tv_r;
60                                 } else {
61                                         assert(rel == pn_Cmp_Gt);
62                                         res->cmp_lo  = ro;
63                                         res->cmp_hi  = lo;
64                                         res->pnc_lo  = pnc_r;
65                                         res->pnc_hi  = pnc_l;
66                                         res->proj_lo = r;
67                                         res->proj_hi = l;
68                                         res->tv_lo   = tv_r;
69                                         res->tv_hi   = tv_l;
70                                 }
71                                 return 1;
72                         }
73                 }
74         }
75         return 0;
76 }
77
78 static ir_node *bool_and(cond_pair* const cpair)
79 {
80         ir_node *const cmp_lo  = cpair->cmp_lo;
81         ir_node *const cmp_hi  = cpair->cmp_hi;
82         pn_Cmp   const pnc_lo  = cpair->pnc_lo;
83         pn_Cmp   const pnc_hi  = cpair->pnc_hi;
84         ir_node *const proj_lo = cpair->proj_lo;
85         ir_node *const proj_hi = cpair->proj_hi;
86         tarval  *const tv_lo   = cpair->tv_lo;
87         tarval  *const tv_hi   = cpair->tv_hi;
88
89         /* Beware of NaN's, we can only check for (ordered) != here (which is Lg, not Ne) */
90         if ((pnc_lo == pn_Cmp_Lt || pnc_lo == pn_Cmp_Le || pnc_lo == pn_Cmp_Eq) &&
91                         (pnc_hi == pn_Cmp_Eq || pnc_hi == pn_Cmp_Ge || pnc_hi == pn_Cmp_Gt)) {
92                 /* x <|<=|== lo | x ==|>=|> hi -> false */
93                 ir_node *const t = new_Const(mode_b, tarval_b_false);
94                 return t;
95         } else if ((pnc_lo == pn_Cmp_Lt || pnc_lo == pn_Cmp_Le || pnc_lo == pn_Cmp_Eq) &&
96                                                  (pnc_hi == pn_Cmp_Lt || pnc_hi == pn_Cmp_Le || pnc_hi == pn_Cmp_Lg)) {
97                 /* x <|<=|== lo && x <|<=|!= hi -> x <|<=|== lo */
98                 return proj_lo;
99         } else if ((pnc_lo == pn_Cmp_Ge || pnc_lo == pn_Cmp_Gt || pnc_lo == pn_Cmp_Lg) &&
100                                                  (pnc_hi == pn_Cmp_Eq || pnc_hi == pn_Cmp_Ge || pnc_hi == pn_Cmp_Gt)) {
101                 /* x >=|>|!= lo || x ==|>=|> hi -> x ==|>=|> hi */
102                 return proj_hi;
103         } else if (tarval_is_one(tarval_sub(tv_hi, tv_lo))) { /* lo + 1 == hi */
104                 if (pnc_lo == pn_Cmp_Ge && pnc_hi == pn_Cmp_Lt) {
105                         /* x >= c || x < c + 1 -> x == c */
106                         ir_graph *const irg   = current_ir_graph;
107                         ir_node  *const block = get_nodes_block(cmp_lo);
108                         ir_node  *const p = new_r_Proj(irg, block, cmp_lo, mode_b, pn_Cmp_Eq);
109                         return p;
110                 } else if (pnc_lo == pn_Cmp_Gt) {
111                         if (pnc_hi == pn_Cmp_Lg) {
112                                 /* x > c || x != c + 1 -> x > c + 1 */
113                                 ir_graph *const irg   = current_ir_graph;
114                                 ir_node  *const block = get_nodes_block(cmp_hi);
115                                 ir_node  *const p = new_r_Proj(irg, block, cmp_hi, mode_b, pn_Cmp_Gt);
116                                 return p;
117                         } else if (pnc_hi == pn_Cmp_Lt) {
118                                 /* x > c || x < c + 1 -> false */
119                                 ir_node *const t = new_Const(mode_b, tarval_b_false);
120                                 return t;
121                         } else if (pnc_hi == pn_Cmp_Le) {
122                                 /* x > c || x <= c + 1 -> x != c + 1 */
123                                 ir_graph *const irg   = current_ir_graph;
124                                 ir_node  *const block = get_nodes_block(cmp_hi);
125                                 ir_node  *const p = new_r_Proj(irg, block, cmp_hi, mode_b, pn_Cmp_Eq);
126                                 return p;
127                         }
128                 } else if (pnc_lo == pn_Cmp_Lg && pnc_hi == pn_Cmp_Lt) {
129                         /* x != c || c < c + 1 -> x < c */
130                         ir_graph *const irg   = current_ir_graph;
131                         ir_node  *const block = get_nodes_block(cmp_lo);
132                         ir_node  *const p     = new_r_Proj(irg, block, cmp_lo, mode_b, pn_Cmp_Lt);
133                         return p;
134                 }
135         }
136         return NULL;
137 }
138
139 static ir_node *bool_or(cond_pair *const cpair)
140 {
141         ir_node *const cmp_lo  = cpair->cmp_lo;
142         ir_node *const cmp_hi  = cpair->cmp_hi;
143         pn_Cmp   const pnc_lo  = cpair->pnc_lo;
144         pn_Cmp   const pnc_hi  = cpair->pnc_hi;
145         ir_node *const proj_lo = cpair->proj_lo;
146         ir_node *const proj_hi = cpair->proj_hi;
147         tarval  *const tv_lo   = cpair->tv_lo;
148         tarval  *const tv_hi   = cpair->tv_hi;
149
150         /* Beware of NaN's, we can only check for (ordered) != here (which is Lg, not Ne) */
151         if ((pnc_lo == pn_Cmp_Ge || pnc_lo == pn_Cmp_Gt || pnc_lo == pn_Cmp_Lg) &&
152                         (pnc_hi == pn_Cmp_Lt || pnc_hi == pn_Cmp_Le || pnc_hi == pn_Cmp_Lg)) {
153                 /* x >=|>|!= lo | x <|<=|!= hi -> true */
154                 ir_node *const t = new_Const(mode_b, tarval_b_true);
155                 return t;
156         } else if ((pnc_lo == pn_Cmp_Lt || pnc_lo == pn_Cmp_Le || pnc_lo == pn_Cmp_Eq) &&
157                                                  (pnc_hi == pn_Cmp_Lt || pnc_hi == pn_Cmp_Le || pnc_hi == pn_Cmp_Lg)) {
158                 /* x <|<=|== lo || x <|<=|!= hi -> x <|<=|!= hi */
159                 return proj_hi;
160         } else if ((pnc_lo == pn_Cmp_Ge || pnc_lo == pn_Cmp_Gt || pnc_lo == pn_Cmp_Lg) &&
161                                                  (pnc_hi == pn_Cmp_Eq || pnc_hi == pn_Cmp_Ge || pnc_hi == pn_Cmp_Gt)) {
162                 /* x >=|>|!= lo || x ==|>=|> hi -> x >=|>|!= lo */
163                 return proj_lo;
164         } else if (tarval_is_one(tarval_sub(tv_hi, tv_lo))) { /* lo + 1 == hi */
165                 if (pnc_lo == pn_Cmp_Lt && pnc_hi == pn_Cmp_Ge) {
166                         /* x < c || x >= c + 1 -> x != c */
167                         ir_graph *const irg   = current_ir_graph;
168                         ir_node  *const block = get_nodes_block(cmp_lo);
169                         ir_node  *const p = new_r_Proj(irg, block, cmp_lo, mode_b, pn_Cmp_Lg);
170                         return p;
171                 } else if (pnc_lo == pn_Cmp_Le) {
172                         if (pnc_hi == pn_Cmp_Eq) {
173                                 /* x <= c || x == c + 1 -> x <= c + 1 */
174                                 ir_graph *const irg   = current_ir_graph;
175                                 ir_node  *const block = get_nodes_block(cmp_hi);
176                                 ir_node  *const p = new_r_Proj(irg, block, cmp_hi, mode_b, pn_Cmp_Le);
177                                 return p;
178                         } else if (pnc_hi == pn_Cmp_Ge) {
179                                 /* x <= c || x >= c + 1 -> true */
180                                 ir_node *const t = new_Const(mode_b, tarval_b_true);
181                                 return t;
182                         } else if (pnc_hi == pn_Cmp_Gt) {
183                                 /* x <= c || x > c + 1 -> x != c + 1 */
184                                 ir_graph *const irg   = current_ir_graph;
185                                 ir_node  *const block = get_nodes_block(cmp_hi);
186                                 ir_node  *const p = new_r_Proj(irg, block, cmp_hi, mode_b, pn_Cmp_Lg);
187                                 return p;
188                         }
189                 } else if (pnc_lo == pn_Cmp_Eq && pnc_hi == pn_Cmp_Ge) {
190                         /* x == c || c >= c + 1 -> x >= c */
191                         ir_graph *const irg   = current_ir_graph;
192                         ir_node  *const block = get_nodes_block(cmp_lo);
193                         ir_node  *const p     = new_r_Proj(irg, block, cmp_lo, mode_b, pn_Cmp_Ge);
194                         return p;
195                 }
196         }
197         return NULL;
198 }
199
200 static void bool_walk(ir_node *n, void *env)
201 {
202         (void)env;
203
204         if (get_irn_mode(n) != mode_b)
205                 return;
206
207         if (is_And(n)) {
208                 ir_node *const l = get_And_left(n);
209                 ir_node *const r = get_And_right(n);
210                 ir_node *      replacement;
211                 cond_pair      cpair;
212                 if (!find_cond_pair(l, r, &cpair))
213                         return;
214                 replacement = bool_and(&cpair);
215                 if (replacement)
216                         exchange(n, replacement);
217         } else if (is_Or(n)) {
218                 ir_node *const l = get_Or_left(n);
219                 ir_node *const r = get_Or_right(n);
220                 ir_node *      replacement;
221                 cond_pair      cpair;
222                 if (!find_cond_pair(l, r, &cpair))
223                         return;
224                 replacement = bool_or(&cpair);
225                 if (replacement)
226                         exchange(n, replacement);
227         }
228 }
229
230 /**
231  * Walker, clear Block mark and Phi list
232  */
233 static void clear_block_infos(ir_node *node, void *env)
234 {
235         (void) env;
236
237         /* we visit blocks before any other nodes (from the block) */
238         if (!is_Block(node))
239                 return;
240
241         /* clear the PHI list */
242         set_Block_phis(node, NULL);
243         set_Block_mark(node, 0);
244 }
245
246 /**
247  * Walker: collect Phi nodes and update the
248  */
249 static void collect_phis(ir_node *node, void *env)
250 {
251         (void) env;
252
253         if (is_Phi(node)) {
254                 ir_node *block = get_nodes_block(node);
255                 add_Block_phi(block, node);
256                 return;
257         }
258
259         /* Ignore control flow nodes, these will be removed. */
260         if (get_irn_pinned(node) == op_pin_state_pinned &&
261                         !is_Block(node) && !is_cfop(node)) {
262                 ir_node *block = get_nodes_block(node);
263                 set_Block_mark(block, 1);
264         }
265 }
266
267 ir_node *skip_empty_block(ir_node *node)
268 {
269         ir_node      *block;
270
271         if(!is_Jmp(node))
272                 return node;
273
274         block = get_nodes_block(node);
275         if(get_Block_n_cfgpreds(block) != 1)
276                 return node;
277
278         if(get_Block_mark(block))
279                 return node;
280
281         return get_Block_cfgpred(block, 0);
282 }
283
284 static void find_cf_and_or_walker(ir_node *block, void *env)
285 {
286         int i, i2;
287         int n_cfgpreds = get_Block_n_cfgpreds(block);
288         (void) env;
289
290         if(n_cfgpreds < 2)
291                 return;
292
293         /* Find the following structure:
294          *
295          *        upper_block
296          *         /       |
297          *        /        |
298          *   lower_block   |
299          *     /  \        |
300          *   ...   \       |
301          *           block
302          */
303
304 restart:
305         for(i = 0; i < n_cfgpreds; ++i) {
306                 ir_node      *lower_block;
307                 ir_node      *lower_cf;
308                 ir_node      *cond;
309                 ir_node      *cond_selector;
310                 ir_node      *lower_pred;
311
312                 lower_cf = get_Block_cfgpred(block, i);
313                 lower_cf = skip_empty_block(lower_cf);
314                 if(!is_Proj(lower_cf))
315                         continue;
316
317                 lower_block = get_nodes_block(lower_cf);
318                 if(get_Block_n_cfgpreds(lower_block) != 1)
319                         continue;
320
321                 cond = get_Proj_pred(lower_cf);
322                 if(!is_Cond(cond))
323                         continue;
324
325                 cond_selector = get_Cond_selector(cond);
326                 if(get_irn_mode(cond_selector) != mode_b)
327                         continue;
328
329                 /* the block must not produce any side-effects */
330                 if(get_Block_mark(lower_block))
331                         continue;
332
333                 lower_pred = get_Block_cfgpred_block(lower_block, 0);
334
335                 for(i2 = 0; i2 < n_cfgpreds; ++i2) {
336                         ir_node   *upper_block;
337                         ir_node   *upper_cf;
338                         ir_node   *upper_cond;
339                         ir_node   *upper_cond_selector;
340                         ir_node   *replacement;
341                         ir_graph  *irg;
342                         cond_pair  cpair;
343
344                         upper_cf    = get_Block_cfgpred(block, i2);
345                         upper_cf    = skip_empty_block(upper_cf);
346                         if(is_Bad(upper_cf))
347                                 continue;
348                         upper_block = get_nodes_block(upper_cf);
349                         if(upper_block != lower_pred)
350                                 continue;
351
352                         assert(is_Proj(upper_cf));
353                         upper_cond = get_Proj_pred(upper_cf);
354                         assert(is_Cond(upper_cond));
355                         upper_cond_selector = get_Cond_selector(upper_cond);
356                         if(get_irn_mode(upper_cond_selector) != mode_b)
357                                 continue;
358
359                         /* we have found the structure */
360                         /* TODO: check phis */
361                         if(!find_cond_pair(cond_selector, upper_cond_selector, &cpair))
362                                 continue;
363
364                         /* normalize pncs: we need the true case to jump into the
365                          * common block */
366                         irg = current_ir_graph;
367                         if(get_Proj_proj(lower_cf) == pn_Cond_false) {
368                                 if(cpair.proj_lo == cond_selector) {
369                                         ir_mode *mode = get_tarval_mode(cpair.tv_lo);
370                                         cpair.pnc_lo  = get_negated_pnc(cpair.pnc_lo, mode);
371                                         cpair.proj_lo = new_r_Proj(irg, lower_block,
372                                                         get_Proj_pred(cpair.proj_lo), mode_b, cpair.pnc_lo);
373                                 } else {
374                                         ir_mode *mode = get_tarval_mode(cpair.tv_hi);
375                                         assert(cpair.proj_hi == cond_selector);
376                                         cpair.pnc_hi  = get_negated_pnc(cpair.pnc_hi, mode);
377                                         cpair.proj_hi = new_r_Proj(irg, lower_block,
378                                                         get_Proj_pred(cpair.proj_hi), mode_b, cpair.pnc_hi);
379                                 }
380                         }
381                         if(get_Proj_proj(upper_cf) == pn_Cond_false) {
382                                 if(cpair.proj_lo == upper_cond_selector) {
383                                         ir_mode *mode = get_tarval_mode(cpair.tv_lo);
384                                         cpair.pnc_lo  = get_negated_pnc(cpair.pnc_lo, mode);
385                                         cpair.proj_lo = new_r_Proj(irg, upper_block,
386                                                         get_Proj_pred(cpair.proj_lo), mode_b, cpair.pnc_lo);
387                                 } else {
388                                         ir_mode *mode = get_tarval_mode(cpair.tv_hi);
389                                         assert(cpair.proj_hi == upper_cond_selector);
390                                         cpair.pnc_hi  = get_negated_pnc(cpair.pnc_hi, mode);
391                                         cpair.proj_hi = new_r_Proj(irg, upper_block,
392                                                         get_Proj_pred(cpair.proj_hi), mode_b, cpair.pnc_hi);
393                                 }
394                         }
395
396                         /* can we optimize the case? */
397                         replacement = bool_or(&cpair);
398                         if(replacement == NULL)
399                                 continue;
400
401                         /* move all nodes from lower block to upper block */
402                         exchange(lower_block, upper_block);
403
404                         set_Block_cfgpred(block, i2, new_Bad());
405
406                         /* the optimisations expected the true case to jump */
407                         if(get_Proj_proj(lower_cf) == pn_Cond_false) {
408                                 ir_node *block = get_nodes_block(replacement);
409                                 replacement    = new_rd_Not(NULL, current_ir_graph, block,
410                                                             replacement, mode_b);
411                         }
412                         set_Cond_selector(cond, replacement);
413
414                         ir_fprintf(stderr, "replaced (ub %+F)\n", upper_block);
415                         goto restart;
416                 }
417         }
418 }
419
/**
 * Run the boolean condition optimisations on a graph: first fold And/Or
 * nodes via bool_walk(), then collect per-block information and fold
 * cascaded conditional jumps via find_cf_and_or_walker().
 *
 * @param irg  the graph to optimise
 */
void opt_bool(ir_graph *const irg)
{
        /* fold And/Or of comparison pairs */
        irg_walk_graph(irg, NULL, bool_walk, NULL);

        /* the block mark is in use until clear_using_block_mark() below */
        set_using_block_mark(irg);

        /* reset block marks and Phi lists, then rebuild them */
        irg_walk_graph(irg, clear_block_infos, collect_phis, NULL);

        /* fold conditions spread over cascaded conditional jumps */
        irg_block_walk_graph(irg, NULL, find_cf_and_or_walker, NULL);

        /* flag the derived analysis information as inconsistent */
        set_irg_outs_inconsistent(irg);
        set_irg_doms_inconsistent(irg);
        set_irg_extblk_inconsistent(irg);
        set_irg_loopinfo_inconsistent(irg);

        clear_using_block_mark(irg);
}