* config/sparc/sparc.c (load_pic_register): Emit the appropriate
[official-gcc.git] / gcc / tree-ssa-pre.c
blobb6dedbcaadbaff6b267c8feaf6b78e27be024e09
1 /* SSA-PRE for trees.
2 Copyright (C) 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Daniel Berlin <dan@dberlin.org> and Steven Bosscher
4 <stevenb@suse.de>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
13 GCC is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to
20 the Free Software Foundation, 59 Temple Place - Suite 330,
21 Boston, MA 02111-1307, USA. */
23 #include "config.h"
24 #include "system.h"
25 #include "coretypes.h"
26 #include "tm.h"
27 #include "errors.h"
28 #include "ggc.h"
29 #include "tree.h"
30 #include "basic-block.h"
31 #include "diagnostic.h"
32 #include "tree-inline.h"
33 #include "tree-flow.h"
34 #include "tree-gimple.h"
35 #include "tree-dump.h"
36 #include "timevar.h"
37 #include "fibheap.h"
38 #include "hashtab.h"
39 #include "tree-iterator.h"
40 #include "real.h"
41 #include "alloc-pool.h"
42 #include "tree-pass.h"
43 #include "flags.h"
44 #include "bitmap.h"
45 #include "langhooks.h"
47 /* TODO:
49 1. Avail sets can be shared by making an avail_find_leader that
50 walks up the dominator tree and looks in those avail sets.
51 This might affect code optimality, it's unclear right now.
52 2. Load motion can be performed by value numbering the loads the
53 same as we do other expressions. This requires iterative
54 hashing the vuses into the values. Right now we simply assign
55 a new value every time we see a statement with a vuse.
56 3. Strength reduction can be performed by anticipating expressions
57 we can repair later on.
58 4. Our canonicalization of expressions during lookups don't take
59 constants into account very well. In particular, we don't fold
60 anywhere, so we can get situations where we stupidly think
61 something is a new value (a + 1 + 1 vs a + 2). This is somewhat
62 expensive to fix, but it does expose a lot more eliminations.
63 It may or not be worth it, depending on how critical you
64 consider PRE vs just plain GRE.
65 */
67 /* For ease of terminology, "expression node" in the below refers to
68 every expression node but MODIFY_EXPR, because MODIFY_EXPR's represent
69 the actual statement containing the expressions we care about, and
70 we cache the value number by putting it in the expression. */
72 /* Basic algorithm
74 First we walk the statements to generate the AVAIL sets, the
75 EXP_GEN sets, and the tmp_gen sets. EXP_GEN sets represent the
76 generation of values/expressions by a given block. We use them
77 when computing the ANTIC sets. The AVAIL sets consist of
78 SSA_NAME's that represent values, so we know what values are
79 available in what blocks. AVAIL is a forward dataflow problem. In
80 SSA, values are never killed, so we don't need a kill set, or a
81 fixpoint iteration, in order to calculate the AVAIL sets. In
82 traditional parlance, AVAIL sets tell us the downsafety of the
83 expressions/values.
85 Next, we generate the ANTIC sets. These sets represent the
86 anticipatable expressions. ANTIC is a backwards dataflow
87 problem.An expression is anticipatable in a given block if it could
88 be generated in that block. This means that if we had to perform
89 an insertion in that block, of the value of that expression, we
90 could. Calculating the ANTIC sets requires phi translation of
91 expressions, because the flow goes backwards through phis. We must
92 iterate to a fixpoint of the ANTIC sets, because we have a kill
93 set. Even in SSA form, values are not live over the entire
94 function, only from their definition point onwards. So we have to
95 remove values from the ANTIC set once we go past the definition
96 point of the leaders that make them up.
97 compute_antic/compute_antic_aux performs this computation.
99 Third, we perform insertions to make partially redundant
100 expressions fully redundant.
102 An expression is partially redundant (excluding partial
103 anticipation) if:
105 1. It is AVAIL in some, but not all, of the predecessors of a
106 given block.
107 2. It is ANTIC in all the predecessors.
109 In order to make it fully redundant, we insert the expression into
110 the predecessors where it is not available, but is ANTIC.
111 insert/insert_aux performs this insertion.
113 Fourth, we eliminate fully redundant expressions.
114 This is a simple statement walk that replaces redundant
115 calculations with the now available values. */
117 /* Representations of value numbers:
119 Value numbers are represented using the "value handle" approach.
120 This means that each SSA_NAME (and for other reasons to be
121 disclosed in a moment, expression nodes) has a value handle that
122 can be retrieved through get_value_handle. This value handle, *is*
123 the value number of the SSA_NAME. You can pointer compare the
124 value handles for equivalence purposes.
126 For debugging reasons, the value handle is internally more than
127 just a number, it is a VAR_DECL named "value.x", where x is a
128 unique number for each value number in use. This allows
129 expressions with SSA_NAMES replaced by value handles to still be
130 pretty printed in a sane way. They simply print as "value.3 *
131 value.5", etc.
133 Expression nodes have value handles associated with them as a
134 cache. Otherwise, we'd have to look them up again in the hash
135 table This makes significant difference (factor of two or more) on
136 some test cases. They can be thrown away after the pass is
137 finished. */
139 /* Representation of expressions on value numbers:
141 In some portions of this code, you will notice we allocate "fake"
142 analogues to the expression we are value numbering, and replace the
143 operands with the values of the expression. Since we work on
144 values, and not just names, we canonicalize expressions to value
145 expressions for use in the ANTIC sets, the EXP_GEN set, etc.
147 This is theoretically unnecessary, it just saves a bunch of
148 repeated get_value_handle and find_leader calls in the remainder of
149 the code, trading off temporary memory usage for speed. The tree
150 nodes aren't actually creating more garbage, since they are
151 allocated in a special pools which are thrown away at the end of
152 this pass.
154 All of this also means that if you print the EXP_GEN or ANTIC sets,
155 you will see "value.5 + value.7" in the set, instead of "a_55 +
156 b_66" or something. The only thing that actually cares about
157 seeing the value leaders is phi translation, and it needs to be
158 able to find the leader for a value in an arbitrary block, so this
159 "value expression" form is perfect for it (otherwise you'd do
160 get_value_handle->find_leader->translate->get_value_handle->find_leader).*/
163 /* Representation of sets:
165 There are currently two types of sets used, hopefully to be unified soon.
166 The AVAIL sets do not need to be sorted in any particular order,
167 and thus, are simply represented as two bitmaps, one that keeps
168 track of values present in the set, and one that keeps track of
169 expressions present in the set.
171 The other sets are represented as doubly linked lists kept in topological
172 order, with an optional supporting bitmap of values present in the
173 set. The sets represent values, and the elements can be values or
174 expressions. The elements can appear in different sets, but each
175 element can only appear once in each set.
177 Since each node in the set represents a value, we also want to be
178 able to map expression, set pairs to something that tells us
179 whether the value is present is a set. We use a per-set bitmap for
180 that. The value handles also point to a linked list of the
181 expressions they represent via a tree annotation. This is mainly
182 useful only for debugging, since we don't do identity lookups. */
185 /* A value set element. Basically a single linked list of
186 expressions/values. */
187 typedef struct value_set_node
189 /* An expression. */
190 tree expr;
192 /* A pointer to the next element of the value set. */
193 struct value_set_node *next;
194 } *value_set_node_t;
197 /* A value set. This is a singly linked list of value_set_node
198 elements with a possible bitmap that tells us what values exist in
199 the set. This set must be kept in topologically sorted order. */
200 typedef struct value_set
202 /* The head of the list. Used for iterating over the list in
203 order. */
204 value_set_node_t head;
206 /* The tail of the list. Used for tail insertions, which are
207 necessary to keep the set in topologically sorted order because
208 of how the set is built. */
209 value_set_node_t tail;
211 /* The length of the list. */
212 size_t length;
214 /* True if the set is indexed, which means it contains a backing
215 bitmap for quick determination of whether certain values exist in the
216 set. */
217 bool indexed;
219 /* The bitmap of values that exist in the set. May be NULL in an
220 empty or non-indexed set. */
221 bitmap values;
223 } *value_set_t;
226 /* An unordered bitmap set. One bitmap tracks values, the other,
227 expressions. */
228 typedef struct bitmap_set
230 bitmap expressions;
231 bitmap values;
232 } *bitmap_set_t;
234 /* Sets that we need to keep track of. */
235 typedef struct bb_value_sets
237 /* The EXP_GEN set, which represents expressions/values generated in
238 a basic block. */
239 value_set_t exp_gen;
241 /* The PHI_GEN set, which represents PHI results generated in a
242 basic block. */
243 bitmap_set_t phi_gen;
245 /* The TMP_GEN set, which represents results/temporaries generated
246 in a basic block. IE the LHS of an expression. */
247 bitmap_set_t tmp_gen;
249 /* The AVAIL_OUT set, which represents which values are available in
250 a given basic block. */
251 bitmap_set_t avail_out;
253 /* The ANTIC_IN set, which represents which values are anticiptable
254 in a given basic block. */
255 value_set_t antic_in;
257 /* The NEW_SETS set, which is used during insertion to augment the
258 AVAIL_OUT set of blocks with the new insertions performed during
259 the current iteration. */
260 bitmap_set_t new_sets;
261 } *bb_value_sets_t;
263 #define EXP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->exp_gen
264 #define PHI_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->phi_gen
265 #define TMP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->tmp_gen
266 #define AVAIL_OUT(BB) ((bb_value_sets_t) ((BB)->aux))->avail_out
267 #define ANTIC_IN(BB) ((bb_value_sets_t) ((BB)->aux))->antic_in
268 #define NEW_SETS(BB) ((bb_value_sets_t) ((BB)->aux))->new_sets
270 /* This structure is used to keep track of statistics on what
271 optimization PRE was able to perform. */
272 static struct
274 /* The number of RHS computations eliminated by PRE. */
275 int eliminations;
277 /* The number of new expressions/temporaries generated by PRE. */
278 int insertions;
280 /* The number of new PHI nodes added by PRE. */
281 int phis;
282 } pre_stats;
285 static tree bitmap_find_leader (bitmap_set_t, tree);
286 static tree find_leader (value_set_t, tree);
287 static void value_insert_into_set (value_set_t, tree);
288 static void bitmap_value_insert_into_set (bitmap_set_t, tree);
289 static void bitmap_value_replace_in_set (bitmap_set_t, tree);
290 static void insert_into_set (value_set_t, tree);
291 static void bitmap_set_copy (bitmap_set_t, bitmap_set_t);
292 static bool bitmap_set_contains_value (bitmap_set_t, tree);
293 static bitmap_set_t bitmap_set_new (void);
294 static value_set_t set_new (bool);
295 static bool is_undefined_value (tree);
296 static tree create_expression_by_pieces (basic_block, tree, tree);
299 /* We can add and remove elements and entries to and from sets
300 and hash tables, so we use alloc pools for them. */
302 static alloc_pool value_set_pool;
303 static alloc_pool bitmap_set_pool;
304 static alloc_pool value_set_node_pool;
305 static alloc_pool binary_node_pool;
306 static alloc_pool unary_node_pool;
307 static alloc_pool reference_node_pool;
308 static bitmap_obstack grand_bitmap_obstack;
310 /* Set of blocks with statements that have had its EH information
311 cleaned up. */
312 static bitmap need_eh_cleanup;
314 /* The phi_translate_table caches phi translations for a given
315 expression and predecessor. */
317 static htab_t phi_translate_table;
319 /* A three tuple {e, pred, v} used to cache phi translations in the
320 phi_translate_table. */
322 typedef struct expr_pred_trans_d
324 /* The expression. */
325 tree e;
327 /* The predecessor block along which we translated the expression. */
328 basic_block pred;
330 /* The value that resulted from the translation. */
331 tree v;
333 /* The hashcode for the expression, pred pair. This is cached for
334 speed reasons. */
335 hashval_t hashcode;
336 } *expr_pred_trans_t;
338 /* Return the hash value for a phi translation table entry. */
340 static hashval_t
341 expr_pred_trans_hash (const void *p)
343 const expr_pred_trans_t ve = (expr_pred_trans_t) p;
344 return ve->hashcode;
347 /* Return true if two phi translation table entries are the same.
348 P1 and P2 should point to the expr_pred_trans_t's to be compared.*/
350 static int
351 expr_pred_trans_eq (const void *p1, const void *p2)
353 const expr_pred_trans_t ve1 = (expr_pred_trans_t) p1;
354 const expr_pred_trans_t ve2 = (expr_pred_trans_t) p2;
355 basic_block b1 = ve1->pred;
356 basic_block b2 = ve2->pred;
359 /* If they are not translations for the same basic block, they can't
360 be equal. */
361 if (b1 != b2)
362 return false;
364 /* If they are for the same basic block, determine if the
365 expressions are equal. */
366 if (expressions_equal_p (ve1->e, ve2->e))
367 return true;
369 return false;
372 /* Search in the phi translation table for the translation of
373 expression E in basic block PRED. Return the translated value, if
374 found, NULL otherwise. */
376 static inline tree
377 phi_trans_lookup (tree e, basic_block pred)
379 void **slot;
380 struct expr_pred_trans_d ept;
381 ept.e = e;
382 ept.pred = pred;
383 ept.hashcode = vn_compute (e, (unsigned long) pred, NULL);
384 slot = htab_find_slot_with_hash (phi_translate_table, &ept, ept.hashcode,
385 NO_INSERT);
386 if (!slot)
387 return NULL;
388 else
389 return ((expr_pred_trans_t) *slot)->v;
393 /* Add the tuple mapping from {expression E, basic block PRED} to
394 value V, to the phi translation table. */
396 static inline void
397 phi_trans_add (tree e, tree v, basic_block pred)
399 void **slot;
400 expr_pred_trans_t new_pair = xmalloc (sizeof (*new_pair));
401 new_pair->e = e;
402 new_pair->pred = pred;
403 new_pair->v = v;
404 new_pair->hashcode = vn_compute (e, (unsigned long) pred, NULL);
405 slot = htab_find_slot_with_hash (phi_translate_table, new_pair,
406 new_pair->hashcode, INSERT);
407 if (*slot)
408 free (*slot);
409 *slot = (void *) new_pair;
413 /* Add expression E to the expression set of value V. */
415 void
416 add_to_value (tree v, tree e)
418 /* Constants have no expression sets. */
419 if (is_gimple_min_invariant (v))
420 return;
422 if (VALUE_HANDLE_EXPR_SET (v) == NULL)
423 VALUE_HANDLE_EXPR_SET (v) = set_new (false);
425 insert_into_set (VALUE_HANDLE_EXPR_SET (v), e);
429 /* Return true if value V exists in the bitmap for SET. */
431 static inline bool
432 value_exists_in_set_bitmap (value_set_t set, tree v)
434 if (!set->values)
435 return false;
437 return bitmap_bit_p (set->values, VALUE_HANDLE_ID (v));
441 /* Remove value V from the bitmap for SET. */
443 static void
444 value_remove_from_set_bitmap (value_set_t set, tree v)
446 gcc_assert (set->indexed);
448 if (!set->values)
449 return;
451 bitmap_clear_bit (set->values, VALUE_HANDLE_ID (v));
455 /* Insert the value number V into the bitmap of values existing in
456 SET. */
458 static inline void
459 value_insert_into_set_bitmap (value_set_t set, tree v)
461 gcc_assert (set->indexed);
463 if (set->values == NULL)
464 set->values = BITMAP_ALLOC (&grand_bitmap_obstack);
466 bitmap_set_bit (set->values, VALUE_HANDLE_ID (v));
470 /* Create a new bitmap set and return it. */
472 static bitmap_set_t
473 bitmap_set_new (void)
475 bitmap_set_t ret = pool_alloc (bitmap_set_pool);
476 ret->expressions = BITMAP_ALLOC (&grand_bitmap_obstack);
477 ret->values = BITMAP_ALLOC (&grand_bitmap_obstack);
478 return ret;
481 /* Create a new set. */
483 static value_set_t
484 set_new (bool indexed)
486 value_set_t ret;
487 ret = pool_alloc (value_set_pool);
488 ret->head = ret->tail = NULL;
489 ret->length = 0;
490 ret->indexed = indexed;
491 ret->values = NULL;
492 return ret;
495 /* Insert an expression EXPR into a bitmapped set. */
497 static void
498 bitmap_insert_into_set (bitmap_set_t set, tree expr)
500 tree val;
501 /* XXX: For now, we only let SSA_NAMES into the bitmap sets. */
502 gcc_assert (TREE_CODE (expr) == SSA_NAME);
503 val = get_value_handle (expr);
505 gcc_assert (val);
506 if (!is_gimple_min_invariant (val))
508 bitmap_set_bit (set->values, VALUE_HANDLE_ID (val));
509 bitmap_set_bit (set->expressions, SSA_NAME_VERSION (expr));
513 /* Insert EXPR into SET. */
515 static void
516 insert_into_set (value_set_t set, tree expr)
518 value_set_node_t newnode = pool_alloc (value_set_node_pool);
519 tree val = get_value_handle (expr);
520 gcc_assert (val);
522 if (is_gimple_min_invariant (val))
523 return;
525 /* For indexed sets, insert the value into the set value bitmap.
526 For all sets, add it to the linked list and increment the list
527 length. */
528 if (set->indexed)
529 value_insert_into_set_bitmap (set, val);
531 newnode->next = NULL;
532 newnode->expr = expr;
533 set->length ++;
534 if (set->head == NULL)
536 set->head = set->tail = newnode;
538 else
540 set->tail->next = newnode;
541 set->tail = newnode;
545 /* Copy a bitmapped set ORIG, into bitmapped set DEST. */
547 static void
548 bitmap_set_copy (bitmap_set_t dest, bitmap_set_t orig)
550 bitmap_copy (dest->expressions, orig->expressions);
551 bitmap_copy (dest->values, orig->values);
554 /* Copy the set ORIG to the set DEST. */
556 static void
557 set_copy (value_set_t dest, value_set_t orig)
559 value_set_node_t node;
561 if (!orig || !orig->head)
562 return;
564 for (node = orig->head;
565 node;
566 node = node->next)
568 insert_into_set (dest, node->expr);
572 /* Remove EXPR from SET. */
574 static void
575 set_remove (value_set_t set, tree expr)
577 value_set_node_t node, prev;
579 /* Remove the value of EXPR from the bitmap, decrement the set
580 length, and remove it from the actual double linked list. */
581 value_remove_from_set_bitmap (set, get_value_handle (expr));
582 set->length--;
583 prev = NULL;
584 for (node = set->head;
585 node != NULL;
586 prev = node, node = node->next)
588 if (node->expr == expr)
590 if (prev == NULL)
591 set->head = node->next;
592 else
593 prev->next= node->next;
595 if (node == set->tail)
596 set->tail = prev;
597 pool_free (value_set_node_pool, node);
598 return;
603 /* Return true if SET contains the value VAL. */
605 static bool
606 set_contains_value (value_set_t set, tree val)
608 /* All constants are in every set. */
609 if (is_gimple_min_invariant (val))
610 return true;
612 if (set->length == 0)
613 return false;
615 return value_exists_in_set_bitmap (set, val);
618 /* Return true if bitmapped set SET contains the expression EXPR. */
619 static bool
620 bitmap_set_contains (bitmap_set_t set, tree expr)
622 /* All constants are in every set. */
623 if (is_gimple_min_invariant (get_value_handle (expr)))
624 return true;
626 /* XXX: Bitmapped sets only contain SSA_NAME's for now. */
627 if (TREE_CODE (expr) != SSA_NAME)
628 return false;
629 return bitmap_bit_p (set->expressions, SSA_NAME_VERSION (expr));
633 /* Return true if bitmapped set SET contains the value VAL. */
635 static bool
636 bitmap_set_contains_value (bitmap_set_t set, tree val)
638 if (is_gimple_min_invariant (val))
639 return true;
640 return bitmap_bit_p (set->values, VALUE_HANDLE_ID (val));
643 /* Replace an instance of value LOOKFOR with expression EXPR in SET. */
645 static void
646 bitmap_set_replace_value (bitmap_set_t set, tree lookfor, tree expr)
648 value_set_t exprset;
649 value_set_node_t node;
650 if (is_gimple_min_invariant (lookfor))
651 return;
652 if (!bitmap_set_contains_value (set, lookfor))
653 return;
655 /* The number of expressions having a given value is usually
656 significantly less than the total number of expressions in SET.
657 Thus, rather than check, for each expression in SET, whether it
658 has the value LOOKFOR, we walk the reverse mapping that tells us
659 what expressions have a given value, and see if any of those
660 expressions are in our set. For large testcases, this is about
661 5-10x faster than walking the bitmap. If this is somehow a
662 significant lose for some cases, we can choose which set to walk
663 based on the set size. */
664 exprset = VALUE_HANDLE_EXPR_SET (lookfor);
665 for (node = exprset->head; node; node = node->next)
667 if (TREE_CODE (node->expr) == SSA_NAME)
669 if (bitmap_bit_p (set->expressions, SSA_NAME_VERSION (node->expr)))
671 bitmap_clear_bit (set->expressions, SSA_NAME_VERSION (node->expr));
672 bitmap_set_bit (set->expressions, SSA_NAME_VERSION (expr));
673 return;
679 /* Subtract bitmapped set B from value set A, and return the new set. */
681 static value_set_t
682 bitmap_set_subtract_from_value_set (value_set_t a, bitmap_set_t b,
683 bool indexed)
685 value_set_t ret = set_new (indexed);
686 value_set_node_t node;
687 for (node = a->head;
688 node;
689 node = node->next)
691 if (!bitmap_set_contains (b, node->expr))
692 insert_into_set (ret, node->expr);
694 return ret;
697 /* Return true if two sets are equal. */
699 static bool
700 set_equal (value_set_t a, value_set_t b)
702 value_set_node_t node;
704 if (a->length != b->length)
705 return false;
706 for (node = a->head;
707 node;
708 node = node->next)
710 if (!set_contains_value (b, get_value_handle (node->expr)))
711 return false;
713 return true;
716 /* Replace an instance of EXPR's VALUE with EXPR in SET if it exists,
717 and add it otherwise. */
719 static void
720 bitmap_value_replace_in_set (bitmap_set_t set, tree expr)
722 tree val = get_value_handle (expr);
723 if (bitmap_set_contains_value (set, val))
724 bitmap_set_replace_value (set, val, expr);
725 else
726 bitmap_insert_into_set (set, expr);
729 /* Insert EXPR into SET if EXPR's value is not already present in
730 SET. */
732 static void
733 bitmap_value_insert_into_set (bitmap_set_t set, tree expr)
735 tree val = get_value_handle (expr);
737 if (is_gimple_min_invariant (val))
738 return;
740 if (!bitmap_set_contains_value (set, val))
741 bitmap_insert_into_set (set, expr);
744 /* Insert the value for EXPR into SET, if it doesn't exist already. */
746 static void
747 value_insert_into_set (value_set_t set, tree expr)
749 tree val = get_value_handle (expr);
751 /* Constant and invariant values exist everywhere, and thus,
752 actually keeping them in the sets is pointless. */
753 if (is_gimple_min_invariant (val))
754 return;
756 if (!set_contains_value (set, val))
757 insert_into_set (set, expr);
761 /* Print out SET to OUTFILE. */
763 static void
764 bitmap_print_value_set (FILE *outfile, bitmap_set_t set,
765 const char *setname, int blockindex)
767 fprintf (outfile, "%s[%d] := { ", setname, blockindex);
768 if (set)
770 bool first = true;
771 unsigned i;
772 bitmap_iterator bi;
774 EXECUTE_IF_SET_IN_BITMAP (set->expressions, 0, i, bi)
776 if (!first)
777 fprintf (outfile, ", ");
778 first = false;
779 print_generic_expr (outfile, ssa_name (i), 0);
781 fprintf (outfile, " (");
782 print_generic_expr (outfile, get_value_handle (ssa_name (i)), 0);
783 fprintf (outfile, ") ");
786 fprintf (outfile, " }\n");
788 /* Print out the value_set SET to OUTFILE. */
790 static void
791 print_value_set (FILE *outfile, value_set_t set,
792 const char *setname, int blockindex)
794 value_set_node_t node;
795 fprintf (outfile, "%s[%d] := { ", setname, blockindex);
796 if (set)
798 for (node = set->head;
799 node;
800 node = node->next)
802 print_generic_expr (outfile, node->expr, 0);
804 fprintf (outfile, " (");
805 print_generic_expr (outfile, get_value_handle (node->expr), 0);
806 fprintf (outfile, ") ");
808 if (node->next)
809 fprintf (outfile, ", ");
813 fprintf (outfile, " }\n");
816 /* Print out the expressions that have VAL to OUTFILE. */
818 void
819 print_value_expressions (FILE *outfile, tree val)
821 if (VALUE_HANDLE_EXPR_SET (val))
823 char s[10];
824 sprintf (s, "VH.%04d", VALUE_HANDLE_ID (val));
825 print_value_set (outfile, VALUE_HANDLE_EXPR_SET (val), s, 0);
830 void
831 debug_value_expressions (tree val)
833 print_value_expressions (stderr, val);
837 void debug_value_set (value_set_t, const char *, int);
839 void
840 debug_value_set (value_set_t set, const char *setname, int blockindex)
842 print_value_set (stderr, set, setname, blockindex);
845 /* Translate EXPR using phis in PHIBLOCK, so that it has the values of
846 the phis in PRED. Return NULL if we can't find a leader for each
847 part of the translated expression. */
849 static tree
850 phi_translate (tree expr, value_set_t set, basic_block pred,
851 basic_block phiblock)
853 tree phitrans = NULL;
854 tree oldexpr = expr;
856 if (expr == NULL)
857 return NULL;
859 if (is_gimple_min_invariant (expr))
860 return expr;
862 /* Phi translations of a given expression don't change. */
863 phitrans = phi_trans_lookup (expr, pred);
864 if (phitrans)
865 return phitrans;
867 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
869 case tcc_reference:
870 /* XXX: Until we have PRE of loads working, none will be ANTIC. */
871 return NULL;
873 case tcc_binary:
875 tree oldop1 = TREE_OPERAND (expr, 0);
876 tree oldop2 = TREE_OPERAND (expr, 1);
877 tree newop1;
878 tree newop2;
879 tree newexpr;
881 newop1 = phi_translate (find_leader (set, oldop1),
882 set, pred, phiblock);
883 if (newop1 == NULL)
884 return NULL;
885 newop2 = phi_translate (find_leader (set, oldop2),
886 set, pred, phiblock);
887 if (newop2 == NULL)
888 return NULL;
889 if (newop1 != oldop1 || newop2 != oldop2)
891 newexpr = pool_alloc (binary_node_pool);
892 memcpy (newexpr, expr, tree_size (expr));
893 create_tree_ann (newexpr);
894 TREE_OPERAND (newexpr, 0) = newop1 == oldop1 ? oldop1 : get_value_handle (newop1);
895 TREE_OPERAND (newexpr, 1) = newop2 == oldop2 ? oldop2 : get_value_handle (newop2);
896 vn_lookup_or_add (newexpr, NULL);
897 expr = newexpr;
898 phi_trans_add (oldexpr, newexpr, pred);
901 return expr;
903 case tcc_unary:
905 tree oldop1 = TREE_OPERAND (expr, 0);
906 tree newop1;
907 tree newexpr;
909 newop1 = phi_translate (find_leader (set, oldop1),
910 set, pred, phiblock);
911 if (newop1 == NULL)
912 return NULL;
913 if (newop1 != oldop1)
915 newexpr = pool_alloc (unary_node_pool);
916 memcpy (newexpr, expr, tree_size (expr));
917 create_tree_ann (newexpr);
918 TREE_OPERAND (newexpr, 0) = get_value_handle (newop1);
919 vn_lookup_or_add (newexpr, NULL);
920 expr = newexpr;
921 phi_trans_add (oldexpr, newexpr, pred);
924 return expr;
926 case tcc_exceptional:
928 tree phi = NULL;
929 edge e;
930 gcc_assert (TREE_CODE (expr) == SSA_NAME);
931 if (TREE_CODE (SSA_NAME_DEF_STMT (expr)) == PHI_NODE)
932 phi = SSA_NAME_DEF_STMT (expr);
933 else
934 return expr;
936 e = find_edge (pred, bb_for_stmt (phi));
937 if (e)
939 if (is_undefined_value (PHI_ARG_DEF (phi, e->dest_idx)))
940 return NULL;
941 vn_lookup_or_add (PHI_ARG_DEF (phi, e->dest_idx), NULL);
942 return PHI_ARG_DEF (phi, e->dest_idx);
945 return expr;
947 default:
948 gcc_unreachable ();
952 static void
953 phi_translate_set (value_set_t dest, value_set_t set, basic_block pred,
954 basic_block phiblock)
956 value_set_node_t node;
957 for (node = set->head;
958 node;
959 node = node->next)
961 tree translated;
962 translated = phi_translate (node->expr, set, pred, phiblock);
963 phi_trans_add (node->expr, translated, pred);
965 if (translated != NULL)
966 value_insert_into_set (dest, translated);
970 /* Find the leader for a value (i.e., the name representing that
971 value) in a given set, and return it. Return NULL if no leader is
972 found. */
974 static tree
975 bitmap_find_leader (bitmap_set_t set, tree val)
977 if (val == NULL)
978 return NULL;
980 if (is_gimple_min_invariant (val))
981 return val;
982 if (bitmap_set_contains_value (set, val))
984 /* Rather than walk the entire bitmap of expressions, and see
985 whether any of them has the value we are looking for, we look
986 at the reverse mapping, which tells us the set of expressions
987 that have a given value (IE value->expressions with that
988 value) and see if any of those expressions are in our set.
989 The number of expressions per value is usually significantly
990 less than the number of expressions in the set. In fact, for
991 large testcases, doing it this way is roughly 5-10x faster
992 than walking the bitmap.
993 If this is somehow a significant lose for some cases, we can
994 choose which set to walk based on which set is smaller. */
995 value_set_t exprset;
996 value_set_node_t node;
997 exprset = VALUE_HANDLE_EXPR_SET (val);
998 for (node = exprset->head; node; node = node->next)
1000 if (TREE_CODE (node->expr) == SSA_NAME)
1002 if (bitmap_bit_p (set->expressions,
1003 SSA_NAME_VERSION (node->expr)))
1004 return node->expr;
1008 return NULL;
1012 /* Find the leader for a value (i.e., the name representing that
1013 value) in a given set, and return it. Return NULL if no leader is
1014 found. */
1016 static tree
1017 find_leader (value_set_t set, tree val)
1019 value_set_node_t node;
1021 if (val == NULL)
1022 return NULL;
1024 /* Constants represent themselves. */
1025 if (is_gimple_min_invariant (val))
1026 return val;
1028 if (set->length == 0)
1029 return NULL;
1031 if (value_exists_in_set_bitmap (set, val))
1033 for (node = set->head;
1034 node;
1035 node = node->next)
1037 if (get_value_handle (node->expr) == val)
1038 return node->expr;
1042 return NULL;
1045 /* Determine if the expression EXPR is valid in SET. This means that
1046 we have a leader for each part of the expression (if it consists of
1047 values), or the expression is an SSA_NAME.
1049 NB: We never should run into a case where we have SSA_NAME +
1050 SSA_NAME or SSA_NAME + value. The sets valid_in_set is called on,
1051 the ANTIC sets, will only ever have SSA_NAME's or binary value
1052 expression (IE VALUE1 + VALUE2) */
1054 static bool
1055 valid_in_set (value_set_t set, tree expr)
1057 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
1059 case tcc_binary:
1061 tree op1 = TREE_OPERAND (expr, 0);
1062 tree op2 = TREE_OPERAND (expr, 1);
1063 return set_contains_value (set, op1) && set_contains_value (set, op2);
1066 case tcc_unary:
1068 tree op1 = TREE_OPERAND (expr, 0);
1069 return set_contains_value (set, op1);
1072 case tcc_reference:
1073 /* XXX: Until PRE of loads works, no reference nodes are ANTIC. */
1074 return false;
1076 case tcc_exceptional:
1077 gcc_assert (TREE_CODE (expr) == SSA_NAME);
1078 return true;
1080 default:
1081 /* No other cases should be encountered. */
1082 gcc_unreachable ();
1086 /* Clean the set of expressions that are no longer valid in SET. This
1087 means expressions that are made up of values we have no leaders for
1088 in SET. */
1090 static void
1091 clean (value_set_t set)
1093 value_set_node_t node;
1094 value_set_node_t next;
1095 node = set->head;
1096 while (node)
1098 next = node->next;
1099 if (!valid_in_set (set, node->expr))
1100 set_remove (set, node->expr);
1101 node = next;
1105 DEF_VEC_MALLOC_P (basic_block);
1107 /* Compute the ANTIC set for BLOCK.
1109 If succs(BLOCK) > 1 then
1110 ANTIC_OUT[BLOCK] = intersection of ANTIC_IN[b] for all succ(BLOCK)
1111 else if succs(BLOCK) == 1 then
1112 ANTIC_OUT[BLOCK] = phi_translate (ANTIC_IN[succ(BLOCK)])
1114 ANTIC_IN[BLOCK] = clean(ANTIC_OUT[BLOCK] U EXP_GEN[BLOCK] - TMP_GEN[BLOCK])
1116 XXX: It would be nice to either write a set_clear, and use it for
1117 ANTIC_OUT, or to mark the antic_out set as deleted at the end
1118 of this routine, so that the pool can hand the same memory back out
1119 again for the next ANTIC_OUT. */
1121 static bool
1122 compute_antic_aux (basic_block block, bool block_has_abnormal_pred_edge)
1124 bool changed = false;
1125 value_set_t S, old, ANTIC_OUT;
1126 value_set_node_t node;
1128 ANTIC_OUT = S = NULL;
1130 /* If any edges from predecessors are abnormal, antic_in is empty,
1131 so do nothing. */
1132 if (block_has_abnormal_pred_edge)
1133 goto maybe_dump_sets;
1135 old = set_new (false);
1136 set_copy (old, ANTIC_IN (block));
1137 ANTIC_OUT = set_new (true);
1139 /* If the block has no successors, ANTIC_OUT is empty. */
1140 if (EDGE_COUNT (block->succs) == 0)
1142 /* If we have one successor, we could have some phi nodes to
1143 translate through. */
1144 else if (EDGE_COUNT (block->succs) == 1)
1146 phi_translate_set (ANTIC_OUT, ANTIC_IN(EDGE_SUCC (block, 0)->dest),
1147 block, EDGE_SUCC (block, 0)->dest);
1149 /* If we have multiple successors, we take the intersection of all of
1150 them. */
1151 else
1153 VEC (basic_block) * worklist;
1154 edge e;
1155 size_t i;
1156 basic_block bprime, first;
1157 edge_iterator ei;
1159 worklist = VEC_alloc (basic_block, 2);
1160 FOR_EACH_EDGE (e, ei, block->succs)
1161 VEC_safe_push (basic_block, worklist, e->dest);
1162 first = VEC_index (basic_block, worklist, 0);
1163 set_copy (ANTIC_OUT, ANTIC_IN (first));
1165 for (i = 1; VEC_iterate (basic_block, worklist, i, bprime); i++)
1167 node = ANTIC_OUT->head;
1168 while (node)
1170 tree val;
1171 value_set_node_t next = node->next;
1172 val = get_value_handle (node->expr);
1173 if (!set_contains_value (ANTIC_IN (bprime), val))
1174 set_remove (ANTIC_OUT, node->expr);
1175 node = next;
1178 VEC_free (basic_block, worklist);
1181 /* Generate ANTIC_OUT - TMP_GEN. */
1182 S = bitmap_set_subtract_from_value_set (ANTIC_OUT, TMP_GEN (block), false);
1184 /* Start ANTIC_IN with EXP_GEN - TMP_GEN */
1185 ANTIC_IN (block) = bitmap_set_subtract_from_value_set (EXP_GEN (block),
1186 TMP_GEN (block),
1187 true);
1189 /* Then union in the ANTIC_OUT - TMP_GEN values,
1190 to get ANTIC_OUT U EXP_GEN - TMP_GEN */
1191 for (node = S->head; node; node = node->next)
1192 value_insert_into_set (ANTIC_IN (block), node->expr);
1194 clean (ANTIC_IN (block));
1195 if (!set_equal (old, ANTIC_IN (block)))
1196 changed = true;
1198 maybe_dump_sets:
1199 if (dump_file && (dump_flags & TDF_DETAILS))
1201 if (ANTIC_OUT)
1202 print_value_set (dump_file, ANTIC_OUT, "ANTIC_OUT", block->index);
1203 print_value_set (dump_file, ANTIC_IN (block), "ANTIC_IN", block->index);
1204 if (S)
1205 print_value_set (dump_file, S, "S", block->index);
1208 return changed;
1211 /* Compute ANTIC sets. Iterates until fixpointed. */
1213 static void
1214 compute_antic (void)
1216 bool changed= true;
1217 int num_iterations = 0;
1218 basic_block block, *worklist;
1219 size_t sp = 0;
1220 sbitmap has_abnormal_preds;
1222 /* If any predecessor edges are abnormal, we punt, so antic_in is empty.
1223 We pre-build the map of blocks with incoming abnormal edges here. */
1224 has_abnormal_preds = sbitmap_alloc (last_basic_block);
1225 sbitmap_zero (has_abnormal_preds);
1226 FOR_EACH_BB (block)
1228 edge_iterator ei;
1229 edge e;
1231 FOR_EACH_EDGE (e, ei, block->preds)
1232 if (e->flags & EDGE_ABNORMAL)
1234 SET_BIT (has_abnormal_preds, block->index);
1235 break;
1238 /* While we are here, give empty ANTIC_IN sets to each block. */
1239 ANTIC_IN (block) = set_new (true);
1241 /* At the exit block we anticipate nothing. */
1242 ANTIC_IN (EXIT_BLOCK_PTR) = set_new (true);
1244 /* Allocate the worklist. */
1245 worklist = xmalloc (sizeof (basic_block) * n_basic_blocks);
1247 /* Loop until fixpointed. */
1248 while (changed)
1250 basic_block son, bb;
1252 changed = false;
1253 num_iterations++;
1255 /* Seed the algorithm by putting post-dominator children of
1256 the exit block in the worklist. */
1257 for (son = first_dom_son (CDI_POST_DOMINATORS, EXIT_BLOCK_PTR);
1258 son;
1259 son = next_dom_son (CDI_POST_DOMINATORS, son))
1260 worklist[sp++] = son;
1262 /* Now visit all blocks in a DFS of the post dominator tree. */
1263 while (sp)
1265 bool bb_has_abnormal_pred;
1267 bb = worklist[--sp];
1268 bb_has_abnormal_pred = TEST_BIT (has_abnormal_preds, bb->index);
1269 changed |= compute_antic_aux (bb, bb_has_abnormal_pred);
1271 for (son = first_dom_son (CDI_POST_DOMINATORS, bb);
1272 son;
1273 son = next_dom_son (CDI_POST_DOMINATORS, son))
1274 worklist[sp++] = son;
1278 free (worklist);
1279 sbitmap_free (has_abnormal_preds);
1281 if (dump_file && (dump_flags & TDF_STATS))
1282 fprintf (dump_file, "compute_antic required %d iterations\n", num_iterations);
1286 /* Find a leader for an expression, or generate one using
1287 create_expression_by_pieces if it's ANTIC but
1288 complex.
1289 BLOCK is the basic_block we are looking for leaders in.
1290 EXPR is the expression to find a leader or generate for.
1291 STMTS is the statement list to put the inserted expressions on.
1292 Returns the SSA_NAME of the LHS of the generated expression or the
1293 leader. */
1295 static tree
1296 find_or_generate_expression (basic_block block, tree expr, tree stmts)
1298 tree genop = bitmap_find_leader (AVAIL_OUT (block), expr);
1300 /* If it's still NULL, see if it is a complex expression, and if
1301 so, generate it recursively, otherwise, abort, because it's
1302 not really . */
1303 if (genop == NULL)
1305 genop = VALUE_HANDLE_EXPR_SET (expr)->head->expr;
1306 gcc_assert (UNARY_CLASS_P (genop)
1307 || BINARY_CLASS_P (genop)
1308 || REFERENCE_CLASS_P (genop));
1309 genop = create_expression_by_pieces (block, genop, stmts);
1311 return genop;
1315 /* Create an expression in pieces, so that we can handle very complex
1316 expressions that may be ANTIC, but not necessary GIMPLE.
1317 BLOCK is the basic block the expression will be inserted into,
1318 EXPR is the expression to insert (in value form)
1319 STMTS is a statement list to append the necessary insertions into.
1321 This function will abort if we hit some value that shouldn't be
1322 ANTIC but is (IE there is no leader for it, or its components).
1323 This function may also generate expressions that are themselves
1324 partially or fully redundant. Those that are will be either made
1325 fully redundant during the next iteration of insert (for partially
1326 redundant ones), or eliminated by eliminate (for fully redundant
1327 ones). */
1329 static tree
1330 create_expression_by_pieces (basic_block block, tree expr, tree stmts)
1332 tree name = NULL_TREE;
1333 tree newexpr = NULL_TREE;
1334 tree v;
1336 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
1338 case tcc_binary:
1340 tree_stmt_iterator tsi;
1341 tree genop1, genop2;
1342 tree temp;
1343 tree op1 = TREE_OPERAND (expr, 0);
1344 tree op2 = TREE_OPERAND (expr, 1);
1345 genop1 = find_or_generate_expression (block, op1, stmts);
1346 genop2 = find_or_generate_expression (block, op2, stmts);
1347 temp = create_tmp_var (TREE_TYPE (expr), "pretmp");
1348 add_referenced_tmp_var (temp);
1349 newexpr = build (TREE_CODE (expr), TREE_TYPE (expr),
1350 genop1, genop2);
1351 newexpr = build (MODIFY_EXPR, TREE_TYPE (expr),
1352 temp, newexpr);
1353 name = make_ssa_name (temp, newexpr);
1354 TREE_OPERAND (newexpr, 0) = name;
1355 tsi = tsi_last (stmts);
1356 tsi_link_after (&tsi, newexpr, TSI_CONTINUE_LINKING);
1357 pre_stats.insertions++;
1358 break;
1360 case tcc_unary:
1362 tree_stmt_iterator tsi;
1363 tree genop1;
1364 tree temp;
1365 tree op1 = TREE_OPERAND (expr, 0);
1366 genop1 = find_or_generate_expression (block, op1, stmts);
1367 temp = create_tmp_var (TREE_TYPE (expr), "pretmp");
1368 add_referenced_tmp_var (temp);
1369 newexpr = build (TREE_CODE (expr), TREE_TYPE (expr),
1370 genop1);
1371 newexpr = build (MODIFY_EXPR, TREE_TYPE (expr),
1372 temp, newexpr);
1373 name = make_ssa_name (temp, newexpr);
1374 TREE_OPERAND (newexpr, 0) = name;
1375 tsi = tsi_last (stmts);
1376 tsi_link_after (&tsi, newexpr, TSI_CONTINUE_LINKING);
1377 pre_stats.insertions++;
1379 break;
1381 default:
1382 gcc_unreachable ();
1385 v = get_value_handle (expr);
1386 vn_add (name, v, NULL);
1388 /* The value may already exist in either NEW_SETS, or AVAIL_OUT, because
1389 we are creating the expression by pieces, and this particular piece of
1390 the expression may have been represented. There is no harm in replacing
1391 here. */
1392 bitmap_value_replace_in_set (NEW_SETS (block), name);
1393 bitmap_value_replace_in_set (AVAIL_OUT (block), name);
1394 if (dump_file && (dump_flags & TDF_DETAILS))
1396 fprintf (dump_file, "Inserted ");
1397 print_generic_expr (dump_file, newexpr, 0);
1398 fprintf (dump_file, " in predecessor %d\n", block->index);
1400 return name;
1403 /* Insert the to-be-made-available values of NODE for each predecessor, stored
1404 in AVAIL, into the predecessors of BLOCK, and merge the result with a phi
1405 node, given the same value handle as NODE. The prefix of the phi node is
1406 given with TMPNAME*/
1408 static bool
1409 insert_into_preds_of_block (basic_block block, value_set_node_t node,
1410 tree *avail, const char *tmpname)
1412 tree val = get_value_handle (node->expr);
1413 edge pred;
1414 basic_block bprime;
1415 tree eprime;
1416 edge_iterator ei;
1417 tree type = TREE_TYPE (avail[EDGE_PRED (block, 0)->src->index]);
1418 tree temp;
1420 if (dump_file && (dump_flags & TDF_DETAILS))
1422 fprintf (dump_file, "Found partial redundancy for expression ");
1423 print_generic_expr (dump_file, node->expr, 0);
1424 fprintf (dump_file, "\n");
1427 /* Make the necessary insertions. */
1428 FOR_EACH_EDGE (pred, ei, block->preds)
1430 tree stmts = alloc_stmt_list ();
1431 tree builtexpr;
1432 bprime = pred->src;
1433 eprime = avail[bprime->index];
1434 if (BINARY_CLASS_P (eprime)
1435 || UNARY_CLASS_P (eprime))
1437 builtexpr = create_expression_by_pieces (bprime,
1438 eprime,
1439 stmts);
1440 bsi_insert_on_edge (pred, stmts);
1441 avail[bprime->index] = builtexpr;
1444 /* Now build a phi for the new variable. */
1445 temp = create_tmp_var (type, tmpname);
1446 add_referenced_tmp_var (temp);
1447 temp = create_phi_node (temp, block);
1449 FOR_EACH_EDGE (pred, ei, block->preds)
1450 add_phi_arg (temp, avail[pred->src->index], pred);
1452 vn_add (PHI_RESULT (temp), val, NULL);
1454 /* The value should *not* exist in PHI_GEN, or else we wouldn't be doing
1455 this insertion, since we test for the existence of this value in PHI_GEN
1456 before proceeding with the partial redundancy checks in insert_aux.
1458 The value may exist in AVAIL_OUT, in particular, it could be represented
1459 by the expression we are trying to eliminate, in which case we want the
1460 replacement to occur. If it's not existing in AVAIL_OUT, we want it
1461 inserted there.
1463 Similarly, to the PHI_GEN case, the value should not exist in NEW_SETS of
1464 this block, because if it did, it would have existed in our dominator's
1465 AVAIL_OUT, and would have been skipped due to the full redundancy check.
1468 bitmap_insert_into_set (PHI_GEN (block),
1469 PHI_RESULT (temp));
1470 bitmap_value_replace_in_set (AVAIL_OUT (block),
1471 PHI_RESULT (temp));
1472 bitmap_insert_into_set (NEW_SETS (block),
1473 PHI_RESULT (temp));
1475 if (dump_file && (dump_flags & TDF_DETAILS))
1477 fprintf (dump_file, "Created phi ");
1478 print_generic_expr (dump_file, temp, 0);
1479 fprintf (dump_file, " in block %d\n", block->index);
1481 pre_stats.phis++;
1482 return true;
1487 /* Perform insertion of partially redundant values.
1488 For BLOCK, do the following:
1489 1. Propagate the NEW_SETS of the dominator into the current block.
1490 If the block has multiple predecessors,
1491 2a. Iterate over the ANTIC expressions for the block to see if
1492 any of them are partially redundant.
1493 2b. If so, insert them into the necessary predecessors to make
1494 the expression fully redundant.
1495 2c. Insert a new PHI merging the values of the predecessors.
1496 2d. Insert the new PHI, and the new expressions, into the
1497 NEW_SETS set.
1498 3. Recursively call ourselves on the dominator children of BLOCK.
1502 static bool
1503 insert_aux (basic_block block)
1505 basic_block son;
1506 bool new_stuff = false;
1508 if (block)
1510 basic_block dom;
1511 dom = get_immediate_dominator (CDI_DOMINATORS, block);
1512 if (dom)
1514 unsigned i;
1515 bitmap_iterator bi;
1516 bitmap_set_t newset = NEW_SETS (dom);
1517 if (newset)
1519 /* Note that we need to value_replace both NEW_SETS, and
1520 AVAIL_OUT. For both the case of NEW_SETS, the value may be
1521 represented by some non-simple expression here that we want
1522 to replace it with. */
1523 EXECUTE_IF_SET_IN_BITMAP (newset->expressions, 0, i, bi)
1525 bitmap_value_replace_in_set (NEW_SETS (block), ssa_name (i));
1526 bitmap_value_replace_in_set (AVAIL_OUT (block), ssa_name (i));
1529 if (EDGE_COUNT (block->preds) > 1)
1531 value_set_node_t node;
1532 for (node = ANTIC_IN (block)->head;
1533 node;
1534 node = node->next)
1536 if (BINARY_CLASS_P (node->expr)
1537 || UNARY_CLASS_P (node->expr))
1539 tree *avail;
1540 tree val;
1541 bool by_some = false;
1542 bool cant_insert = false;
1543 bool all_same = true;
1544 tree first_s = NULL;
1545 edge pred;
1546 basic_block bprime;
1547 tree eprime = NULL_TREE;
1548 edge_iterator ei;
1550 val = get_value_handle (node->expr);
1551 if (bitmap_set_contains_value (PHI_GEN (block), val))
1552 continue;
1553 if (bitmap_set_contains_value (AVAIL_OUT (dom), val))
1555 if (dump_file && (dump_flags & TDF_DETAILS))
1556 fprintf (dump_file, "Found fully redundant value\n");
1557 continue;
1560 avail = xcalloc (last_basic_block, sizeof (tree));
1561 FOR_EACH_EDGE (pred, ei, block->preds)
1563 tree vprime;
1564 tree edoubleprime;
1566 /* This can happen in the very weird case
1567 that our fake infinite loop edges have caused a
1568 critical edge to appear. */
1569 if (EDGE_CRITICAL_P (pred))
1571 cant_insert = true;
1572 break;
1574 bprime = pred->src;
1575 eprime = phi_translate (node->expr,
1576 ANTIC_IN (block),
1577 bprime, block);
1579 /* eprime will generally only be NULL if the
1580 value of the expression, translated
1581 through the PHI for this predecessor, is
1582 undefined. If that is the case, we can't
1583 make the expression fully redundant,
1584 because its value is undefined along a
1585 predecessor path. We can thus break out
1586 early because it doesn't matter what the
1587 rest of the results are. */
1588 if (eprime == NULL)
1590 cant_insert = true;
1591 break;
1594 vprime = get_value_handle (eprime);
1595 gcc_assert (vprime);
1596 edoubleprime = bitmap_find_leader (AVAIL_OUT (bprime),
1597 vprime);
1598 if (edoubleprime == NULL)
1600 avail[bprime->index] = eprime;
1601 all_same = false;
1603 else
1605 avail[bprime->index] = edoubleprime;
1606 by_some = true;
1607 if (first_s == NULL)
1608 first_s = edoubleprime;
1609 else if (!operand_equal_p (first_s, edoubleprime,
1611 all_same = false;
1614 /* If we can insert it, it's not the same value
1615 already existing along every predecessor, and
1616 it's defined by some predecessor, it is
1617 partially redundant. */
1618 if (!cant_insert && !all_same && by_some)
1620 if (insert_into_preds_of_block (block, node, avail,
1621 "prephitmp"))
1622 new_stuff = true;
1625 free (avail);
1631 for (son = first_dom_son (CDI_DOMINATORS, block);
1632 son;
1633 son = next_dom_son (CDI_DOMINATORS, son))
1635 new_stuff |= insert_aux (son);
1638 return new_stuff;
1641 /* Perform insertion of partially redundant values. */
1643 static void
1644 insert (void)
1646 bool new_stuff = true;
1647 basic_block bb;
1648 int num_iterations = 0;
1650 FOR_ALL_BB (bb)
1651 NEW_SETS (bb) = bitmap_set_new ();
1653 while (new_stuff)
1655 num_iterations++;
1656 new_stuff = false;
1657 new_stuff = insert_aux (ENTRY_BLOCK_PTR);
1659 if (num_iterations > 2 && dump_file && (dump_flags & TDF_STATS))
1660 fprintf (dump_file, "insert required %d iterations\n", num_iterations);
1664 /* Return true if VAR is an SSA variable with no defining statement in
1665 this procedure, *AND* isn't a live-on-entry parameter. */
1667 static bool
1668 is_undefined_value (tree expr)
1670 return (TREE_CODE (expr) == SSA_NAME
1671 && IS_EMPTY_STMT (SSA_NAME_DEF_STMT (expr))
1672 /* PARM_DECLs and hard registers are always defined. */
1673 && TREE_CODE (SSA_NAME_VAR (expr)) != PARM_DECL);
1677 /* Given an SSA variable VAR and an expression EXPR, compute the value
1678 number for EXPR and create a value handle (VAL) for it. If VAR and
1679 EXPR are not the same, associate VAL with VAR. Finally, add VAR to
1680 S1 and its value handle to S2.
1682 VUSES represent the virtual use operands associated with EXPR (if
1683 any). They are used when computing the hash value for EXPR. */
1685 static inline void
1686 add_to_sets (tree var, tree expr, vuse_optype vuses, bitmap_set_t s1,
1687 bitmap_set_t s2)
1689 tree val = vn_lookup_or_add (expr, vuses);
1691 /* VAR and EXPR may be the same when processing statements for which
1692 we are not computing value numbers (e.g., non-assignments, or
1693 statements that make aliased stores). In those cases, we are
1694 only interested in making VAR available as its own value. */
1695 if (var != expr)
1696 vn_add (var, val, NULL);
1698 if (s1)
1699 bitmap_insert_into_set (s1, var);
1700 bitmap_value_insert_into_set (s2, var);
1704 /* Given a unary or binary expression EXPR, create and return a new
1705 expression with the same structure as EXPR but with its operands
1706 replaced with the value handles of each of the operands of EXPR.
1707 Insert EXPR's operands into the EXP_GEN set for BLOCK.
1709 VUSES represent the virtual use operands associated with EXPR (if
1710 any). They are used when computing the hash value for EXPR. */
1712 static inline tree
1713 create_value_expr_from (tree expr, basic_block block, vuse_optype vuses)
1715 int i;
1716 enum tree_code code = TREE_CODE (expr);
1717 tree vexpr;
1719 gcc_assert (TREE_CODE_CLASS (code) == tcc_unary
1720 || TREE_CODE_CLASS (code) == tcc_binary
1721 || TREE_CODE_CLASS (code) == tcc_reference);
1723 if (TREE_CODE_CLASS (code) == tcc_unary)
1724 vexpr = pool_alloc (unary_node_pool);
1725 else if (TREE_CODE_CLASS (code) == tcc_reference)
1726 vexpr = pool_alloc (reference_node_pool);
1727 else
1728 vexpr = pool_alloc (binary_node_pool);
1730 memcpy (vexpr, expr, tree_size (expr));
1732 for (i = 0; i < TREE_CODE_LENGTH (code); i++)
1734 tree op = TREE_OPERAND (expr, i);
1735 if (op != NULL)
1737 tree val = vn_lookup_or_add (op, vuses);
1738 if (!is_undefined_value (op))
1739 value_insert_into_set (EXP_GEN (block), op);
1740 if (TREE_CODE (val) == VALUE_HANDLE)
1741 TREE_TYPE (val) = TREE_TYPE (TREE_OPERAND (vexpr, i));
1742 TREE_OPERAND (vexpr, i) = val;
1746 return vexpr;
1750 /* Compute the AVAIL set for all basic blocks.
1752 This function performs value numbering of the statements in each basic
1753 block. The AVAIL sets are built from information we glean while doing
1754 this value numbering, since the AVAIL sets contain only one entry per
1755 value.
1757 AVAIL_IN[BLOCK] = AVAIL_OUT[dom(BLOCK)].
1758 AVAIL_OUT[BLOCK] = AVAIL_IN[BLOCK] U PHI_GEN[BLOCK] U TMP_GEN[BLOCK]. */
1760 static void
1761 compute_avail (void)
1763 basic_block block, son;
1764 basic_block *worklist;
1765 size_t sp = 0;
1766 tree param;
1768 /* For arguments with default definitions, we pretend they are
1769 defined in the entry block. */
1770 for (param = DECL_ARGUMENTS (current_function_decl);
1771 param;
1772 param = TREE_CHAIN (param))
1774 if (default_def (param) != NULL)
1776 tree val;
1777 tree def = default_def (param);
1778 val = vn_lookup_or_add (def, NULL);
1779 bitmap_insert_into_set (TMP_GEN (ENTRY_BLOCK_PTR), def);
1780 bitmap_value_insert_into_set (AVAIL_OUT (ENTRY_BLOCK_PTR), def);
1784 /* Allocate the worklist. */
1785 worklist = xmalloc (sizeof (basic_block) * n_basic_blocks);
1787 /* Seed the algorithm by putting the dominator children of the entry
1788 block on the worklist. */
1789 for (son = first_dom_son (CDI_DOMINATORS, ENTRY_BLOCK_PTR);
1790 son;
1791 son = next_dom_son (CDI_DOMINATORS, son))
1792 worklist[sp++] = son;
1794 /* Loop until the worklist is empty. */
1795 while (sp)
1797 block_stmt_iterator bsi;
1798 tree stmt, phi;
1799 basic_block dom;
1801 /* Pick a block from the worklist. */
1802 block = worklist[--sp];
1804 /* Initially, the set of available values in BLOCK is that of
1805 its immediate dominator. */
1806 dom = get_immediate_dominator (CDI_DOMINATORS, block);
1807 if (dom)
1808 bitmap_set_copy (AVAIL_OUT (block), AVAIL_OUT (dom));
1810 /* Generate values for PHI nodes. */
1811 for (phi = phi_nodes (block); phi; phi = PHI_CHAIN (phi))
1812 /* We have no need for virtual phis, as they don't represent
1813 actual computations. */
1814 if (is_gimple_reg (PHI_RESULT (phi)))
1815 add_to_sets (PHI_RESULT (phi), PHI_RESULT (phi), NULL,
1816 PHI_GEN (block), AVAIL_OUT (block));
1818 /* Now compute value numbers and populate value sets with all
1819 the expressions computed in BLOCK. */
1820 for (bsi = bsi_start (block); !bsi_end_p (bsi); bsi_next (&bsi))
1822 stmt_ann_t ann;
1823 size_t j;
1825 stmt = bsi_stmt (bsi);
1826 ann = stmt_ann (stmt);
1827 get_stmt_operands (stmt);
1829 /* We are only interested in assignments of the form
1830 X_i = EXPR, where EXPR represents an "interesting"
1831 computation, it has no volatile operands and X_i
1832 doesn't flow through an abnormal edge. */
1833 if (TREE_CODE (stmt) == MODIFY_EXPR
1834 && !ann->has_volatile_ops
1835 && TREE_CODE (TREE_OPERAND (stmt, 0)) == SSA_NAME
1836 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (TREE_OPERAND (stmt, 0)))
1838 tree lhs = TREE_OPERAND (stmt, 0);
1839 tree rhs = TREE_OPERAND (stmt, 1);
1840 vuse_optype vuses = STMT_VUSE_OPS (stmt);
1842 STRIP_USELESS_TYPE_CONVERSION (rhs);
1843 if (TREE_CODE (rhs) == SSA_NAME
1844 || is_gimple_min_invariant (rhs))
1846 /* Compute a value number for the RHS of the statement
1847 and add its value to the AVAIL_OUT set for the block.
1848 Add the LHS to TMP_GEN. */
1849 add_to_sets (lhs, rhs, vuses, TMP_GEN (block),
1850 AVAIL_OUT (block));
1852 if (TREE_CODE (rhs) == SSA_NAME
1853 && !is_undefined_value (rhs))
1854 value_insert_into_set (EXP_GEN (block), rhs);
1855 continue;
1857 else if (UNARY_CLASS_P (rhs) || BINARY_CLASS_P (rhs)
1858 || TREE_CODE (rhs) == INDIRECT_REF)
1860 /* For binary, unary, and reference expressions,
1861 create a duplicate expression with the operands
1862 replaced with the value handles of the original
1863 RHS. */
1864 tree newt = create_value_expr_from (rhs, block, vuses);
1865 add_to_sets (lhs, newt, vuses, TMP_GEN (block),
1866 AVAIL_OUT (block));
1867 value_insert_into_set (EXP_GEN (block), newt);
1868 continue;
1872 /* For any other statement that we don't recognize, simply
1873 make the names generated by the statement available in
1874 AVAIL_OUT and TMP_GEN. */
1875 for (j = 0; j < NUM_DEFS (STMT_DEF_OPS (stmt)); j++)
1877 tree def = DEF_OP (STMT_DEF_OPS (stmt), j);
1878 add_to_sets (def, def, NULL, TMP_GEN (block),
1879 AVAIL_OUT (block));
1882 for (j = 0; j < NUM_USES (STMT_USE_OPS (stmt)); j++)
1884 tree use = USE_OP (STMT_USE_OPS (stmt), j);
1885 add_to_sets (use, use, NULL, NULL, AVAIL_OUT (block));
1889 /* Put the dominator children of BLOCK on the worklist of blocks
1890 to compute available sets for. */
1891 for (son = first_dom_son (CDI_DOMINATORS, block);
1892 son;
1893 son = next_dom_son (CDI_DOMINATORS, son))
1894 worklist[sp++] = son;
1897 free (worklist);
1901 /* Eliminate fully redundant computations. */
1903 static void
1904 eliminate (void)
1906 basic_block b;
1908 FOR_EACH_BB (b)
1910 block_stmt_iterator i;
1912 for (i = bsi_start (b); !bsi_end_p (i); bsi_next (&i))
1914 tree stmt = bsi_stmt (i);
1916 /* Lookup the RHS of the expression, see if we have an
1917 available computation for it. If so, replace the RHS with
1918 the available computation. */
1919 if (TREE_CODE (stmt) == MODIFY_EXPR
1920 && TREE_CODE (TREE_OPERAND (stmt, 0)) == SSA_NAME
1921 && TREE_CODE (TREE_OPERAND (stmt ,1)) != SSA_NAME
1922 && !is_gimple_min_invariant (TREE_OPERAND (stmt, 1))
1923 && !stmt_ann (stmt)->has_volatile_ops)
1925 tree lhs = TREE_OPERAND (stmt, 0);
1926 tree *rhs_p = &TREE_OPERAND (stmt, 1);
1927 tree sprime;
1929 sprime = bitmap_find_leader (AVAIL_OUT (b),
1930 vn_lookup (lhs, NULL));
1931 if (sprime
1932 && sprime != lhs
1933 && (TREE_CODE (*rhs_p) != SSA_NAME
1934 || may_propagate_copy (*rhs_p, sprime)))
1936 gcc_assert (sprime != *rhs_p);
1938 if (dump_file && (dump_flags & TDF_DETAILS))
1940 fprintf (dump_file, "Replaced ");
1941 print_generic_expr (dump_file, *rhs_p, 0);
1942 fprintf (dump_file, " with ");
1943 print_generic_expr (dump_file, sprime, 0);
1944 fprintf (dump_file, " in ");
1945 print_generic_stmt (dump_file, stmt, 0);
1947 pre_stats.eliminations++;
1948 propagate_tree_value (rhs_p, sprime);
1949 modify_stmt (stmt);
1951 /* If we removed EH side effects from the statement, clean
1952 its EH information. */
1953 if (maybe_clean_eh_stmt (stmt))
1955 bitmap_set_bit (need_eh_cleanup,
1956 bb_for_stmt (stmt)->index);
1957 if (dump_file && (dump_flags & TDF_DETAILS))
1958 fprintf (dump_file, " Removed EH side effects.\n");
1967 /* Initialize data structures used by PRE. */
1969 static void
1970 init_pre (void)
1972 basic_block bb;
1974 connect_infinite_loops_to_exit ();
1975 vn_init ();
1976 memset (&pre_stats, 0, sizeof (pre_stats));
1978 /* If block 0 has more than one predecessor, it means that its PHI
1979 nodes will have arguments coming from block -1. This creates
1980 problems for several places in PRE that keep local arrays indexed
1981 by block number. To prevent this, we split the edge coming from
1982 ENTRY_BLOCK_PTR (FIXME, if ENTRY_BLOCK_PTR had an index number
1983 different than -1 we wouldn't have to hack this. tree-ssa-dce.c
1984 needs a similar change). */
1985 if (EDGE_COUNT (EDGE_SUCC (ENTRY_BLOCK_PTR, 0)->dest->preds) > 1)
1986 if (!(EDGE_SUCC (ENTRY_BLOCK_PTR, 0)->flags & EDGE_ABNORMAL))
1987 split_edge (EDGE_SUCC (ENTRY_BLOCK_PTR, 0));
1989 FOR_ALL_BB (bb)
1990 bb->aux = xcalloc (1, sizeof (struct bb_value_sets));
1992 bitmap_obstack_initialize (&grand_bitmap_obstack);
1993 phi_translate_table = htab_create (511, expr_pred_trans_hash,
1994 expr_pred_trans_eq, free);
1995 value_set_pool = create_alloc_pool ("Value sets",
1996 sizeof (struct value_set), 30);
1997 bitmap_set_pool = create_alloc_pool ("Bitmap sets",
1998 sizeof (struct bitmap_set), 30);
1999 value_set_node_pool = create_alloc_pool ("Value set nodes",
2000 sizeof (struct value_set_node), 30);
2001 calculate_dominance_info (CDI_POST_DOMINATORS);
2002 calculate_dominance_info (CDI_DOMINATORS);
2003 binary_node_pool = create_alloc_pool ("Binary tree nodes",
2004 tree_code_size (PLUS_EXPR), 30);
2005 unary_node_pool = create_alloc_pool ("Unary tree nodes",
2006 tree_code_size (NEGATE_EXPR), 30);
2007 reference_node_pool = create_alloc_pool ("Reference tree nodes",
2008 tree_code_size (ARRAY_REF), 30);
2009 FOR_ALL_BB (bb)
2011 EXP_GEN (bb) = set_new (true);
2012 PHI_GEN (bb) = bitmap_set_new ();
2013 TMP_GEN (bb) = bitmap_set_new ();
2014 AVAIL_OUT (bb) = bitmap_set_new ();
2017 need_eh_cleanup = BITMAP_XMALLOC ();
2021 /* Deallocate data structures used by PRE. */
2023 static void
2024 fini_pre (void)
2026 basic_block bb;
2027 unsigned int i;
2029 bsi_commit_edge_inserts ();
2031 bitmap_obstack_release (&grand_bitmap_obstack);
2032 free_alloc_pool (value_set_pool);
2033 free_alloc_pool (bitmap_set_pool);
2034 free_alloc_pool (value_set_node_pool);
2035 free_alloc_pool (binary_node_pool);
2036 free_alloc_pool (reference_node_pool);
2037 free_alloc_pool (unary_node_pool);
2038 htab_delete (phi_translate_table);
2039 remove_fake_exit_edges ();
2041 FOR_ALL_BB (bb)
2043 free (bb->aux);
2044 bb->aux = NULL;
2047 free_dominance_info (CDI_POST_DOMINATORS);
2048 vn_delete ();
2050 if (!bitmap_empty_p (need_eh_cleanup))
2052 tree_purge_all_dead_eh_edges (need_eh_cleanup);
2053 cleanup_tree_cfg ();
2056 BITMAP_XFREE (need_eh_cleanup);
2058 /* Wipe out pointers to VALUE_HANDLEs. In the not terribly distant
2059 future we will want them to be persistent though. */
2060 for (i = 0; i < num_ssa_names; i++)
2062 tree name = ssa_name (i);
2064 if (!name)
2065 continue;
2067 if (SSA_NAME_VALUE (name)
2068 && TREE_CODE (SSA_NAME_VALUE (name)) == VALUE_HANDLE)
2069 SSA_NAME_VALUE (name) = NULL;
2074 /* Main entry point to the SSA-PRE pass. DO_FRE is true if the caller
2075 only wants to do full redundancy elimination. */
2077 static void
2078 execute_pre (bool do_fre)
2080 init_pre ();
2082 /* Collect and value number expressions computed in each basic block. */
2083 compute_avail ();
2085 if (dump_file && (dump_flags & TDF_DETAILS))
2087 basic_block bb;
2089 FOR_ALL_BB (bb)
2091 print_value_set (dump_file, EXP_GEN (bb), "exp_gen", bb->index);
2092 bitmap_print_value_set (dump_file, TMP_GEN (bb), "tmp_gen",
2093 bb->index);
2094 bitmap_print_value_set (dump_file, AVAIL_OUT (bb), "avail_out",
2095 bb->index);
2099 /* Insert can get quite slow on an incredibly large number of basic
2100 blocks due to some quadratic behavior. Until this behavior is
2101 fixed, don't run it when he have an incredibly large number of
2102 bb's. If we aren't going to run insert, there is no point in
2103 computing ANTIC, either, even though it's plenty fast. */
2104 if (!do_fre && n_basic_blocks < 4000)
2106 compute_antic ();
2107 insert ();
2110 /* Remove all the redundant expressions. */
2111 eliminate ();
2113 if (dump_file && (dump_flags & TDF_STATS))
2115 fprintf (dump_file, "Insertions:%d\n", pre_stats.insertions);
2116 fprintf (dump_file, "New PHIs:%d\n", pre_stats.phis);
2117 fprintf (dump_file, "Eliminated:%d\n", pre_stats.eliminations);
2120 fini_pre ();
2124 /* Gate and execute functions for PRE. */
2126 static void
2127 do_pre (void)
2129 execute_pre (false);
2132 static bool
2133 gate_pre (void)
2135 return flag_tree_pre != 0;
2138 struct tree_opt_pass pass_pre =
2140 "pre", /* name */
2141 gate_pre, /* gate */
2142 do_pre, /* execute */
2143 NULL, /* sub */
2144 NULL, /* next */
2145 0, /* static_pass_number */
2146 TV_TREE_PRE, /* tv_id */
2147 PROP_no_crit_edges | PROP_cfg
2148 | PROP_ssa | PROP_alias, /* properties_required */
2149 0, /* properties_provided */
2150 0, /* properties_destroyed */
2151 0, /* todo_flags_start */
2152 TODO_dump_func | TODO_ggc_collect | TODO_verify_ssa, /* todo_flags_finish */
2153 0 /* letter */
2157 /* Gate and execute functions for FRE. */
2159 static void
2160 do_fre (void)
2162 execute_pre (true);
2165 static bool
2166 gate_fre (void)
2168 return flag_tree_fre != 0;
2171 struct tree_opt_pass pass_fre =
2173 "fre", /* name */
2174 gate_fre, /* gate */
2175 do_fre, /* execute */
2176 NULL, /* sub */
2177 NULL, /* next */
2178 0, /* static_pass_number */
2179 TV_TREE_FRE, /* tv_id */
2180 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
2181 0, /* properties_provided */
2182 0, /* properties_destroyed */
2183 0, /* todo_flags_start */
2184 TODO_dump_func | TODO_ggc_collect | TODO_verify_ssa, /* todo_flags_finish */
2185 0 /* letter */