2005-06-07 Adrian Straetling <straetling@de.ibm.com>
[official-gcc.git] / gcc / tree-ssa-pre.c
blob6ec3cdc194b975fd90c071e2b53469342d3124c5
1 /* SSA-PRE for trees.
2 Copyright (C) 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Daniel Berlin <dan@dberlin.org> and Steven Bosscher
4 <stevenb@suse.de>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
13 GCC is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to
20 the Free Software Foundation, 59 Temple Place - Suite 330,
21 Boston, MA 02111-1307, USA. */
23 #include "config.h"
24 #include "system.h"
25 #include "coretypes.h"
26 #include "tm.h"
27 #include "ggc.h"
28 #include "tree.h"
29 #include "basic-block.h"
30 #include "diagnostic.h"
31 #include "tree-inline.h"
32 #include "tree-flow.h"
33 #include "tree-gimple.h"
34 #include "tree-dump.h"
35 #include "timevar.h"
36 #include "fibheap.h"
37 #include "hashtab.h"
38 #include "tree-iterator.h"
39 #include "real.h"
40 #include "alloc-pool.h"
41 #include "tree-pass.h"
42 #include "flags.h"
43 #include "bitmap.h"
44 #include "langhooks.h"
45 #include "cfgloop.h"
47 /* TODO:
49 1. Avail sets can be shared by making an avail_find_leader that
50 walks up the dominator tree and looks in those avail sets.
51 This might affect code optimality, it's unclear right now.
52 2. Load motion can be performed by value numbering the loads the
53 same as we do other expressions. This requires iterative
54 hashing the vuses into the values. Right now we simply assign
55 a new value every time we see a statement with a vuse.
56 3. Strength reduction can be performed by anticipating expressions
57 we can repair later on.
58 4. We can do back-substitution or smarter value numbering to catch
59 commutative expressions split up over multiple statements.
60 */
62 /* For ease of terminology, "expression node" in the below refers to
63 every expression node but MODIFY_EXPR, because MODIFY_EXPR's represent
64 the actual statement containing the expressions we care about, and
65 we cache the value number by putting it in the expression. */
67 /* Basic algorithm
69 First we walk the statements to generate the AVAIL sets, the
70 EXP_GEN sets, and the tmp_gen sets. EXP_GEN sets represent the
71 generation of values/expressions by a given block. We use them
72 when computing the ANTIC sets. The AVAIL sets consist of
73 SSA_NAME's that represent values, so we know what values are
74 available in what blocks. AVAIL is a forward dataflow problem. In
75 SSA, values are never killed, so we don't need a kill set, or a
76 fixpoint iteration, in order to calculate the AVAIL sets. In
77 traditional parlance, AVAIL sets tell us the downsafety of the
78 expressions/values.
80 Next, we generate the ANTIC sets. These sets represent the
81 anticipatable expressions. ANTIC is a backwards dataflow
82 problem.An expression is anticipatable in a given block if it could
83 be generated in that block. This means that if we had to perform
84 an insertion in that block, of the value of that expression, we
85 could. Calculating the ANTIC sets requires phi translation of
86 expressions, because the flow goes backwards through phis. We must
87 iterate to a fixpoint of the ANTIC sets, because we have a kill
88 set. Even in SSA form, values are not live over the entire
89 function, only from their definition point onwards. So we have to
90 remove values from the ANTIC set once we go past the definition
91 point of the leaders that make them up.
92 compute_antic/compute_antic_aux performs this computation.
94 Third, we perform insertions to make partially redundant
95 expressions fully redundant.
97 An expression is partially redundant (excluding partial
98 anticipation) if:
100 1. It is AVAIL in some, but not all, of the predecessors of a
101 given block.
102 2. It is ANTIC in all the predecessors.
104 In order to make it fully redundant, we insert the expression into
105 the predecessors where it is not available, but is ANTIC.
106 insert/insert_aux performs this insertion.
108 Fourth, we eliminate fully redundant expressions.
109 This is a simple statement walk that replaces redundant
110 calculations with the now available values. */
112 /* Representations of value numbers:
114 Value numbers are represented using the "value handle" approach.
115 This means that each SSA_NAME (and for other reasons to be
116 disclosed in a moment, expression nodes) has a value handle that
117 can be retrieved through get_value_handle. This value handle, *is*
118 the value number of the SSA_NAME. You can pointer compare the
119 value handles for equivalence purposes.
121 For debugging reasons, the value handle is internally more than
122 just a number, it is a VAR_DECL named "value.x", where x is a
123 unique number for each value number in use. This allows
124 expressions with SSA_NAMES replaced by value handles to still be
125 pretty printed in a sane way. They simply print as "value.3 *
126 value.5", etc.
128 Expression nodes have value handles associated with them as a
129 cache. Otherwise, we'd have to look them up again in the hash
130 table This makes significant difference (factor of two or more) on
131 some test cases. They can be thrown away after the pass is
132 finished. */
134 /* Representation of expressions on value numbers:
136 In some portions of this code, you will notice we allocate "fake"
137 analogues to the expression we are value numbering, and replace the
138 operands with the values of the expression. Since we work on
139 values, and not just names, we canonicalize expressions to value
140 expressions for use in the ANTIC sets, the EXP_GEN set, etc.
142 This is theoretically unnecessary, it just saves a bunch of
143 repeated get_value_handle and find_leader calls in the remainder of
144 the code, trading off temporary memory usage for speed. The tree
145 nodes aren't actually creating more garbage, since they are
146 allocated in a special pools which are thrown away at the end of
147 this pass.
149 All of this also means that if you print the EXP_GEN or ANTIC sets,
150 you will see "value.5 + value.7" in the set, instead of "a_55 +
151 b_66" or something. The only thing that actually cares about
152 seeing the value leaders is phi translation, and it needs to be
153 able to find the leader for a value in an arbitrary block, so this
154 "value expression" form is perfect for it (otherwise you'd do
155 get_value_handle->find_leader->translate->get_value_handle->find_leader).*/
158 /* Representation of sets:
160 There are currently two types of sets used, hopefully to be unified soon.
161 The AVAIL sets do not need to be sorted in any particular order,
162 and thus, are simply represented as two bitmaps, one that keeps
163 track of values present in the set, and one that keeps track of
164 expressions present in the set.
166 The other sets are represented as doubly linked lists kept in topological
167 order, with an optional supporting bitmap of values present in the
168 set. The sets represent values, and the elements can be values or
169 expressions. The elements can appear in different sets, but each
170 element can only appear once in each set.
172 Since each node in the set represents a value, we also want to be
173 able to map expression, set pairs to something that tells us
174 whether the value is present is a set. We use a per-set bitmap for
175 that. The value handles also point to a linked list of the
176 expressions they represent via a tree annotation. This is mainly
177 useful only for debugging, since we don't do identity lookups. */
180 static bool in_fre = false;
182 /* A value set element. Basically a single linked list of
183 expressions/values. */
184 typedef struct value_set_node
186 /* An expression. */
187 tree expr;
189 /* A pointer to the next element of the value set. */
190 struct value_set_node *next;
191 } *value_set_node_t;
194 /* A value set. This is a singly linked list of value_set_node
195 elements with a possible bitmap that tells us what values exist in
196 the set. This set must be kept in topologically sorted order. */
197 typedef struct value_set
199 /* The head of the list. Used for iterating over the list in
200 order. */
201 value_set_node_t head;
203 /* The tail of the list. Used for tail insertions, which are
204 necessary to keep the set in topologically sorted order because
205 of how the set is built. */
206 value_set_node_t tail;
208 /* The length of the list. */
209 size_t length;
211 /* True if the set is indexed, which means it contains a backing
212 bitmap for quick determination of whether certain values exist in the
213 set. */
214 bool indexed;
216 /* The bitmap of values that exist in the set. May be NULL in an
217 empty or non-indexed set. */
218 bitmap values;
220 } *value_set_t;
223 /* An unordered bitmap set. One bitmap tracks values, the other,
224 expressions. */
225 typedef struct bitmap_set
227 bitmap expressions;
228 bitmap values;
229 } *bitmap_set_t;
231 /* Sets that we need to keep track of. */
232 typedef struct bb_value_sets
234 /* The EXP_GEN set, which represents expressions/values generated in
235 a basic block. */
236 value_set_t exp_gen;
238 /* The PHI_GEN set, which represents PHI results generated in a
239 basic block. */
240 bitmap_set_t phi_gen;
242 /* The TMP_GEN set, which represents results/temporaries generated
243 in a basic block. IE the LHS of an expression. */
244 bitmap_set_t tmp_gen;
246 /* The AVAIL_OUT set, which represents which values are available in
247 a given basic block. */
248 bitmap_set_t avail_out;
250 /* The ANTIC_IN set, which represents which values are anticiptable
251 in a given basic block. */
252 value_set_t antic_in;
254 /* The NEW_SETS set, which is used during insertion to augment the
255 AVAIL_OUT set of blocks with the new insertions performed during
256 the current iteration. */
257 bitmap_set_t new_sets;
258 } *bb_value_sets_t;
260 #define EXP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->exp_gen
261 #define PHI_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->phi_gen
262 #define TMP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->tmp_gen
263 #define AVAIL_OUT(BB) ((bb_value_sets_t) ((BB)->aux))->avail_out
264 #define ANTIC_IN(BB) ((bb_value_sets_t) ((BB)->aux))->antic_in
265 #define NEW_SETS(BB) ((bb_value_sets_t) ((BB)->aux))->new_sets
267 /* This structure is used to keep track of statistics on what
268 optimization PRE was able to perform. */
269 static struct
271 /* The number of RHS computations eliminated by PRE. */
272 int eliminations;
274 /* The number of new expressions/temporaries generated by PRE. */
275 int insertions;
277 /* The number of new PHI nodes added by PRE. */
278 int phis;
280 /* The number of values found constant. */
281 int constified;
283 } pre_stats;
286 static tree bitmap_find_leader (bitmap_set_t, tree);
287 static tree find_leader (value_set_t, tree);
288 static void value_insert_into_set (value_set_t, tree);
289 static void bitmap_value_insert_into_set (bitmap_set_t, tree);
290 static void bitmap_value_replace_in_set (bitmap_set_t, tree);
291 static void insert_into_set (value_set_t, tree);
292 static void bitmap_set_copy (bitmap_set_t, bitmap_set_t);
293 static bool bitmap_set_contains_value (bitmap_set_t, tree);
294 static bitmap_set_t bitmap_set_new (void);
295 static value_set_t set_new (bool);
296 static bool is_undefined_value (tree);
297 static tree create_expression_by_pieces (basic_block, tree, tree);
300 /* We can add and remove elements and entries to and from sets
301 and hash tables, so we use alloc pools for them. */
303 static alloc_pool value_set_pool;
304 static alloc_pool bitmap_set_pool;
305 static alloc_pool value_set_node_pool;
306 static alloc_pool binary_node_pool;
307 static alloc_pool unary_node_pool;
308 static alloc_pool reference_node_pool;
309 static alloc_pool comparison_node_pool;
310 static alloc_pool expression_node_pool;
311 static alloc_pool list_node_pool;
312 static bitmap_obstack grand_bitmap_obstack;
314 /* Set of blocks with statements that have had its EH information
315 cleaned up. */
316 static bitmap need_eh_cleanup;
318 /* The phi_translate_table caches phi translations for a given
319 expression and predecessor. */
321 static htab_t phi_translate_table;
323 /* A three tuple {e, pred, v} used to cache phi translations in the
324 phi_translate_table. */
326 typedef struct expr_pred_trans_d
328 /* The expression. */
329 tree e;
331 /* The predecessor block along which we translated the expression. */
332 basic_block pred;
334 /* The value that resulted from the translation. */
335 tree v;
337 /* The hashcode for the expression, pred pair. This is cached for
338 speed reasons. */
339 hashval_t hashcode;
340 } *expr_pred_trans_t;
342 /* Return the hash value for a phi translation table entry. */
344 static hashval_t
345 expr_pred_trans_hash (const void *p)
347 const expr_pred_trans_t ve = (expr_pred_trans_t) p;
348 return ve->hashcode;
351 /* Return true if two phi translation table entries are the same.
352 P1 and P2 should point to the expr_pred_trans_t's to be compared.*/
354 static int
355 expr_pred_trans_eq (const void *p1, const void *p2)
357 const expr_pred_trans_t ve1 = (expr_pred_trans_t) p1;
358 const expr_pred_trans_t ve2 = (expr_pred_trans_t) p2;
359 basic_block b1 = ve1->pred;
360 basic_block b2 = ve2->pred;
363 /* If they are not translations for the same basic block, they can't
364 be equal. */
365 if (b1 != b2)
366 return false;
368 /* If they are for the same basic block, determine if the
369 expressions are equal. */
370 if (expressions_equal_p (ve1->e, ve2->e))
371 return true;
373 return false;
376 /* Search in the phi translation table for the translation of
377 expression E in basic block PRED. Return the translated value, if
378 found, NULL otherwise. */
380 static inline tree
381 phi_trans_lookup (tree e, basic_block pred)
383 void **slot;
384 struct expr_pred_trans_d ept;
385 ept.e = e;
386 ept.pred = pred;
387 ept.hashcode = vn_compute (e, (unsigned long) pred, NULL);
388 slot = htab_find_slot_with_hash (phi_translate_table, &ept, ept.hashcode,
389 NO_INSERT);
390 if (!slot)
391 return NULL;
392 else
393 return ((expr_pred_trans_t) *slot)->v;
397 /* Add the tuple mapping from {expression E, basic block PRED} to
398 value V, to the phi translation table. */
400 static inline void
401 phi_trans_add (tree e, tree v, basic_block pred)
403 void **slot;
404 expr_pred_trans_t new_pair = xmalloc (sizeof (*new_pair));
405 new_pair->e = e;
406 new_pair->pred = pred;
407 new_pair->v = v;
408 new_pair->hashcode = vn_compute (e, (unsigned long) pred, NULL);
409 slot = htab_find_slot_with_hash (phi_translate_table, new_pair,
410 new_pair->hashcode, INSERT);
411 if (*slot)
412 free (*slot);
413 *slot = (void *) new_pair;
417 /* Add expression E to the expression set of value V. */
419 void
420 add_to_value (tree v, tree e)
422 /* Constants have no expression sets. */
423 if (is_gimple_min_invariant (v))
424 return;
426 if (VALUE_HANDLE_EXPR_SET (v) == NULL)
427 VALUE_HANDLE_EXPR_SET (v) = set_new (false);
429 insert_into_set (VALUE_HANDLE_EXPR_SET (v), e);
433 /* Return true if value V exists in the bitmap for SET. */
435 static inline bool
436 value_exists_in_set_bitmap (value_set_t set, tree v)
438 if (!set->values)
439 return false;
441 return bitmap_bit_p (set->values, VALUE_HANDLE_ID (v));
445 /* Remove value V from the bitmap for SET. */
447 static void
448 value_remove_from_set_bitmap (value_set_t set, tree v)
450 gcc_assert (set->indexed);
452 if (!set->values)
453 return;
455 bitmap_clear_bit (set->values, VALUE_HANDLE_ID (v));
459 /* Insert the value number V into the bitmap of values existing in
460 SET. */
462 static inline void
463 value_insert_into_set_bitmap (value_set_t set, tree v)
465 gcc_assert (set->indexed);
467 if (set->values == NULL)
468 set->values = BITMAP_ALLOC (&grand_bitmap_obstack);
470 bitmap_set_bit (set->values, VALUE_HANDLE_ID (v));
474 /* Create a new bitmap set and return it. */
476 static bitmap_set_t
477 bitmap_set_new (void)
479 bitmap_set_t ret = pool_alloc (bitmap_set_pool);
480 ret->expressions = BITMAP_ALLOC (&grand_bitmap_obstack);
481 ret->values = BITMAP_ALLOC (&grand_bitmap_obstack);
482 return ret;
485 /* Create a new set. */
487 static value_set_t
488 set_new (bool indexed)
490 value_set_t ret;
491 ret = pool_alloc (value_set_pool);
492 ret->head = ret->tail = NULL;
493 ret->length = 0;
494 ret->indexed = indexed;
495 ret->values = NULL;
496 return ret;
499 /* Insert an expression EXPR into a bitmapped set. */
501 static void
502 bitmap_insert_into_set (bitmap_set_t set, tree expr)
504 tree val;
505 /* XXX: For now, we only let SSA_NAMES into the bitmap sets. */
506 gcc_assert (TREE_CODE (expr) == SSA_NAME);
507 val = get_value_handle (expr);
509 gcc_assert (val);
510 if (!is_gimple_min_invariant (val))
512 bitmap_set_bit (set->values, VALUE_HANDLE_ID (val));
513 bitmap_set_bit (set->expressions, SSA_NAME_VERSION (expr));
517 /* Insert EXPR into SET. */
519 static void
520 insert_into_set (value_set_t set, tree expr)
522 value_set_node_t newnode = pool_alloc (value_set_node_pool);
523 tree val = get_value_handle (expr);
524 gcc_assert (val);
526 if (is_gimple_min_invariant (val))
527 return;
529 /* For indexed sets, insert the value into the set value bitmap.
530 For all sets, add it to the linked list and increment the list
531 length. */
532 if (set->indexed)
533 value_insert_into_set_bitmap (set, val);
535 newnode->next = NULL;
536 newnode->expr = expr;
537 set->length ++;
538 if (set->head == NULL)
540 set->head = set->tail = newnode;
542 else
544 set->tail->next = newnode;
545 set->tail = newnode;
549 /* Copy a bitmapped set ORIG, into bitmapped set DEST. */
551 static void
552 bitmap_set_copy (bitmap_set_t dest, bitmap_set_t orig)
554 bitmap_copy (dest->expressions, orig->expressions);
555 bitmap_copy (dest->values, orig->values);
558 /* Copy the set ORIG to the set DEST. */
560 static void
561 set_copy (value_set_t dest, value_set_t orig)
563 value_set_node_t node;
565 if (!orig || !orig->head)
566 return;
568 for (node = orig->head;
569 node;
570 node = node->next)
572 insert_into_set (dest, node->expr);
576 /* Remove EXPR from SET. */
578 static void
579 set_remove (value_set_t set, tree expr)
581 value_set_node_t node, prev;
583 /* Remove the value of EXPR from the bitmap, decrement the set
584 length, and remove it from the actual double linked list. */
585 value_remove_from_set_bitmap (set, get_value_handle (expr));
586 set->length--;
587 prev = NULL;
588 for (node = set->head;
589 node != NULL;
590 prev = node, node = node->next)
592 if (node->expr == expr)
594 if (prev == NULL)
595 set->head = node->next;
596 else
597 prev->next= node->next;
599 if (node == set->tail)
600 set->tail = prev;
601 pool_free (value_set_node_pool, node);
602 return;
607 /* Return true if SET contains the value VAL. */
609 static bool
610 set_contains_value (value_set_t set, tree val)
612 /* All constants are in every set. */
613 if (is_gimple_min_invariant (val))
614 return true;
616 if (set->length == 0)
617 return false;
619 return value_exists_in_set_bitmap (set, val);
622 /* Return true if bitmapped set SET contains the expression EXPR. */
623 static bool
624 bitmap_set_contains (bitmap_set_t set, tree expr)
626 /* All constants are in every set. */
627 if (is_gimple_min_invariant (get_value_handle (expr)))
628 return true;
630 /* XXX: Bitmapped sets only contain SSA_NAME's for now. */
631 if (TREE_CODE (expr) != SSA_NAME)
632 return false;
633 return bitmap_bit_p (set->expressions, SSA_NAME_VERSION (expr));
637 /* Return true if bitmapped set SET contains the value VAL. */
639 static bool
640 bitmap_set_contains_value (bitmap_set_t set, tree val)
642 if (is_gimple_min_invariant (val))
643 return true;
644 return bitmap_bit_p (set->values, VALUE_HANDLE_ID (val));
647 /* Replace an instance of value LOOKFOR with expression EXPR in SET. */
649 static void
650 bitmap_set_replace_value (bitmap_set_t set, tree lookfor, tree expr)
652 value_set_t exprset;
653 value_set_node_t node;
654 if (is_gimple_min_invariant (lookfor))
655 return;
656 if (!bitmap_set_contains_value (set, lookfor))
657 return;
659 /* The number of expressions having a given value is usually
660 significantly less than the total number of expressions in SET.
661 Thus, rather than check, for each expression in SET, whether it
662 has the value LOOKFOR, we walk the reverse mapping that tells us
663 what expressions have a given value, and see if any of those
664 expressions are in our set. For large testcases, this is about
665 5-10x faster than walking the bitmap. If this is somehow a
666 significant lose for some cases, we can choose which set to walk
667 based on the set size. */
668 exprset = VALUE_HANDLE_EXPR_SET (lookfor);
669 for (node = exprset->head; node; node = node->next)
671 if (TREE_CODE (node->expr) == SSA_NAME)
673 if (bitmap_bit_p (set->expressions, SSA_NAME_VERSION (node->expr)))
675 bitmap_clear_bit (set->expressions, SSA_NAME_VERSION (node->expr));
676 bitmap_set_bit (set->expressions, SSA_NAME_VERSION (expr));
677 return;
683 /* Subtract bitmapped set B from value set A, and return the new set. */
685 static value_set_t
686 bitmap_set_subtract_from_value_set (value_set_t a, bitmap_set_t b,
687 bool indexed)
689 value_set_t ret = set_new (indexed);
690 value_set_node_t node;
691 for (node = a->head;
692 node;
693 node = node->next)
695 if (!bitmap_set_contains (b, node->expr))
696 insert_into_set (ret, node->expr);
698 return ret;
701 /* Return true if two sets are equal. */
703 static bool
704 set_equal (value_set_t a, value_set_t b)
706 value_set_node_t node;
708 if (a->length != b->length)
709 return false;
710 for (node = a->head;
711 node;
712 node = node->next)
714 if (!set_contains_value (b, get_value_handle (node->expr)))
715 return false;
717 return true;
720 /* Replace an instance of EXPR's VALUE with EXPR in SET if it exists,
721 and add it otherwise. */
723 static void
724 bitmap_value_replace_in_set (bitmap_set_t set, tree expr)
726 tree val = get_value_handle (expr);
727 if (bitmap_set_contains_value (set, val))
728 bitmap_set_replace_value (set, val, expr);
729 else
730 bitmap_insert_into_set (set, expr);
733 /* Insert EXPR into SET if EXPR's value is not already present in
734 SET. */
736 static void
737 bitmap_value_insert_into_set (bitmap_set_t set, tree expr)
739 tree val = get_value_handle (expr);
741 if (is_gimple_min_invariant (val))
742 return;
744 if (!bitmap_set_contains_value (set, val))
745 bitmap_insert_into_set (set, expr);
748 /* Insert the value for EXPR into SET, if it doesn't exist already. */
750 static void
751 value_insert_into_set (value_set_t set, tree expr)
753 tree val = get_value_handle (expr);
755 /* Constant and invariant values exist everywhere, and thus,
756 actually keeping them in the sets is pointless. */
757 if (is_gimple_min_invariant (val))
758 return;
760 if (!set_contains_value (set, val))
761 insert_into_set (set, expr);
765 /* Print out SET to OUTFILE. */
767 static void
768 bitmap_print_value_set (FILE *outfile, bitmap_set_t set,
769 const char *setname, int blockindex)
771 fprintf (outfile, "%s[%d] := { ", setname, blockindex);
772 if (set)
774 bool first = true;
775 unsigned i;
776 bitmap_iterator bi;
778 EXECUTE_IF_SET_IN_BITMAP (set->expressions, 0, i, bi)
780 if (!first)
781 fprintf (outfile, ", ");
782 first = false;
783 print_generic_expr (outfile, ssa_name (i), 0);
785 fprintf (outfile, " (");
786 print_generic_expr (outfile, get_value_handle (ssa_name (i)), 0);
787 fprintf (outfile, ") ");
790 fprintf (outfile, " }\n");
792 /* Print out the value_set SET to OUTFILE. */
794 static void
795 print_value_set (FILE *outfile, value_set_t set,
796 const char *setname, int blockindex)
798 value_set_node_t node;
799 fprintf (outfile, "%s[%d] := { ", setname, blockindex);
800 if (set)
802 for (node = set->head;
803 node;
804 node = node->next)
806 print_generic_expr (outfile, node->expr, 0);
808 fprintf (outfile, " (");
809 print_generic_expr (outfile, get_value_handle (node->expr), 0);
810 fprintf (outfile, ") ");
812 if (node->next)
813 fprintf (outfile, ", ");
817 fprintf (outfile, " }\n");
820 /* Print out the expressions that have VAL to OUTFILE. */
822 void
823 print_value_expressions (FILE *outfile, tree val)
825 if (VALUE_HANDLE_EXPR_SET (val))
827 char s[10];
828 sprintf (s, "VH.%04d", VALUE_HANDLE_ID (val));
829 print_value_set (outfile, VALUE_HANDLE_EXPR_SET (val), s, 0);
834 void
835 debug_value_expressions (tree val)
837 print_value_expressions (stderr, val);
841 void debug_value_set (value_set_t, const char *, int);
843 void
844 debug_value_set (value_set_t set, const char *setname, int blockindex)
846 print_value_set (stderr, set, setname, blockindex);
849 /* Return the folded version of T if T, when folded, is a gimple
850 min_invariant. Otherwise, return T. */
852 static tree
853 fully_constant_expression (tree t)
855 tree folded;
856 folded = fold (t);
857 if (folded && is_gimple_min_invariant (folded))
858 return folded;
859 return t;
862 /* Return a copy of a chain of nodes, chained through the TREE_CHAIN field.
863 For example, this can copy a list made of TREE_LIST nodes.
864 Allocates the nodes in list_node_pool*/
866 static tree
867 pool_copy_list (tree list)
869 tree head;
870 tree prev, next;
872 if (list == 0)
873 return 0;
874 head = pool_alloc (list_node_pool);
876 memcpy (head, list, tree_size (list));
877 prev = head;
879 next = TREE_CHAIN (list);
880 while (next)
882 TREE_CHAIN (prev) = pool_alloc (list_node_pool);
883 memcpy (TREE_CHAIN (prev), next, tree_size (next));
884 prev = TREE_CHAIN (prev);
885 next = TREE_CHAIN (next);
887 return head;
891 /* Translate EXPR using phis in PHIBLOCK, so that it has the values of
892 the phis in PRED. Return NULL if we can't find a leader for each
893 part of the translated expression. */
895 static tree
896 phi_translate (tree expr, value_set_t set, basic_block pred,
897 basic_block phiblock)
899 tree phitrans = NULL;
900 tree oldexpr = expr;
902 if (expr == NULL)
903 return NULL;
905 if (is_gimple_min_invariant (expr))
906 return expr;
908 /* Phi translations of a given expression don't change. */
909 phitrans = phi_trans_lookup (expr, pred);
910 if (phitrans)
911 return phitrans;
913 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
915 case tcc_expression:
917 if (TREE_CODE (expr) != CALL_EXPR)
918 return NULL;
919 else
921 tree oldop0 = TREE_OPERAND (expr, 0);
922 tree oldarglist = TREE_OPERAND (expr, 1);
923 tree oldop2 = TREE_OPERAND (expr, 2);
924 tree newop0;
925 tree newarglist;
926 tree newop2 = NULL;
927 tree oldwalker;
928 tree newwalker;
929 tree newexpr;
930 bool listchanged = false;
932 /* Call expressions are kind of weird because they have an
933 argument list. We don't want to value number the list
934 as one value number, because that doesn't make much
935 sense, and just breaks the support functions we call,
936 which expect TREE_OPERAND (call_expr, 2) to be a
937 TREE_LIST. */
939 newop0 = phi_translate (find_leader (set, oldop0),
940 set, pred, phiblock);
941 if (newop0 == NULL)
942 return NULL;
943 if (oldop2)
945 newop2 = phi_translate (find_leader (set, oldop2),
946 set, pred, phiblock);
947 if (newop2 == NULL)
948 return NULL;
951 /* phi translate the argument list piece by piece.
953 We could actually build the list piece by piece here,
954 but it's likely to not be worth the memory we will save,
955 unless you have millions of call arguments. */
957 newarglist = pool_copy_list (oldarglist);
958 for (oldwalker = oldarglist, newwalker = newarglist;
959 oldwalker && newwalker;
960 oldwalker = TREE_CHAIN (oldwalker),
961 newwalker = TREE_CHAIN (newwalker))
964 tree oldval = TREE_VALUE (oldwalker);
965 tree newval;
966 if (oldval)
968 newval = phi_translate (find_leader (set, oldval),
969 set, pred, phiblock);
970 if (newval == NULL)
971 return NULL;
972 if (newval != oldval)
974 listchanged = true;
975 TREE_VALUE (newwalker) = get_value_handle (newval);
979 if (listchanged)
980 vn_lookup_or_add (newarglist, NULL);
982 if (listchanged || (newop0 != oldop0) || (oldop2 != newop2))
984 newexpr = pool_alloc (expression_node_pool);
985 memcpy (newexpr, expr, tree_size (expr));
986 TREE_OPERAND (newexpr, 0) = newop0 == oldop0 ? oldop0 : get_value_handle (newop0);
987 TREE_OPERAND (newexpr, 1) = listchanged ? newarglist : oldarglist;
988 TREE_OPERAND (newexpr, 2) = newop2 == oldop2 ? oldop2 : get_value_handle (newop2);
989 create_tree_ann (newexpr);
990 vn_lookup_or_add (newexpr, NULL);
991 expr = newexpr;
992 phi_trans_add (oldexpr, newexpr, pred);
996 return expr;
998 case tcc_reference:
999 /* XXX: Until we have PRE of loads working, none will be ANTIC. */
1000 return NULL;
1002 case tcc_binary:
1003 case tcc_comparison:
1005 tree oldop1 = TREE_OPERAND (expr, 0);
1006 tree oldop2 = TREE_OPERAND (expr, 1);
1007 tree newop1;
1008 tree newop2;
1009 tree newexpr;
1011 newop1 = phi_translate (find_leader (set, oldop1),
1012 set, pred, phiblock);
1013 if (newop1 == NULL)
1014 return NULL;
1015 newop2 = phi_translate (find_leader (set, oldop2),
1016 set, pred, phiblock);
1017 if (newop2 == NULL)
1018 return NULL;
1019 if (newop1 != oldop1 || newop2 != oldop2)
1021 tree t;
1022 newexpr = pool_alloc (binary_node_pool);
1023 memcpy (newexpr, expr, tree_size (expr));
1024 TREE_OPERAND (newexpr, 0) = newop1 == oldop1 ? oldop1 : get_value_handle (newop1);
1025 TREE_OPERAND (newexpr, 1) = newop2 == oldop2 ? oldop2 : get_value_handle (newop2);
1026 t = fully_constant_expression (newexpr);
1027 if (t != newexpr)
1029 pool_free (binary_node_pool, newexpr);
1030 newexpr = t;
1032 else
1034 create_tree_ann (newexpr);
1035 vn_lookup_or_add (newexpr, NULL);
1037 expr = newexpr;
1038 phi_trans_add (oldexpr, newexpr, pred);
1041 return expr;
1043 case tcc_unary:
1045 tree oldop1 = TREE_OPERAND (expr, 0);
1046 tree newop1;
1047 tree newexpr;
1049 newop1 = phi_translate (find_leader (set, oldop1),
1050 set, pred, phiblock);
1051 if (newop1 == NULL)
1052 return NULL;
1053 if (newop1 != oldop1)
1055 tree t;
1056 newexpr = pool_alloc (unary_node_pool);
1057 memcpy (newexpr, expr, tree_size (expr));
1058 TREE_OPERAND (newexpr, 0) = get_value_handle (newop1);
1059 t = fully_constant_expression (newexpr);
1060 if (t != newexpr)
1062 pool_free (unary_node_pool, newexpr);
1063 newexpr = t;
1065 else
1067 create_tree_ann (newexpr);
1068 vn_lookup_or_add (newexpr, NULL);
1070 expr = newexpr;
1071 phi_trans_add (oldexpr, newexpr, pred);
1074 return expr;
1076 case tcc_exceptional:
1078 tree phi = NULL;
1079 edge e;
1080 gcc_assert (TREE_CODE (expr) == SSA_NAME);
1081 if (TREE_CODE (SSA_NAME_DEF_STMT (expr)) == PHI_NODE)
1082 phi = SSA_NAME_DEF_STMT (expr);
1083 else
1084 return expr;
1086 e = find_edge (pred, bb_for_stmt (phi));
1087 if (e)
1089 if (is_undefined_value (PHI_ARG_DEF (phi, e->dest_idx)))
1090 return NULL;
1091 vn_lookup_or_add (PHI_ARG_DEF (phi, e->dest_idx), NULL);
1092 return PHI_ARG_DEF (phi, e->dest_idx);
1095 return expr;
1097 default:
1098 gcc_unreachable ();
1102 /* For each expression in SET, translate the value handles through phi nodes
1103 in PHIBLOCK using edge PHIBLOCK->PRED, and store the resulting
1104 expressions in DEST. */
1106 static void
1107 phi_translate_set (value_set_t dest, value_set_t set, basic_block pred,
1108 basic_block phiblock)
1110 value_set_node_t node;
1111 for (node = set->head;
1112 node;
1113 node = node->next)
1115 tree translated;
1116 translated = phi_translate (node->expr, set, pred, phiblock);
1117 phi_trans_add (node->expr, translated, pred);
1119 if (translated != NULL)
1120 value_insert_into_set (dest, translated);
1124 /* Find the leader for a value (i.e., the name representing that
1125 value) in a given set, and return it. Return NULL if no leader is
1126 found. */
1128 static tree
1129 bitmap_find_leader (bitmap_set_t set, tree val)
1131 if (val == NULL)
1132 return NULL;
1134 if (is_gimple_min_invariant (val))
1135 return val;
1136 if (bitmap_set_contains_value (set, val))
1138 /* Rather than walk the entire bitmap of expressions, and see
1139 whether any of them has the value we are looking for, we look
1140 at the reverse mapping, which tells us the set of expressions
1141 that have a given value (IE value->expressions with that
1142 value) and see if any of those expressions are in our set.
1143 The number of expressions per value is usually significantly
1144 less than the number of expressions in the set. In fact, for
1145 large testcases, doing it this way is roughly 5-10x faster
1146 than walking the bitmap.
1147 If this is somehow a significant lose for some cases, we can
1148 choose which set to walk based on which set is smaller. */
1149 value_set_t exprset;
1150 value_set_node_t node;
1151 exprset = VALUE_HANDLE_EXPR_SET (val);
1152 for (node = exprset->head; node; node = node->next)
1154 if (TREE_CODE (node->expr) == SSA_NAME)
1156 if (bitmap_bit_p (set->expressions,
1157 SSA_NAME_VERSION (node->expr)))
1158 return node->expr;
1162 return NULL;
1166 /* Find the leader for a value (i.e., the name representing that
1167 value) in a given set, and return it. Return NULL if no leader is
1168 found. */
1170 static tree
1171 find_leader (value_set_t set, tree val)
1173 value_set_node_t node;
1175 if (val == NULL)
1176 return NULL;
1178 /* Constants represent themselves. */
1179 if (is_gimple_min_invariant (val))
1180 return val;
1182 if (set->length == 0)
1183 return NULL;
1185 if (value_exists_in_set_bitmap (set, val))
1187 for (node = set->head;
1188 node;
1189 node = node->next)
1191 if (get_value_handle (node->expr) == val)
1192 return node->expr;
1196 return NULL;
1199 /* Determine if the expression EXPR is valid in SET. This means that
1200 we have a leader for each part of the expression (if it consists of
1201 values), or the expression is an SSA_NAME.
1203 NB: We never should run into a case where we have SSA_NAME +
1204 SSA_NAME or SSA_NAME + value. The sets valid_in_set is called on,
1205 the ANTIC sets, will only ever have SSA_NAME's or value expressions
1206 (IE VALUE1 + VALUE2, *VALUE1, VALUE1 < VALUE2) */
1208 static bool
1209 valid_in_set (value_set_t set, tree expr)
1211 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
1213 case tcc_binary:
1214 case tcc_comparison:
1216 tree op1 = TREE_OPERAND (expr, 0);
1217 tree op2 = TREE_OPERAND (expr, 1);
1218 return set_contains_value (set, op1) && set_contains_value (set, op2);
1221 case tcc_unary:
1223 tree op1 = TREE_OPERAND (expr, 0);
1224 return set_contains_value (set, op1);
1227 case tcc_expression:
1229 if (TREE_CODE (expr) == CALL_EXPR)
1231 tree op0 = TREE_OPERAND (expr, 0);
1232 tree arglist = TREE_OPERAND (expr, 1);
1233 tree op2 = TREE_OPERAND (expr, 2);
1235 /* Check the non-list operands first. */
1236 if (!set_contains_value (set, op0)
1237 || (op2 && !set_contains_value (set, op2)))
1238 return false;
1240 /* Now check the operands. */
1241 for (; arglist; arglist = TREE_CHAIN (arglist))
1243 if (!set_contains_value (set, TREE_VALUE (arglist)))
1244 return false;
1246 return true;
1248 return false;
1251 case tcc_reference:
1252 /* XXX: Until PRE of loads works, no reference nodes are ANTIC. */
1253 return false;
1255 case tcc_exceptional:
1256 gcc_assert (TREE_CODE (expr) == SSA_NAME);
1257 return true;
1259 case tcc_declaration:
1260 /* VAR_DECL and PARM_DECL are never anticipatable. */
1261 return false;
1263 default:
1264 /* No other cases should be encountered. */
1265 gcc_unreachable ();
1269 /* Clean the set of expressions that are no longer valid in SET. This
1270 means expressions that are made up of values we have no leaders for
1271 in SET. */
1273 static void
1274 clean (value_set_t set)
1276 value_set_node_t node;
1277 value_set_node_t next;
1278 node = set->head;
1279 while (node)
1281 next = node->next;
1282 if (!valid_in_set (set, node->expr))
1283 set_remove (set, node->expr);
1284 node = next;
1288 DEF_VEC_P (basic_block);
1289 DEF_VEC_ALLOC_P (basic_block, heap);
1290 static sbitmap has_abnormal_preds;
1292 /* Compute the ANTIC set for BLOCK.
1294 If succs(BLOCK) > 1 then
1295 ANTIC_OUT[BLOCK] = intersection of ANTIC_IN[b] for all succ(BLOCK)
1296 else if succs(BLOCK) == 1 then
1297 ANTIC_OUT[BLOCK] = phi_translate (ANTIC_IN[succ(BLOCK)])
1299 ANTIC_IN[BLOCK] = clean(ANTIC_OUT[BLOCK] U EXP_GEN[BLOCK] - TMP_GEN[BLOCK])
1301 XXX: It would be nice to either write a set_clear, and use it for
1302 ANTIC_OUT, or to mark the antic_out set as deleted at the end
1303 of this routine, so that the pool can hand the same memory back out
1304 again for the next ANTIC_OUT. */
1306 static bool
1307 compute_antic_aux (basic_block block, bool block_has_abnormal_pred_edge)
1309 basic_block son;
1310 bool changed = false;
1311 value_set_t S, old, ANTIC_OUT;
1312 value_set_node_t node;
1314 ANTIC_OUT = S = NULL;
1316 /* If any edges from predecessors are abnormal, antic_in is empty,
1317 so do nothing. */
1318 if (block_has_abnormal_pred_edge)
1319 goto maybe_dump_sets;
1321 old = set_new (false);
1322 set_copy (old, ANTIC_IN (block));
1323 ANTIC_OUT = set_new (true);
1325 /* If the block has no successors, ANTIC_OUT is empty. */
1326 if (EDGE_COUNT (block->succs) == 0)
1328 /* If we have one successor, we could have some phi nodes to
1329 translate through. */
1330 else if (single_succ_p (block))
1332 phi_translate_set (ANTIC_OUT, ANTIC_IN (single_succ (block)),
1333 block, single_succ (block));
1335 /* If we have multiple successors, we take the intersection of all of
1336 them. */
1337 else
1339 VEC(basic_block, heap) * worklist;
1340 edge e;
1341 size_t i;
1342 basic_block bprime, first;
1343 edge_iterator ei;
1345 worklist = VEC_alloc (basic_block, heap, EDGE_COUNT (block->succs));
1346 FOR_EACH_EDGE (e, ei, block->succs)
1347 VEC_quick_push (basic_block, worklist, e->dest);
1348 first = VEC_index (basic_block, worklist, 0);
1349 set_copy (ANTIC_OUT, ANTIC_IN (first));
1351 for (i = 1; VEC_iterate (basic_block, worklist, i, bprime); i++)
1353 node = ANTIC_OUT->head;
1354 while (node)
1356 tree val;
1357 value_set_node_t next = node->next;
1358 val = get_value_handle (node->expr);
1359 if (!set_contains_value (ANTIC_IN (bprime), val))
1360 set_remove (ANTIC_OUT, node->expr);
1361 node = next;
1364 VEC_free (basic_block, heap, worklist);
1367 /* Generate ANTIC_OUT - TMP_GEN. */
1368 S = bitmap_set_subtract_from_value_set (ANTIC_OUT, TMP_GEN (block), false);
1370 /* Start ANTIC_IN with EXP_GEN - TMP_GEN */
1371 ANTIC_IN (block) = bitmap_set_subtract_from_value_set (EXP_GEN (block),
1372 TMP_GEN (block),
1373 true);
1375 /* Then union in the ANTIC_OUT - TMP_GEN values,
1376 to get ANTIC_OUT U EXP_GEN - TMP_GEN */
1377 for (node = S->head; node; node = node->next)
1378 value_insert_into_set (ANTIC_IN (block), node->expr);
1380 clean (ANTIC_IN (block));
1381 if (!set_equal (old, ANTIC_IN (block)))
1382 changed = true;
1384 maybe_dump_sets:
1385 if (dump_file && (dump_flags & TDF_DETAILS))
1387 if (ANTIC_OUT)
1388 print_value_set (dump_file, ANTIC_OUT, "ANTIC_OUT", block->index);
1389 print_value_set (dump_file, ANTIC_IN (block), "ANTIC_IN", block->index);
1390 if (S)
1391 print_value_set (dump_file, S, "S", block->index);
1394 for (son = first_dom_son (CDI_POST_DOMINATORS, block);
1395 son;
1396 son = next_dom_son (CDI_POST_DOMINATORS, son))
1398 changed |= compute_antic_aux (son,
1399 TEST_BIT (has_abnormal_preds, son->index));
1401 return changed;
1404 /* Compute ANTIC sets. */
1406 static void
1407 compute_antic (void)
1409 bool changed = true;
1410 int num_iterations = 0;
1411 basic_block block;
1413 /* If any predecessor edges are abnormal, we punt, so antic_in is empty.
1414 We pre-build the map of blocks with incoming abnormal edges here. */
1415 has_abnormal_preds = sbitmap_alloc (last_basic_block);
1416 sbitmap_zero (has_abnormal_preds);
1417 FOR_EACH_BB (block)
1419 edge_iterator ei;
1420 edge e;
1422 FOR_EACH_EDGE (e, ei, block->preds)
1423 if (e->flags & EDGE_ABNORMAL)
1425 SET_BIT (has_abnormal_preds, block->index);
1426 break;
1429 /* While we are here, give empty ANTIC_IN sets to each block. */
1430 ANTIC_IN (block) = set_new (true);
1432 /* At the exit block we anticipate nothing. */
1433 ANTIC_IN (EXIT_BLOCK_PTR) = set_new (true);
1435 while (changed)
1437 num_iterations++;
1438 changed = false;
1439 changed = compute_antic_aux (EXIT_BLOCK_PTR, false);
1442 sbitmap_free (has_abnormal_preds);
1444 if (dump_file && (dump_flags & TDF_STATS))
1445 fprintf (dump_file, "compute_antic required %d iterations\n", num_iterations);
1448 static VEC(tree,heap) *inserted_exprs;
1449 /* Find a leader for an expression, or generate one using
1450 create_expression_by_pieces if it's ANTIC but
1451 complex.
1452 BLOCK is the basic_block we are looking for leaders in.
1453 EXPR is the expression to find a leader or generate for.
1454 STMTS is the statement list to put the inserted expressions on.
1455 Returns the SSA_NAME of the LHS of the generated expression or the
1456 leader. */
1458 static tree
1459 find_or_generate_expression (basic_block block, tree expr, tree stmts)
1461 tree genop = bitmap_find_leader (AVAIL_OUT (block), expr);
1463 /* If it's still NULL, it must be a complex expression, so generate
1464 it recursively. */
1465 if (genop == NULL)
1467 genop = VALUE_HANDLE_EXPR_SET (expr)->head->expr;
1468 gcc_assert (UNARY_CLASS_P (genop)
1469 || BINARY_CLASS_P (genop)
1470 || COMPARISON_CLASS_P (genop)
1471 || REFERENCE_CLASS_P (genop)
1472 || TREE_CODE (genop) == CALL_EXPR);
1473 genop = create_expression_by_pieces (block, genop, stmts);
1475 return genop;
1478 #define NECESSARY(stmt) stmt->common.asm_written_flag
1479 /* Create an expression in pieces, so that we can handle very complex
1480 expressions that may be ANTIC, but not necessary GIMPLE.
1481 BLOCK is the basic block the expression will be inserted into,
1482 EXPR is the expression to insert (in value form)
1483 STMTS is a statement list to append the necessary insertions into.
1485 This function will die if we hit some value that shouldn't be
1486 ANTIC but is (IE there is no leader for it, or its components).
1487 This function may also generate expressions that are themselves
1488 partially or fully redundant. Those that are will be either made
1489 fully redundant during the next iteration of insert (for partially
1490 redundant ones), or eliminated by eliminate (for fully redundant
1491 ones). */
1493 static tree
1494 create_expression_by_pieces (basic_block block, tree expr, tree stmts)
1496 tree temp, name;
1497 tree folded, forced_stmts, newexpr;
1498 tree v;
1499 tree_stmt_iterator tsi;
1501 switch (TREE_CODE_CLASS (TREE_CODE (expr)))
1503 case tcc_expression:
1505 tree op0, op2;
1506 tree arglist;
1507 tree genop0, genop2;
1508 tree genarglist;
1509 tree walker, genwalker;
1511 gcc_assert (TREE_CODE (expr) == CALL_EXPR);
1512 genop2 = NULL;
1514 op0 = TREE_OPERAND (expr, 0);
1515 arglist = TREE_OPERAND (expr, 1);
1516 op2 = TREE_OPERAND (expr, 2);
1518 genop0 = find_or_generate_expression (block, op0, stmts);
1519 genarglist = copy_list (arglist);
1520 for (walker = arglist, genwalker = genarglist;
1521 genwalker && walker;
1522 genwalker = TREE_CHAIN (genwalker), walker = TREE_CHAIN (walker))
1524 TREE_VALUE (genwalker) = find_or_generate_expression (block,
1525 TREE_VALUE (walker),
1526 stmts);
1529 if (op2)
1530 genop2 = find_or_generate_expression (block, op2, stmts);
1531 folded = fold (build (TREE_CODE (expr), TREE_TYPE (expr),
1532 genop0, genarglist, genop2));
1533 break;
1537 break;
1539 case tcc_binary:
1540 case tcc_comparison:
1542 tree op1 = TREE_OPERAND (expr, 0);
1543 tree op2 = TREE_OPERAND (expr, 1);
1544 tree genop1 = find_or_generate_expression (block, op1, stmts);
1545 tree genop2 = find_or_generate_expression (block, op2, stmts);
1546 folded = fold (build (TREE_CODE (expr), TREE_TYPE (expr),
1547 genop1, genop2));
1548 break;
1551 case tcc_unary:
1553 tree op1 = TREE_OPERAND (expr, 0);
1554 tree genop1 = find_or_generate_expression (block, op1, stmts);
1555 folded = fold (build (TREE_CODE (expr), TREE_TYPE (expr),
1556 genop1));
1557 break;
1560 default:
1561 gcc_unreachable ();
1564 /* Force the generated expression to be a sequence of GIMPLE
1565 statements.
1566 We have to call unshare_expr because force_gimple_operand may
1567 modify the tree we pass to it. */
1568 newexpr = force_gimple_operand (unshare_expr (folded), &forced_stmts,
1569 false, NULL);
1571 /* If we have any intermediate expressions to the value sets, add them
1572 to the value sets and chain them on in the instruction stream. */
1573 if (forced_stmts)
1575 tsi = tsi_start (forced_stmts);
1576 for (; !tsi_end_p (tsi); tsi_next (&tsi))
1578 tree stmt = tsi_stmt (tsi);
1579 tree forcedname = TREE_OPERAND (stmt, 0);
1580 tree forcedexpr = TREE_OPERAND (stmt, 1);
1581 tree val = vn_lookup_or_add (forcedexpr, NULL);
1583 VEC_safe_push (tree, heap, inserted_exprs, stmt);
1584 vn_add (forcedname, val, NULL);
1585 bitmap_value_replace_in_set (NEW_SETS (block), forcedname);
1586 bitmap_value_replace_in_set (AVAIL_OUT (block), forcedname);
1588 tsi = tsi_last (stmts);
1589 tsi_link_after (&tsi, forced_stmts, TSI_CONTINUE_LINKING);
1592 /* Build and insert the assignment of the end result to the temporary
1593 that we will return. */
1594 temp = create_tmp_var (TREE_TYPE (expr), "pretmp");
1595 add_referenced_tmp_var (temp);
1596 newexpr = build (MODIFY_EXPR, TREE_TYPE (expr), temp, newexpr);
1597 name = make_ssa_name (temp, newexpr);
1598 TREE_OPERAND (newexpr, 0) = name;
1599 NECESSARY (newexpr) = 0;
1600 tsi = tsi_last (stmts);
1601 tsi_link_after (&tsi, newexpr, TSI_CONTINUE_LINKING);
1602 VEC_safe_push (tree, heap, inserted_exprs, newexpr);
1604 /* Add a value handle to the temporary.
1605 The value may already exist in either NEW_SETS, or AVAIL_OUT, because
1606 we are creating the expression by pieces, and this particular piece of
1607 the expression may have been represented. There is no harm in replacing
1608 here. */
1609 v = get_value_handle (expr);
1610 vn_add (name, v, NULL);
1611 bitmap_value_replace_in_set (NEW_SETS (block), name);
1612 bitmap_value_replace_in_set (AVAIL_OUT (block), name);
1614 pre_stats.insertions++;
1615 if (dump_file && (dump_flags & TDF_DETAILS))
1617 fprintf (dump_file, "Inserted ");
1618 print_generic_expr (dump_file, newexpr, 0);
1619 fprintf (dump_file, " in predecessor %d\n", block->index);
1622 return name;
1625 /* Insert the to-be-made-available values of NODE for each predecessor, stored
1626 in AVAIL, into the predecessors of BLOCK, and merge the result with a phi
1627 node, given the same value handle as NODE. The prefix of the phi node is
1628 given with TMPNAME. Return true if we have inserted new stuff. */
1630 static bool
1631 insert_into_preds_of_block (basic_block block, value_set_node_t node,
1632 tree *avail, const char *tmpname)
1634 tree val = get_value_handle (node->expr);
1635 edge pred;
1636 bool insertions = false;
1637 bool nophi = false;
1638 basic_block bprime;
1639 tree eprime;
1640 edge_iterator ei;
1641 tree type = TREE_TYPE (avail[EDGE_PRED (block, 0)->src->index]);
1642 tree temp;
1644 if (dump_file && (dump_flags & TDF_DETAILS))
1646 fprintf (dump_file, "Found partial redundancy for expression ");
1647 print_generic_expr (dump_file, node->expr, 0);
1648 fprintf (dump_file, "\n");
1651 /* Make sure we aren't creating an induction variable. */
1652 if (block->loop_depth > 0 && EDGE_COUNT (block->preds) == 2)
1654 bool firstinsideloop = false;
1655 bool secondinsideloop = false;
1656 firstinsideloop = flow_bb_inside_loop_p (block->loop_father,
1657 EDGE_PRED (block, 0)->src);
1658 secondinsideloop = flow_bb_inside_loop_p (block->loop_father,
1659 EDGE_PRED (block, 1)->src);
1660 /* Induction variables only have one edge inside the loop. */
1661 if (firstinsideloop ^ secondinsideloop)
1663 if (dump_file && (dump_flags & TDF_DETAILS))
1664 fprintf (dump_file, "Skipping insertion of phi for partial redundancy: Looks like an induction variable\n");
1665 nophi = true;
1670 /* Make the necessary insertions. */
1671 FOR_EACH_EDGE (pred, ei, block->preds)
1673 tree stmts = alloc_stmt_list ();
1674 tree builtexpr;
1675 bprime = pred->src;
1676 eprime = avail[bprime->index];
1677 if (BINARY_CLASS_P (eprime)
1678 || COMPARISON_CLASS_P (eprime)
1679 || UNARY_CLASS_P (eprime)
1680 || TREE_CODE (eprime) == CALL_EXPR)
1682 builtexpr = create_expression_by_pieces (bprime,
1683 eprime,
1684 stmts);
1685 bsi_insert_on_edge (pred, stmts);
1686 avail[bprime->index] = builtexpr;
1687 insertions = true;
1690 /* If we didn't want a phi node, and we made insertions, we still have
1691 inserted new stuff, and thus return true. If we didn't want a phi node,
1692 and didn't make insertions, we haven't added anything new, so return
1693 false. */
1694 if (nophi && insertions)
1695 return true;
1696 else if (nophi && !insertions)
1697 return false;
1699 /* Now build a phi for the new variable. */
1700 temp = create_tmp_var (type, tmpname);
1701 add_referenced_tmp_var (temp);
1702 temp = create_phi_node (temp, block);
1703 NECESSARY (temp) = 0;
1704 VEC_safe_push (tree, heap, inserted_exprs, temp);
1705 FOR_EACH_EDGE (pred, ei, block->preds)
1706 add_phi_arg (temp, avail[pred->src->index], pred);
1708 vn_add (PHI_RESULT (temp), val, NULL);
1710 /* The value should *not* exist in PHI_GEN, or else we wouldn't be doing
1711 this insertion, since we test for the existence of this value in PHI_GEN
1712 before proceeding with the partial redundancy checks in insert_aux.
1714 The value may exist in AVAIL_OUT, in particular, it could be represented
1715 by the expression we are trying to eliminate, in which case we want the
1716 replacement to occur. If it's not existing in AVAIL_OUT, we want it
1717 inserted there.
1719 Similarly, to the PHI_GEN case, the value should not exist in NEW_SETS of
1720 this block, because if it did, it would have existed in our dominator's
1721 AVAIL_OUT, and would have been skipped due to the full redundancy check.
1724 bitmap_insert_into_set (PHI_GEN (block),
1725 PHI_RESULT (temp));
1726 bitmap_value_replace_in_set (AVAIL_OUT (block),
1727 PHI_RESULT (temp));
1728 bitmap_insert_into_set (NEW_SETS (block),
1729 PHI_RESULT (temp));
1731 if (dump_file && (dump_flags & TDF_DETAILS))
1733 fprintf (dump_file, "Created phi ");
1734 print_generic_expr (dump_file, temp, 0);
1735 fprintf (dump_file, " in block %d\n", block->index);
1737 pre_stats.phis++;
1738 return true;
1743 /* Perform insertion of partially redundant values.
1744 For BLOCK, do the following:
1745 1. Propagate the NEW_SETS of the dominator into the current block.
1746 If the block has multiple predecessors,
1747 2a. Iterate over the ANTIC expressions for the block to see if
1748 any of them are partially redundant.
1749 2b. If so, insert them into the necessary predecessors to make
1750 the expression fully redundant.
1751 2c. Insert a new PHI merging the values of the predecessors.
1752 2d. Insert the new PHI, and the new expressions, into the
1753 NEW_SETS set.
1754 3. Recursively call ourselves on the dominator children of BLOCK.
1758 static bool
1759 insert_aux (basic_block block)
1761 basic_block son;
1762 bool new_stuff = false;
1764 if (block)
1766 basic_block dom;
1767 dom = get_immediate_dominator (CDI_DOMINATORS, block);
1768 if (dom)
1770 unsigned i;
1771 bitmap_iterator bi;
1772 bitmap_set_t newset = NEW_SETS (dom);
1773 if (newset)
1775 /* Note that we need to value_replace both NEW_SETS, and
1776 AVAIL_OUT. For both the case of NEW_SETS, the value may be
1777 represented by some non-simple expression here that we want
1778 to replace it with. */
1779 EXECUTE_IF_SET_IN_BITMAP (newset->expressions, 0, i, bi)
1781 bitmap_value_replace_in_set (NEW_SETS (block), ssa_name (i));
1782 bitmap_value_replace_in_set (AVAIL_OUT (block), ssa_name (i));
1785 if (!single_pred_p (block))
1787 value_set_node_t node;
1788 for (node = ANTIC_IN (block)->head;
1789 node;
1790 node = node->next)
1792 if (BINARY_CLASS_P (node->expr)
1793 || COMPARISON_CLASS_P (node->expr)
1794 || UNARY_CLASS_P (node->expr)
1795 || TREE_CODE (node->expr) == CALL_EXPR)
1797 tree *avail;
1798 tree val;
1799 bool by_some = false;
1800 bool cant_insert = false;
1801 bool all_same = true;
1802 tree first_s = NULL;
1803 edge pred;
1804 basic_block bprime;
1805 tree eprime = NULL_TREE;
1806 edge_iterator ei;
1808 val = get_value_handle (node->expr);
1809 if (bitmap_set_contains_value (PHI_GEN (block), val))
1810 continue;
1811 if (bitmap_set_contains_value (AVAIL_OUT (dom), val))
1813 if (dump_file && (dump_flags & TDF_DETAILS))
1814 fprintf (dump_file, "Found fully redundant value\n");
1815 continue;
1818 avail = xcalloc (last_basic_block, sizeof (tree));
1819 FOR_EACH_EDGE (pred, ei, block->preds)
1821 tree vprime;
1822 tree edoubleprime;
1824 /* This can happen in the very weird case
1825 that our fake infinite loop edges have caused a
1826 critical edge to appear. */
1827 if (EDGE_CRITICAL_P (pred))
1829 cant_insert = true;
1830 break;
1832 bprime = pred->src;
1833 eprime = phi_translate (node->expr,
1834 ANTIC_IN (block),
1835 bprime, block);
1837 /* eprime will generally only be NULL if the
1838 value of the expression, translated
1839 through the PHI for this predecessor, is
1840 undefined. If that is the case, we can't
1841 make the expression fully redundant,
1842 because its value is undefined along a
1843 predecessor path. We can thus break out
1844 early because it doesn't matter what the
1845 rest of the results are. */
1846 if (eprime == NULL)
1848 cant_insert = true;
1849 break;
1852 eprime = fully_constant_expression (eprime);
1853 vprime = get_value_handle (eprime);
1854 gcc_assert (vprime);
1855 edoubleprime = bitmap_find_leader (AVAIL_OUT (bprime),
1856 vprime);
1857 if (edoubleprime == NULL)
1859 avail[bprime->index] = eprime;
1860 all_same = false;
1862 else
1864 avail[bprime->index] = edoubleprime;
1865 by_some = true;
1866 if (first_s == NULL)
1867 first_s = edoubleprime;
1868 else if (!operand_equal_p (first_s, edoubleprime,
1870 all_same = false;
1873 /* If we can insert it, it's not the same value
1874 already existing along every predecessor, and
1875 it's defined by some predecessor, it is
1876 partially redundant. */
1877 if (!cant_insert && !all_same && by_some)
1879 if (insert_into_preds_of_block (block, node, avail,
1880 "prephitmp"))
1881 new_stuff = true;
1883 /* If all edges produce the same value and that value is
1884 an invariant, then the PHI has the same value on all
1885 edges. Note this. */
1886 else if (!cant_insert && all_same && eprime
1887 && is_gimple_min_invariant (eprime)
1888 && !is_gimple_min_invariant (val))
1890 value_set_t exprset = VALUE_HANDLE_EXPR_SET (val);
1891 value_set_node_t node;
1892 for (node = exprset->head; node; node = node->next)
1894 if (TREE_CODE (node->expr) == SSA_NAME)
1896 vn_add (node->expr, eprime, NULL);
1897 pre_stats.constified++;
1901 free (avail);
1907 for (son = first_dom_son (CDI_DOMINATORS, block);
1908 son;
1909 son = next_dom_son (CDI_DOMINATORS, son))
1911 new_stuff |= insert_aux (son);
1914 return new_stuff;
1917 /* Perform insertion of partially redundant values. */
1919 static void
1920 insert (void)
1922 bool new_stuff = true;
1923 basic_block bb;
1924 int num_iterations = 0;
1926 FOR_ALL_BB (bb)
1927 NEW_SETS (bb) = bitmap_set_new ();
1929 while (new_stuff)
1931 num_iterations++;
1932 new_stuff = false;
1933 new_stuff = insert_aux (ENTRY_BLOCK_PTR);
1935 if (num_iterations > 2 && dump_file && (dump_flags & TDF_STATS))
1936 fprintf (dump_file, "insert required %d iterations\n", num_iterations);
1940 /* Return true if VAR is an SSA variable with no defining statement in
1941 this procedure, *AND* isn't a live-on-entry parameter. */
1943 static bool
1944 is_undefined_value (tree expr)
1946 return (TREE_CODE (expr) == SSA_NAME
1947 && IS_EMPTY_STMT (SSA_NAME_DEF_STMT (expr))
1948 /* PARM_DECLs and hard registers are always defined. */
1949 && TREE_CODE (SSA_NAME_VAR (expr)) != PARM_DECL);
1953 /* Given an SSA variable VAR and an expression EXPR, compute the value
1954 number for EXPR and create a value handle (VAL) for it. If VAR and
1955 EXPR are not the same, associate VAL with VAR. Finally, add VAR to
1956 S1 and its value handle to S2.
1958 VUSES represent the virtual use operands associated with EXPR (if
1959 any). They are used when computing the hash value for EXPR. */
1961 static inline void
1962 add_to_sets (tree var, tree expr, tree stmt, bitmap_set_t s1,
1963 bitmap_set_t s2)
1965 tree val = vn_lookup_or_add (expr, stmt);
1967 /* VAR and EXPR may be the same when processing statements for which
1968 we are not computing value numbers (e.g., non-assignments, or
1969 statements that make aliased stores). In those cases, we are
1970 only interested in making VAR available as its own value. */
1971 if (var != expr)
1972 vn_add (var, val, NULL_TREE);
1974 if (s1)
1975 bitmap_insert_into_set (s1, var);
1976 bitmap_value_insert_into_set (s2, var);
1980 /* Given a unary or binary expression EXPR, create and return a new
1981 expression with the same structure as EXPR but with its operands
1982 replaced with the value handles of each of the operands of EXPR.
1984 VUSES represent the virtual use operands associated with EXPR (if
1985 any). They are used when computing the hash value for EXPR.
1986 Insert EXPR's operands into the EXP_GEN set for BLOCK. */
1988 static inline tree
1989 create_value_expr_from (tree expr, basic_block block, tree stmt)
1991 int i;
1992 enum tree_code code = TREE_CODE (expr);
1993 tree vexpr;
1994 alloc_pool pool;
1996 gcc_assert (TREE_CODE_CLASS (code) == tcc_unary
1997 || TREE_CODE_CLASS (code) == tcc_binary
1998 || TREE_CODE_CLASS (code) == tcc_comparison
1999 || TREE_CODE_CLASS (code) == tcc_reference
2000 || TREE_CODE_CLASS (code) == tcc_expression
2001 || TREE_CODE_CLASS (code) == tcc_exceptional);
2003 if (TREE_CODE_CLASS (code) == tcc_unary)
2004 pool = unary_node_pool;
2005 else if (TREE_CODE_CLASS (code) == tcc_reference)
2006 pool = reference_node_pool;
2007 else if (TREE_CODE_CLASS (code) == tcc_binary)
2008 pool = binary_node_pool;
2009 else if (TREE_CODE_CLASS (code) == tcc_comparison)
2010 pool = comparison_node_pool;
2011 else if (TREE_CODE_CLASS (code) == tcc_exceptional)
2013 gcc_assert (code == TREE_LIST);
2014 pool = list_node_pool;
2016 else
2018 gcc_assert (code == CALL_EXPR);
2019 pool = expression_node_pool;
2022 vexpr = pool_alloc (pool);
2023 memcpy (vexpr, expr, tree_size (expr));
2025 /* This case is only for TREE_LIST's that appear as part of
2026 CALL_EXPR's. Anything else is a bug, but we can't easily verify
2027 this, hence this comment. TREE_LIST is not handled by the
2028 general case below is because they don't have a fixed length, or
2029 operands, so you can't access purpose/value/chain through
2030 TREE_OPERAND macros. */
2032 if (code == TREE_LIST)
2034 tree op = NULL_TREE;
2035 tree temp = NULL_TREE;
2036 if (TREE_CHAIN (vexpr))
2037 temp = create_value_expr_from (TREE_CHAIN (vexpr), block, stmt);
2038 TREE_CHAIN (vexpr) = temp ? temp : TREE_CHAIN (vexpr);
2041 /* Recursively value-numberize reference ops. */
2042 if (REFERENCE_CLASS_P (TREE_VALUE (vexpr)))
2044 tree tempop;
2045 op = TREE_VALUE (vexpr);
2046 tempop = create_value_expr_from (op, block, stmt);
2047 op = tempop ? tempop : op;
2049 TREE_VALUE (vexpr) = vn_lookup_or_add (op, stmt);
2051 else
2053 op = TREE_VALUE (vexpr);
2054 TREE_VALUE (vexpr) = vn_lookup_or_add (TREE_VALUE (vexpr), NULL);
2056 /* This is the equivalent of inserting op into EXP_GEN like we
2057 do below */
2058 if (!is_undefined_value (op))
2059 value_insert_into_set (EXP_GEN (block), op);
2061 return vexpr;
2064 for (i = 0; i < TREE_CODE_LENGTH (code); i++)
2066 tree val, op;
2068 op = TREE_OPERAND (expr, i);
2069 if (op == NULL_TREE)
2070 continue;
2072 /* If OP is a constant that has overflowed, do not value number
2073 this expression. */
2074 if (CONSTANT_CLASS_P (op)
2075 && TREE_OVERFLOW (op))
2077 pool_free (pool, vexpr);
2078 return NULL;
2081 /* Recursively value-numberize reference ops and tree lists. */
2082 if (REFERENCE_CLASS_P (op))
2084 tree tempop = create_value_expr_from (op, block, stmt);
2085 op = tempop ? tempop : op;
2086 val = vn_lookup_or_add (op, stmt);
2088 else if (TREE_CODE (op) == TREE_LIST)
2090 tree tempop;
2092 gcc_assert (TREE_CODE (expr) == CALL_EXPR);
2093 tempop = create_value_expr_from (op, block, stmt);
2095 op = tempop ? tempop : op;
2096 vn_lookup_or_add (op, NULL);
2097 /* Unlike everywhere else, we do *not* want to replace the
2098 TREE_LIST itself with a value number, because support
2099 functions we call will blow up. */
2100 val = op;
2102 else
2103 /* Create a value handle for OP and add it to VEXPR. */
2104 val = vn_lookup_or_add (op, NULL);
2106 if (!is_undefined_value (op) && TREE_CODE (op) != TREE_LIST)
2107 value_insert_into_set (EXP_GEN (block), op);
2109 if (TREE_CODE (val) == VALUE_HANDLE)
2110 TREE_TYPE (val) = TREE_TYPE (TREE_OPERAND (vexpr, i));
2112 TREE_OPERAND (vexpr, i) = val;
2115 return vexpr;
2119 /* Return true if we can value number a call. This is true if we have
2120 a pure or constant call. */
2121 static bool
2122 can_value_number_call (tree stmt)
2124 tree call = get_call_expr_in (stmt);
2126 /* This is a temporary restriction until we translate vuses through
2127 phi nodes. This is only needed for PRE, of course. */
2128 if (!in_fre && !ZERO_SSA_OPERANDS (stmt, SSA_OP_ALL_VIRTUALS))
2129 return false;
2130 if (call_expr_flags (call) & (ECF_PURE | ECF_CONST))
2131 return true;
2132 return false;
2135 /* Compute the AVAIL set for all basic blocks.
2137 This function performs value numbering of the statements in each basic
2138 block. The AVAIL sets are built from information we glean while doing
2139 this value numbering, since the AVAIL sets contain only one entry per
2140 value.
2142 AVAIL_IN[BLOCK] = AVAIL_OUT[dom(BLOCK)].
2143 AVAIL_OUT[BLOCK] = AVAIL_IN[BLOCK] U PHI_GEN[BLOCK] U TMP_GEN[BLOCK]. */
2145 static void
2146 compute_avail (void)
2148 basic_block block, son;
2149 basic_block *worklist;
2150 size_t sp = 0;
2151 tree param;
2153 /* For arguments with default definitions, we pretend they are
2154 defined in the entry block. */
2155 for (param = DECL_ARGUMENTS (current_function_decl);
2156 param;
2157 param = TREE_CHAIN (param))
2159 if (default_def (param) != NULL)
2161 tree def = default_def (param);
2162 vn_lookup_or_add (def, NULL);
2163 bitmap_insert_into_set (TMP_GEN (ENTRY_BLOCK_PTR), def);
2164 bitmap_value_insert_into_set (AVAIL_OUT (ENTRY_BLOCK_PTR), def);
2168 /* Allocate the worklist. */
2169 worklist = xmalloc (sizeof (basic_block) * n_basic_blocks);
2171 /* Seed the algorithm by putting the dominator children of the entry
2172 block on the worklist. */
2173 for (son = first_dom_son (CDI_DOMINATORS, ENTRY_BLOCK_PTR);
2174 son;
2175 son = next_dom_son (CDI_DOMINATORS, son))
2176 worklist[sp++] = son;
2178 /* Loop until the worklist is empty. */
2179 while (sp)
2181 block_stmt_iterator bsi;
2182 tree stmt, phi;
2183 basic_block dom;
2185 /* Pick a block from the worklist. */
2186 block = worklist[--sp];
2188 /* Initially, the set of available values in BLOCK is that of
2189 its immediate dominator. */
2190 dom = get_immediate_dominator (CDI_DOMINATORS, block);
2191 if (dom)
2192 bitmap_set_copy (AVAIL_OUT (block), AVAIL_OUT (dom));
2194 /* Generate values for PHI nodes. */
2195 for (phi = phi_nodes (block); phi; phi = PHI_CHAIN (phi))
2196 /* We have no need for virtual phis, as they don't represent
2197 actual computations. */
2198 if (is_gimple_reg (PHI_RESULT (phi)))
2199 add_to_sets (PHI_RESULT (phi), PHI_RESULT (phi), NULL,
2200 PHI_GEN (block), AVAIL_OUT (block));
2202 /* Now compute value numbers and populate value sets with all
2203 the expressions computed in BLOCK. */
2204 for (bsi = bsi_start (block); !bsi_end_p (bsi); bsi_next (&bsi))
2206 stmt_ann_t ann;
2207 ssa_op_iter iter;
2208 tree op;
2210 stmt = bsi_stmt (bsi);
2211 ann = stmt_ann (stmt);
2213 /* We are only interested in assignments of the form
2214 X_i = EXPR, where EXPR represents an "interesting"
2215 computation, it has no volatile operands and X_i
2216 doesn't flow through an abnormal edge. */
2217 if (TREE_CODE (stmt) == MODIFY_EXPR
2218 && !ann->has_volatile_ops
2219 && TREE_CODE (TREE_OPERAND (stmt, 0)) == SSA_NAME
2220 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (TREE_OPERAND (stmt, 0)))
2222 tree lhs = TREE_OPERAND (stmt, 0);
2223 tree rhs = TREE_OPERAND (stmt, 1);
2225 STRIP_USELESS_TYPE_CONVERSION (rhs);
2226 if (UNARY_CLASS_P (rhs)
2227 || BINARY_CLASS_P (rhs)
2228 || COMPARISON_CLASS_P (rhs)
2229 || REFERENCE_CLASS_P (rhs)
2230 || (TREE_CODE (rhs) == CALL_EXPR
2231 && can_value_number_call (stmt)))
2233 /* For binary, unary, and reference expressions,
2234 create a duplicate expression with the operands
2235 replaced with the value handles of the original
2236 RHS. */
2237 tree newt = create_value_expr_from (rhs, block, stmt);
2238 if (newt)
2240 add_to_sets (lhs, newt, stmt, TMP_GEN (block),
2241 AVAIL_OUT (block));
2242 value_insert_into_set (EXP_GEN (block), newt);
2243 continue;
2246 else if (TREE_CODE (rhs) == SSA_NAME
2247 || is_gimple_min_invariant (rhs)
2248 || TREE_CODE (rhs) == ADDR_EXPR
2249 || TREE_INVARIANT (rhs)
2250 || DECL_P (rhs))
2252 /* Compute a value number for the RHS of the statement
2253 and add its value to the AVAIL_OUT set for the block.
2254 Add the LHS to TMP_GEN. */
2255 add_to_sets (lhs, rhs, stmt, TMP_GEN (block),
2256 AVAIL_OUT (block));
2258 if (TREE_CODE (rhs) == SSA_NAME
2259 && !is_undefined_value (rhs))
2260 value_insert_into_set (EXP_GEN (block), rhs);
2261 continue;
2265 /* For any other statement that we don't recognize, simply
2266 make the names generated by the statement available in
2267 AVAIL_OUT and TMP_GEN. */
2268 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_DEF)
2269 add_to_sets (op, op, NULL, TMP_GEN (block), AVAIL_OUT (block));
2271 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
2272 add_to_sets (op, op, NULL, NULL , AVAIL_OUT (block));
2275 /* Put the dominator children of BLOCK on the worklist of blocks
2276 to compute available sets for. */
2277 for (son = first_dom_son (CDI_DOMINATORS, block);
2278 son;
2279 son = next_dom_son (CDI_DOMINATORS, son))
2280 worklist[sp++] = son;
2283 free (worklist);
2287 /* Eliminate fully redundant computations. */
2289 static void
2290 eliminate (void)
2292 basic_block b;
2294 FOR_EACH_BB (b)
2296 block_stmt_iterator i;
2298 for (i = bsi_start (b); !bsi_end_p (i); bsi_next (&i))
2300 tree stmt = bsi_stmt (i);
2302 /* Lookup the RHS of the expression, see if we have an
2303 available computation for it. If so, replace the RHS with
2304 the available computation. */
2305 if (TREE_CODE (stmt) == MODIFY_EXPR
2306 && TREE_CODE (TREE_OPERAND (stmt, 0)) == SSA_NAME
2307 && TREE_CODE (TREE_OPERAND (stmt ,1)) != SSA_NAME
2308 && !is_gimple_min_invariant (TREE_OPERAND (stmt, 1))
2309 && !stmt_ann (stmt)->has_volatile_ops)
2311 tree lhs = TREE_OPERAND (stmt, 0);
2312 tree *rhs_p = &TREE_OPERAND (stmt, 1);
2313 tree sprime;
2315 sprime = bitmap_find_leader (AVAIL_OUT (b),
2316 vn_lookup (lhs, NULL));
2317 if (sprime
2318 && sprime != lhs
2319 && (TREE_CODE (*rhs_p) != SSA_NAME
2320 || may_propagate_copy (*rhs_p, sprime)))
2322 gcc_assert (sprime != *rhs_p);
2324 if (dump_file && (dump_flags & TDF_DETAILS))
2326 fprintf (dump_file, "Replaced ");
2327 print_generic_expr (dump_file, *rhs_p, 0);
2328 fprintf (dump_file, " with ");
2329 print_generic_expr (dump_file, sprime, 0);
2330 fprintf (dump_file, " in ");
2331 print_generic_stmt (dump_file, stmt, 0);
2333 if (TREE_CODE (sprime) == SSA_NAME)
2334 NECESSARY (SSA_NAME_DEF_STMT (sprime)) = 1;
2335 pre_stats.eliminations++;
2336 propagate_tree_value (rhs_p, sprime);
2337 update_stmt (stmt);
2339 /* If we removed EH side effects from the statement, clean
2340 its EH information. */
2341 if (maybe_clean_or_replace_eh_stmt (stmt, stmt))
2343 bitmap_set_bit (need_eh_cleanup,
2344 bb_for_stmt (stmt)->index);
2345 if (dump_file && (dump_flags & TDF_DETAILS))
2346 fprintf (dump_file, " Removed EH side effects.\n");
2354 /* Borrow a bit of tree-ssa-dce.c for the moment.
2355 XXX: In 4.1, we should be able to just run a DCE pass after PRE, though
2356 this may be a bit faster, and we may want critical edges kept split. */
2358 /* If OP's defining statement has not already been determined to be necessary,
2359 mark that statement necessary. Return the stmt, if it is newly
2360 necessary. */
2362 static inline tree
2363 mark_operand_necessary (tree op)
2365 tree stmt;
2367 gcc_assert (op);
2369 stmt = SSA_NAME_DEF_STMT (op);
2370 gcc_assert (stmt);
2372 if (NECESSARY (stmt)
2373 || IS_EMPTY_STMT (stmt))
2374 return NULL;
2376 NECESSARY (stmt) = 1;
2377 return stmt;
2380 /* Because we don't follow exactly the standard PRE algorithm, and decide not
2381 to insert PHI nodes sometimes, and because value numbering of casts isn't
2382 perfect, we sometimes end up inserting dead code. This simple DCE-like
2383 pass removes any insertions we made that weren't actually used. */
2385 static void
2386 remove_dead_inserted_code (void)
2388 VEC(tree,heap) *worklist = NULL;
2389 int i;
2390 tree t;
2392 worklist = VEC_alloc (tree, heap, VEC_length (tree, inserted_exprs));
2393 for (i = 0; VEC_iterate (tree, inserted_exprs, i, t); i++)
2395 if (NECESSARY (t))
2396 VEC_quick_push (tree, worklist, t);
2398 while (VEC_length (tree, worklist) > 0)
2400 t = VEC_pop (tree, worklist);
2401 if (TREE_CODE (t) == PHI_NODE)
2403 /* PHI nodes are somewhat special in that each PHI alternative has
2404 data and control dependencies. All the statements feeding the
2405 PHI node's arguments are always necessary. In aggressive mode,
2406 we also consider the control dependent edges leading to the
2407 predecessor block associated with each PHI alternative as
2408 necessary. */
2409 int k;
2411 VEC_reserve (tree, heap, worklist, PHI_NUM_ARGS (t));
2412 for (k = 0; k < PHI_NUM_ARGS (t); k++)
2414 tree arg = PHI_ARG_DEF (t, k);
2415 if (TREE_CODE (arg) == SSA_NAME)
2417 arg = mark_operand_necessary (arg);
2418 if (arg)
2419 VEC_quick_push (tree, worklist, arg);
2423 else
2425 /* Propagate through the operands. Examine all the USE, VUSE and
2426 V_MAY_DEF operands in this statement. Mark all the statements
2427 which feed this statement's uses as necessary. */
2428 ssa_op_iter iter;
2429 tree use;
2431 /* The operands of V_MAY_DEF expressions are also needed as they
2432 represent potential definitions that may reach this
2433 statement (V_MAY_DEF operands allow us to follow def-def
2434 links). */
2436 FOR_EACH_SSA_TREE_OPERAND (use, t, iter, SSA_OP_ALL_USES)
2438 tree n = mark_operand_necessary (use);
2439 if (n)
2440 VEC_safe_push (tree, heap, worklist, n);
2444 for (i = 0; VEC_iterate (tree, inserted_exprs, i, t); i++)
2446 if (!NECESSARY (t))
2448 block_stmt_iterator bsi;
2449 if (dump_file && (dump_flags & TDF_DETAILS))
2451 fprintf (dump_file, "Removing unnecessary insertion:");
2452 print_generic_stmt (dump_file, t, 0);
2454 if (TREE_CODE (t) == PHI_NODE)
2456 remove_phi_node (t, NULL);
2458 else
2460 bsi = bsi_for_stmt (t);
2461 bsi_remove (&bsi);
2465 VEC_free (tree, heap, worklist);
2467 /* Initialize data structures used by PRE. */
2469 static void
2470 init_pre (bool do_fre)
2472 basic_block bb;
2474 in_fre = do_fre;
2476 inserted_exprs = NULL;
2477 vn_init ();
2478 if (!do_fre)
2479 current_loops = loop_optimizer_init (dump_file);
2480 connect_infinite_loops_to_exit ();
2481 memset (&pre_stats, 0, sizeof (pre_stats));
2483 /* If block 0 has more than one predecessor, it means that its PHI
2484 nodes will have arguments coming from block -1. This creates
2485 problems for several places in PRE that keep local arrays indexed
2486 by block number. To prevent this, we split the edge coming from
2487 ENTRY_BLOCK_PTR (FIXME, if ENTRY_BLOCK_PTR had an index number
2488 different than -1 we wouldn't have to hack this. tree-ssa-dce.c
2489 needs a similar change). */
2490 if (!single_pred_p (single_succ (ENTRY_BLOCK_PTR)))
2491 if (!(single_succ_edge (ENTRY_BLOCK_PTR)->flags & EDGE_ABNORMAL))
2492 split_edge (single_succ_edge (ENTRY_BLOCK_PTR));
2494 FOR_ALL_BB (bb)
2495 bb->aux = xcalloc (1, sizeof (struct bb_value_sets));
2497 bitmap_obstack_initialize (&grand_bitmap_obstack);
2498 phi_translate_table = htab_create (511, expr_pred_trans_hash,
2499 expr_pred_trans_eq, free);
2500 value_set_pool = create_alloc_pool ("Value sets",
2501 sizeof (struct value_set), 30);
2502 bitmap_set_pool = create_alloc_pool ("Bitmap sets",
2503 sizeof (struct bitmap_set), 30);
2504 value_set_node_pool = create_alloc_pool ("Value set nodes",
2505 sizeof (struct value_set_node), 30);
2506 calculate_dominance_info (CDI_POST_DOMINATORS);
2507 calculate_dominance_info (CDI_DOMINATORS);
2508 binary_node_pool = create_alloc_pool ("Binary tree nodes",
2509 tree_code_size (PLUS_EXPR), 30);
2510 unary_node_pool = create_alloc_pool ("Unary tree nodes",
2511 tree_code_size (NEGATE_EXPR), 30);
2512 reference_node_pool = create_alloc_pool ("Reference tree nodes",
2513 tree_code_size (ARRAY_REF), 30);
2514 expression_node_pool = create_alloc_pool ("Expression tree nodes",
2515 tree_code_size (CALL_EXPR), 30);
2516 list_node_pool = create_alloc_pool ("List tree nodes",
2517 tree_code_size (TREE_LIST), 30);
2518 comparison_node_pool = create_alloc_pool ("Comparison tree nodes",
2519 tree_code_size (EQ_EXPR), 30);
2520 FOR_ALL_BB (bb)
2522 EXP_GEN (bb) = set_new (true);
2523 PHI_GEN (bb) = bitmap_set_new ();
2524 TMP_GEN (bb) = bitmap_set_new ();
2525 AVAIL_OUT (bb) = bitmap_set_new ();
2528 need_eh_cleanup = BITMAP_ALLOC (NULL);
2532 /* Deallocate data structures used by PRE. */
2534 static void
2535 fini_pre (bool do_fre)
2537 basic_block bb;
2538 unsigned int i;
2540 VEC_free (tree, heap, inserted_exprs);
2541 bitmap_obstack_release (&grand_bitmap_obstack);
2542 free_alloc_pool (value_set_pool);
2543 free_alloc_pool (bitmap_set_pool);
2544 free_alloc_pool (value_set_node_pool);
2545 free_alloc_pool (binary_node_pool);
2546 free_alloc_pool (reference_node_pool);
2547 free_alloc_pool (unary_node_pool);
2548 free_alloc_pool (list_node_pool);
2549 free_alloc_pool (expression_node_pool);
2550 free_alloc_pool (comparison_node_pool);
2551 htab_delete (phi_translate_table);
2552 remove_fake_exit_edges ();
2554 FOR_ALL_BB (bb)
2556 free (bb->aux);
2557 bb->aux = NULL;
2560 free_dominance_info (CDI_POST_DOMINATORS);
2561 vn_delete ();
2563 if (!bitmap_empty_p (need_eh_cleanup))
2565 tree_purge_all_dead_eh_edges (need_eh_cleanup);
2566 cleanup_tree_cfg ();
2569 BITMAP_FREE (need_eh_cleanup);
2571 /* Wipe out pointers to VALUE_HANDLEs. In the not terribly distant
2572 future we will want them to be persistent though. */
2573 for (i = 0; i < num_ssa_names; i++)
2575 tree name = ssa_name (i);
2577 if (!name)
2578 continue;
2580 if (SSA_NAME_VALUE (name)
2581 && TREE_CODE (SSA_NAME_VALUE (name)) == VALUE_HANDLE)
2582 SSA_NAME_VALUE (name) = NULL;
2584 if (!do_fre && current_loops)
2586 loop_optimizer_finalize (current_loops, dump_file);
2587 current_loops = NULL;
2592 /* Main entry point to the SSA-PRE pass. DO_FRE is true if the caller
2593 only wants to do full redundancy elimination. */
2595 static void
2596 execute_pre (bool do_fre)
2598 init_pre (do_fre);
2600 /* Collect and value number expressions computed in each basic block. */
2601 compute_avail ();
2603 if (dump_file && (dump_flags & TDF_DETAILS))
2605 basic_block bb;
2607 FOR_ALL_BB (bb)
2609 print_value_set (dump_file, EXP_GEN (bb), "exp_gen", bb->index);
2610 bitmap_print_value_set (dump_file, TMP_GEN (bb), "tmp_gen",
2611 bb->index);
2612 bitmap_print_value_set (dump_file, AVAIL_OUT (bb), "avail_out",
2613 bb->index);
2617 /* Insert can get quite slow on an incredibly large number of basic
2618 blocks due to some quadratic behavior. Until this behavior is
2619 fixed, don't run it when he have an incredibly large number of
2620 bb's. If we aren't going to run insert, there is no point in
2621 computing ANTIC, either, even though it's plenty fast. */
2622 if (!do_fre && n_basic_blocks < 4000)
2624 compute_antic ();
2625 insert ();
2628 /* Remove all the redundant expressions. */
2629 eliminate ();
2632 if (dump_file && (dump_flags & TDF_STATS))
2634 fprintf (dump_file, "Insertions: %d\n", pre_stats.insertions);
2635 fprintf (dump_file, "New PHIs: %d\n", pre_stats.phis);
2636 fprintf (dump_file, "Eliminated: %d\n", pre_stats.eliminations);
2637 fprintf (dump_file, "Constified: %d\n", pre_stats.constified);
2640 bsi_commit_edge_inserts ();
2641 if (!do_fre)
2642 remove_dead_inserted_code ();
2643 fini_pre (do_fre);
2648 /* Gate and execute functions for PRE. */
2650 static void
2651 do_pre (void)
2653 execute_pre (false);
2656 static bool
2657 gate_pre (void)
2659 return flag_tree_pre != 0;
2662 struct tree_opt_pass pass_pre =
2664 "pre", /* name */
2665 gate_pre, /* gate */
2666 do_pre, /* execute */
2667 NULL, /* sub */
2668 NULL, /* next */
2669 0, /* static_pass_number */
2670 TV_TREE_PRE, /* tv_id */
2671 PROP_no_crit_edges | PROP_cfg
2672 | PROP_ssa | PROP_alias, /* properties_required */
2673 0, /* properties_provided */
2674 0, /* properties_destroyed */
2675 0, /* todo_flags_start */
2676 TODO_update_ssa | TODO_dump_func | TODO_ggc_collect
2677 | TODO_verify_ssa, /* todo_flags_finish */
2678 0 /* letter */
2682 /* Gate and execute functions for FRE. */
2684 static void
2685 execute_fre (void)
2687 execute_pre (true);
2690 static bool
2691 gate_fre (void)
2693 return flag_tree_fre != 0;
2696 struct tree_opt_pass pass_fre =
2698 "fre", /* name */
2699 gate_fre, /* gate */
2700 execute_fre, /* execute */
2701 NULL, /* sub */
2702 NULL, /* next */
2703 0, /* static_pass_number */
2704 TV_TREE_FRE, /* tv_id */
2705 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
2706 0, /* properties_provided */
2707 0, /* properties_destroyed */
2708 0, /* todo_flags_start */
2709 TODO_dump_func | TODO_ggc_collect | TODO_verify_ssa, /* todo_flags_finish */
2710 0 /* letter */