2 Copyright (C) 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Daniel Berlin <dan@dberlin.org> and Steven Bosscher
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
13 GCC is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to
20 the Free Software Foundation, 51 Franklin Street, Fifth Floor,
21 Boston, MA 02110-1301, USA. */
25 #include "coretypes.h"
29 #include "basic-block.h"
30 #include "diagnostic.h"
31 #include "tree-inline.h"
32 #include "tree-flow.h"
33 #include "tree-gimple.h"
34 #include "tree-dump.h"
38 #include "tree-iterator.h"
40 #include "alloc-pool.h"
41 #include "tree-pass.h"
44 #include "langhooks.h"
49 1. Avail sets can be shared by making an avail_find_leader that
50 walks up the dominator tree and looks in those avail sets.
51 This might affect code optimality, it's unclear right now.
52 2. Strength reduction can be performed by anticipating expressions
53 we can repair later on.
54 3. We can do back-substitution or smarter value numbering to catch
55 commutative expressions split up over multiple statements.
56 4. ANTIC_SAFE_LOADS could be a lot smarter than it is now.
57 Right now, it is simply calculating loads that occur before
58 any store in a block, instead of loads that occur before
59 stores that affect them. This is relatively more expensive, and
60 it's not clear how much more it will buy us.
63 /* For ease of terminology, "expression node" in the below refers to
64 every expression node but MODIFY_EXPR, because MODIFY_EXPR's represent
65 the actual statement containing the expressions we care about, and
66 we cache the value number by putting it in the expression. */
70 First we walk the statements to generate the AVAIL sets, the
71 EXP_GEN sets, and the tmp_gen sets. EXP_GEN sets represent the
72 generation of values/expressions by a given block. We use them
73 when computing the ANTIC sets. The AVAIL sets consist of
74 SSA_NAME's that represent values, so we know what values are
75 available in what blocks. AVAIL is a forward dataflow problem. In
76 SSA, values are never killed, so we don't need a kill set, or a
77 fixpoint iteration, in order to calculate the AVAIL sets. In
78 traditional parlance, AVAIL sets tell us the downsafety of the
81 Next, we generate the ANTIC sets. These sets represent the
82 anticipatable expressions. ANTIC is a backwards dataflow
83 problem.An expression is anticipatable in a given block if it could
84 be generated in that block. This means that if we had to perform
85 an insertion in that block, of the value of that expression, we
86 could. Calculating the ANTIC sets requires phi translation of
87 expressions, because the flow goes backwards through phis. We must
88 iterate to a fixpoint of the ANTIC sets, because we have a kill
89 set. Even in SSA form, values are not live over the entire
90 function, only from their definition point onwards. So we have to
91 remove values from the ANTIC set once we go past the definition
92 point of the leaders that make them up.
93 compute_antic/compute_antic_aux performs this computation.
95 Third, we perform insertions to make partially redundant
96 expressions fully redundant.
98 An expression is partially redundant (excluding partial
101 1. It is AVAIL in some, but not all, of the predecessors of a
103 2. It is ANTIC in all the predecessors.
105 In order to make it fully redundant, we insert the expression into
106 the predecessors where it is not available, but is ANTIC.
107 insert/insert_aux performs this insertion.
109 Fourth, we eliminate fully redundant expressions.
110 This is a simple statement walk that replaces redundant
111 calculations with the now available values. */
113 /* Representations of value numbers:
115 Value numbers are represented using the "value handle" approach.
116 This means that each SSA_NAME (and for other reasons to be
117 disclosed in a moment, expression nodes) has a value handle that
118 can be retrieved through get_value_handle. This value handle, *is*
119 the value number of the SSA_NAME. You can pointer compare the
120 value handles for equivalence purposes.
122 For debugging reasons, the value handle is internally more than
123 just a number, it is a VAR_DECL named "value.x", where x is a
124 unique number for each value number in use. This allows
125 expressions with SSA_NAMES replaced by value handles to still be
126 pretty printed in a sane way. They simply print as "value.3 *
129 Expression nodes have value handles associated with them as a
130 cache. Otherwise, we'd have to look them up again in the hash
131 table This makes significant difference (factor of two or more) on
132 some test cases. They can be thrown away after the pass is
135 /* Representation of expressions on value numbers:
137 In some portions of this code, you will notice we allocate "fake"
138 analogues to the expression we are value numbering, and replace the
139 operands with the values of the expression. Since we work on
140 values, and not just names, we canonicalize expressions to value
141 expressions for use in the ANTIC sets, the EXP_GEN set, etc.
143 This is theoretically unnecessary, it just saves a bunch of
144 repeated get_value_handle and find_leader calls in the remainder of
145 the code, trading off temporary memory usage for speed. The tree
146 nodes aren't actually creating more garbage, since they are
147 allocated in a special pools which are thrown away at the end of
150 All of this also means that if you print the EXP_GEN or ANTIC sets,
151 you will see "value.5 + value.7" in the set, instead of "a_55 +
152 b_66" or something. The only thing that actually cares about
153 seeing the value leaders is phi translation, and it needs to be
154 able to find the leader for a value in an arbitrary block, so this
155 "value expression" form is perfect for it (otherwise you'd do
156 get_value_handle->find_leader->translate->get_value_handle->find_leader).*/
159 /* Representation of sets:
161 There are currently two types of sets used, hopefully to be unified soon.
162 The AVAIL sets do not need to be sorted in any particular order,
163 and thus, are simply represented as two bitmaps, one that keeps
164 track of values present in the set, and one that keeps track of
165 expressions present in the set.
167 The other sets are represented as doubly linked lists kept in topological
168 order, with an optional supporting bitmap of values present in the
169 set. The sets represent values, and the elements can be values or
170 expressions. The elements can appear in different sets, but each
171 element can only appear once in each set.
173 Since each node in the set represents a value, we also want to be
174 able to map expression, set pairs to something that tells us
175 whether the value is present is a set. We use a per-set bitmap for
176 that. The value handles also point to a linked list of the
177 expressions they represent via a tree annotation. This is mainly
178 useful only for debugging, since we don't do identity lookups. */
181 static bool in_fre
= false;
183 /* A value set element. Basically a single linked list of
184 expressions/values. */
185 typedef struct value_set_node
190 /* A pointer to the next element of the value set. */
191 struct value_set_node
*next
;
195 /* A value set. This is a singly linked list of value_set_node
196 elements with a possible bitmap that tells us what values exist in
197 the set. This set must be kept in topologically sorted order. */
198 typedef struct value_set
200 /* The head of the list. Used for iterating over the list in
202 value_set_node_t head
;
204 /* The tail of the list. Used for tail insertions, which are
205 necessary to keep the set in topologically sorted order because
206 of how the set is built. */
207 value_set_node_t tail
;
209 /* The length of the list. */
212 /* True if the set is indexed, which means it contains a backing
213 bitmap for quick determination of whether certain values exist in the
217 /* The bitmap of values that exist in the set. May be NULL in an
218 empty or non-indexed set. */
224 /* An unordered bitmap set. One bitmap tracks values, the other,
226 typedef struct bitmap_set
232 /* Sets that we need to keep track of. */
233 typedef struct bb_value_sets
235 /* The EXP_GEN set, which represents expressions/values generated in
239 /* The PHI_GEN set, which represents PHI results generated in a
241 bitmap_set_t phi_gen
;
243 /* The TMP_GEN set, which represents results/temporaries generated
244 in a basic block. IE the LHS of an expression. */
245 bitmap_set_t tmp_gen
;
247 /* The AVAIL_OUT set, which represents which values are available in
248 a given basic block. */
249 bitmap_set_t avail_out
;
251 /* The ANTIC_IN set, which represents which values are anticipatable
252 in a given basic block. */
253 value_set_t antic_in
;
255 /* The NEW_SETS set, which is used during insertion to augment the
256 AVAIL_OUT set of blocks with the new insertions performed during
257 the current iteration. */
258 bitmap_set_t new_sets
;
260 /* The RVUSE sets, which are used during ANTIC computation to ensure
261 that we don't mark loads ANTIC once they have died. */
267 /* For actually occurring loads, as long as they occur before all the
268 other stores in the block, we know they are antic at the top of
269 the block, regardless of RVUSE_KILL. */
270 value_set_t antic_safe_loads
;
273 #define EXP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->exp_gen
274 #define PHI_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->phi_gen
275 #define TMP_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->tmp_gen
276 #define AVAIL_OUT(BB) ((bb_value_sets_t) ((BB)->aux))->avail_out
277 #define ANTIC_IN(BB) ((bb_value_sets_t) ((BB)->aux))->antic_in
278 #define RVUSE_IN(BB) ((bb_value_sets_t) ((BB)->aux))->rvuse_in
279 #define RVUSE_GEN(BB) ((bb_value_sets_t) ((BB)->aux))->rvuse_gen
280 #define RVUSE_KILL(BB) ((bb_value_sets_t) ((BB)->aux))->rvuse_kill
281 #define RVUSE_OUT(BB) ((bb_value_sets_t) ((BB)->aux))->rvuse_out
282 #define NEW_SETS(BB) ((bb_value_sets_t) ((BB)->aux))->new_sets
283 #define ANTIC_SAFE_LOADS(BB) ((bb_value_sets_t) ((BB)->aux))->antic_safe_loads
285 /* This structure is used to keep track of statistics on what
286 optimization PRE was able to perform. */
289 /* The number of RHS computations eliminated by PRE. */
292 /* The number of new expressions/temporaries generated by PRE. */
295 /* The number of new PHI nodes added by PRE. */
298 /* The number of values found constant. */
304 static tree
bitmap_find_leader (bitmap_set_t
, tree
);
305 static tree
find_leader (value_set_t
, tree
);
306 static void value_insert_into_set (value_set_t
, tree
);
307 static void bitmap_value_insert_into_set (bitmap_set_t
, tree
);
308 static void bitmap_value_replace_in_set (bitmap_set_t
, tree
);
309 static void insert_into_set (value_set_t
, tree
);
310 static void bitmap_set_copy (bitmap_set_t
, bitmap_set_t
);
311 static bool bitmap_set_contains_value (bitmap_set_t
, tree
);
312 static bitmap_set_t
bitmap_set_new (void);
313 static value_set_t
set_new (bool);
314 static bool is_undefined_value (tree
);
315 static tree
create_expression_by_pieces (basic_block
, tree
, tree
);
316 static tree
find_or_generate_expression (basic_block
, tree
, tree
);
319 /* We can add and remove elements and entries to and from sets
320 and hash tables, so we use alloc pools for them. */
322 static alloc_pool value_set_pool
;
323 static alloc_pool bitmap_set_pool
;
324 static alloc_pool value_set_node_pool
;
325 static alloc_pool binary_node_pool
;
326 static alloc_pool unary_node_pool
;
327 static alloc_pool reference_node_pool
;
328 static alloc_pool comparison_node_pool
;
329 static alloc_pool expression_node_pool
;
330 static alloc_pool list_node_pool
;
331 static alloc_pool modify_expr_node_pool
;
332 static bitmap_obstack grand_bitmap_obstack
;
334 /* To avoid adding 300 temporary variables when we only need one, we
335 only create one temporary variable, on demand, and build ssa names
336 off that. We do have to change the variable if the types don't
337 match the current variable's type. */
339 static tree storetemp
;
340 static tree mergephitemp
;
341 static tree prephitemp
;
343 /* Set of blocks with statements that have had its EH information
345 static bitmap need_eh_cleanup
;
347 /* The phi_translate_table caches phi translations for a given
348 expression and predecessor. */
350 static htab_t phi_translate_table
;
352 /* A three tuple {e, pred, v} used to cache phi translations in the
353 phi_translate_table. */
355 typedef struct expr_pred_trans_d
357 /* The expression. */
360 /* The predecessor block along which we translated the expression. */
363 /* vuses associated with the expression. */
364 VEC (tree
, gc
) *vuses
;
366 /* The value that resulted from the translation. */
370 /* The hashcode for the expression, pred pair. This is cached for
373 } *expr_pred_trans_t
;
375 /* Return the hash value for a phi translation table entry. */
378 expr_pred_trans_hash (const void *p
)
380 const expr_pred_trans_t ve
= (expr_pred_trans_t
) p
;
384 /* Return true if two phi translation table entries are the same.
385 P1 and P2 should point to the expr_pred_trans_t's to be compared.*/
388 expr_pred_trans_eq (const void *p1
, const void *p2
)
390 const expr_pred_trans_t ve1
= (expr_pred_trans_t
) p1
;
391 const expr_pred_trans_t ve2
= (expr_pred_trans_t
) p2
;
392 basic_block b1
= ve1
->pred
;
393 basic_block b2
= ve2
->pred
;
397 /* If they are not translations for the same basic block, they can't
403 /* If they are for the same basic block, determine if the
404 expressions are equal. */
405 if (!expressions_equal_p (ve1
->e
, ve2
->e
))
408 /* Make sure the vuses are equivalent. */
409 if (ve1
->vuses
== ve2
->vuses
)
412 if (VEC_length (tree
, ve1
->vuses
) != VEC_length (tree
, ve2
->vuses
))
415 for (i
= 0; VEC_iterate (tree
, ve1
->vuses
, i
, vuse1
); i
++)
417 if (VEC_index (tree
, ve2
->vuses
, i
) != vuse1
)
424 /* Search in the phi translation table for the translation of
425 expression E in basic block PRED with vuses VUSES.
426 Return the translated value, if found, NULL otherwise. */
429 phi_trans_lookup (tree e
, basic_block pred
, VEC (tree
, gc
) *vuses
)
432 struct expr_pred_trans_d ept
;
437 ept
.hashcode
= vn_compute (e
, (unsigned long) pred
);
438 slot
= htab_find_slot_with_hash (phi_translate_table
, &ept
, ept
.hashcode
,
443 return ((expr_pred_trans_t
) *slot
)->v
;
447 /* Add the tuple mapping from {expression E, basic block PRED, vuses VUSES} to
448 value V, to the phi translation table. */
451 phi_trans_add (tree e
, tree v
, basic_block pred
, VEC (tree
, gc
) *vuses
)
454 expr_pred_trans_t new_pair
= XNEW (struct expr_pred_trans_d
);
456 new_pair
->pred
= pred
;
457 new_pair
->vuses
= vuses
;
459 new_pair
->hashcode
= vn_compute (e
, (unsigned long) pred
);
460 slot
= htab_find_slot_with_hash (phi_translate_table
, new_pair
,
461 new_pair
->hashcode
, INSERT
);
464 *slot
= (void *) new_pair
;
468 /* Add expression E to the expression set of value V. */
471 add_to_value (tree v
, tree e
)
473 /* Constants have no expression sets. */
474 if (is_gimple_min_invariant (v
))
477 if (VALUE_HANDLE_EXPR_SET (v
) == NULL
)
478 VALUE_HANDLE_EXPR_SET (v
) = set_new (false);
480 insert_into_set (VALUE_HANDLE_EXPR_SET (v
), e
);
484 /* Return true if value V exists in the bitmap for SET. */
487 value_exists_in_set_bitmap (value_set_t set
, tree v
)
492 return bitmap_bit_p (set
->values
, VALUE_HANDLE_ID (v
));
496 /* Remove value V from the bitmap for SET. */
499 value_remove_from_set_bitmap (value_set_t set
, tree v
)
501 gcc_assert (set
->indexed
);
506 bitmap_clear_bit (set
->values
, VALUE_HANDLE_ID (v
));
510 /* Insert the value number V into the bitmap of values existing in
514 value_insert_into_set_bitmap (value_set_t set
, tree v
)
516 gcc_assert (set
->indexed
);
518 if (set
->values
== NULL
)
519 set
->values
= BITMAP_ALLOC (&grand_bitmap_obstack
);
521 bitmap_set_bit (set
->values
, VALUE_HANDLE_ID (v
));
525 /* Create a new bitmap set and return it. */
528 bitmap_set_new (void)
530 bitmap_set_t ret
= (bitmap_set_t
) pool_alloc (bitmap_set_pool
);
531 ret
->expressions
= BITMAP_ALLOC (&grand_bitmap_obstack
);
532 ret
->values
= BITMAP_ALLOC (&grand_bitmap_obstack
);
536 /* Create a new set. */
539 set_new (bool indexed
)
542 ret
= (value_set_t
) pool_alloc (value_set_pool
);
543 ret
->head
= ret
->tail
= NULL
;
545 ret
->indexed
= indexed
;
550 /* Insert an expression EXPR into a bitmapped set. */
553 bitmap_insert_into_set (bitmap_set_t set
, tree expr
)
556 /* XXX: For now, we only let SSA_NAMES into the bitmap sets. */
557 gcc_assert (TREE_CODE (expr
) == SSA_NAME
);
558 val
= get_value_handle (expr
);
561 if (!is_gimple_min_invariant (val
))
563 bitmap_set_bit (set
->values
, VALUE_HANDLE_ID (val
));
564 bitmap_set_bit (set
->expressions
, SSA_NAME_VERSION (expr
));
568 /* Insert EXPR into SET. */
571 insert_into_set (value_set_t set
, tree expr
)
573 value_set_node_t newnode
= (value_set_node_t
) pool_alloc (value_set_node_pool
);
574 tree val
= get_value_handle (expr
);
577 if (is_gimple_min_invariant (val
))
580 /* For indexed sets, insert the value into the set value bitmap.
581 For all sets, add it to the linked list and increment the list
584 value_insert_into_set_bitmap (set
, val
);
586 newnode
->next
= NULL
;
587 newnode
->expr
= expr
;
589 if (set
->head
== NULL
)
591 set
->head
= set
->tail
= newnode
;
595 set
->tail
->next
= newnode
;
600 /* Copy a bitmapped set ORIG, into bitmapped set DEST. */
603 bitmap_set_copy (bitmap_set_t dest
, bitmap_set_t orig
)
605 bitmap_copy (dest
->expressions
, orig
->expressions
);
606 bitmap_copy (dest
->values
, orig
->values
);
609 /* Perform bitmapped set operation DEST &= ORIG. */
612 bitmap_set_and (bitmap_set_t dest
, bitmap_set_t orig
)
616 bitmap temp
= BITMAP_ALLOC (&grand_bitmap_obstack
);
618 bitmap_and_into (dest
->values
, orig
->values
);
619 bitmap_copy (temp
, dest
->expressions
);
620 EXECUTE_IF_SET_IN_BITMAP (temp
, 0, i
, bi
)
622 tree name
= ssa_name (i
);
623 tree val
= get_value_handle (name
);
624 if (!bitmap_bit_p (dest
->values
, VALUE_HANDLE_ID (val
)))
625 bitmap_clear_bit (dest
->expressions
, i
);
630 /* Perform bitmapped value set operation DEST = DEST & ~ORIG. */
633 bitmap_set_and_compl (bitmap_set_t dest
, bitmap_set_t orig
)
637 bitmap temp
= BITMAP_ALLOC (&grand_bitmap_obstack
);
639 bitmap_and_compl_into (dest
->values
, orig
->values
);
640 bitmap_copy (temp
, dest
->expressions
);
641 EXECUTE_IF_SET_IN_BITMAP (temp
, 0, i
, bi
)
643 tree name
= ssa_name (i
);
644 tree val
= get_value_handle (name
);
645 if (!bitmap_bit_p (dest
->values
, VALUE_HANDLE_ID (val
)))
646 bitmap_clear_bit (dest
->expressions
, i
);
651 /* Return true if the bitmap set SET is empty. */
654 bitmap_set_empty_p (bitmap_set_t set
)
656 return bitmap_empty_p (set
->values
);
659 /* Copy the set ORIG to the set DEST. */
662 set_copy (value_set_t dest
, value_set_t orig
)
664 value_set_node_t node
;
666 if (!orig
|| !orig
->head
)
669 for (node
= orig
->head
;
673 insert_into_set (dest
, node
->expr
);
677 /* Remove EXPR from SET. */
680 set_remove (value_set_t set
, tree expr
)
682 value_set_node_t node
, prev
;
684 /* Remove the value of EXPR from the bitmap, decrement the set
685 length, and remove it from the actual double linked list. */
686 value_remove_from_set_bitmap (set
, get_value_handle (expr
));
689 for (node
= set
->head
;
691 prev
= node
, node
= node
->next
)
693 if (node
->expr
== expr
)
696 set
->head
= node
->next
;
698 prev
->next
= node
->next
;
700 if (node
== set
->tail
)
702 pool_free (value_set_node_pool
, node
);
708 /* Return true if SET contains the value VAL. */
711 set_contains_value (value_set_t set
, tree val
)
713 /* All constants are in every set. */
714 if (is_gimple_min_invariant (val
))
717 if (!set
|| set
->length
== 0)
720 return value_exists_in_set_bitmap (set
, val
);
723 /* Return true if bitmapped set SET contains the expression EXPR. */
725 bitmap_set_contains (bitmap_set_t set
, tree expr
)
727 /* All constants are in every set. */
728 if (is_gimple_min_invariant (get_value_handle (expr
)))
731 /* XXX: Bitmapped sets only contain SSA_NAME's for now. */
732 if (TREE_CODE (expr
) != SSA_NAME
)
734 return bitmap_bit_p (set
->expressions
, SSA_NAME_VERSION (expr
));
738 /* Return true if bitmapped set SET contains the value VAL. */
741 bitmap_set_contains_value (bitmap_set_t set
, tree val
)
743 if (is_gimple_min_invariant (val
))
745 return bitmap_bit_p (set
->values
, VALUE_HANDLE_ID (val
));
748 /* Replace an instance of value LOOKFOR with expression EXPR in SET. */
751 bitmap_set_replace_value (bitmap_set_t set
, tree lookfor
, tree expr
)
754 value_set_node_t node
;
755 if (is_gimple_min_invariant (lookfor
))
757 if (!bitmap_set_contains_value (set
, lookfor
))
760 /* The number of expressions having a given value is usually
761 significantly less than the total number of expressions in SET.
762 Thus, rather than check, for each expression in SET, whether it
763 has the value LOOKFOR, we walk the reverse mapping that tells us
764 what expressions have a given value, and see if any of those
765 expressions are in our set. For large testcases, this is about
766 5-10x faster than walking the bitmap. If this is somehow a
767 significant lose for some cases, we can choose which set to walk
768 based on the set size. */
769 exprset
= VALUE_HANDLE_EXPR_SET (lookfor
);
770 for (node
= exprset
->head
; node
; node
= node
->next
)
772 if (TREE_CODE (node
->expr
) == SSA_NAME
)
774 if (bitmap_bit_p (set
->expressions
, SSA_NAME_VERSION (node
->expr
)))
776 bitmap_clear_bit (set
->expressions
, SSA_NAME_VERSION (node
->expr
));
777 bitmap_set_bit (set
->expressions
, SSA_NAME_VERSION (expr
));
784 /* Subtract bitmapped set B from value set A, and return the new set. */
787 bitmap_set_subtract_from_value_set (value_set_t a
, bitmap_set_t b
,
790 value_set_t ret
= set_new (indexed
);
791 value_set_node_t node
;
796 if (!bitmap_set_contains (b
, node
->expr
))
797 insert_into_set (ret
, node
->expr
);
802 /* Return true if two sets are equal. */
805 set_equal (value_set_t a
, value_set_t b
)
807 value_set_node_t node
;
809 if (a
->length
!= b
->length
)
815 if (!set_contains_value (b
, get_value_handle (node
->expr
)))
821 /* Replace an instance of EXPR's VALUE with EXPR in SET if it exists,
822 and add it otherwise. */
825 bitmap_value_replace_in_set (bitmap_set_t set
, tree expr
)
827 tree val
= get_value_handle (expr
);
828 if (bitmap_set_contains_value (set
, val
))
829 bitmap_set_replace_value (set
, val
, expr
);
831 bitmap_insert_into_set (set
, expr
);
834 /* Insert EXPR into SET if EXPR's value is not already present in
838 bitmap_value_insert_into_set (bitmap_set_t set
, tree expr
)
840 tree val
= get_value_handle (expr
);
842 if (is_gimple_min_invariant (val
))
845 if (!bitmap_set_contains_value (set
, val
))
846 bitmap_insert_into_set (set
, expr
);
849 /* Insert the value for EXPR into SET, if it doesn't exist already. */
852 value_insert_into_set (value_set_t set
, tree expr
)
854 tree val
= get_value_handle (expr
);
856 /* Constant and invariant values exist everywhere, and thus,
857 actually keeping them in the sets is pointless. */
858 if (is_gimple_min_invariant (val
))
861 if (!set_contains_value (set
, val
))
862 insert_into_set (set
, expr
);
866 /* Print out SET to OUTFILE. */
869 bitmap_print_value_set (FILE *outfile
, bitmap_set_t set
,
870 const char *setname
, int blockindex
)
872 fprintf (outfile
, "%s[%d] := { ", setname
, blockindex
);
879 EXECUTE_IF_SET_IN_BITMAP (set
->expressions
, 0, i
, bi
)
882 fprintf (outfile
, ", ");
884 print_generic_expr (outfile
, ssa_name (i
), 0);
886 fprintf (outfile
, " (");
887 print_generic_expr (outfile
, get_value_handle (ssa_name (i
)), 0);
888 fprintf (outfile
, ") ");
891 fprintf (outfile
, " }\n");
893 /* Print out the value_set SET to OUTFILE. */
896 print_value_set (FILE *outfile
, value_set_t set
,
897 const char *setname
, int blockindex
)
899 value_set_node_t node
;
900 fprintf (outfile
, "%s[%d] := { ", setname
, blockindex
);
903 for (node
= set
->head
;
907 print_generic_expr (outfile
, node
->expr
, 0);
909 fprintf (outfile
, " (");
910 print_generic_expr (outfile
, get_value_handle (node
->expr
), 0);
911 fprintf (outfile
, ") ");
914 fprintf (outfile
, ", ");
918 fprintf (outfile
, " }\n");
921 /* Print out the expressions that have VAL to OUTFILE. */
924 print_value_expressions (FILE *outfile
, tree val
)
926 if (VALUE_HANDLE_EXPR_SET (val
))
929 sprintf (s
, "VH.%04d", VALUE_HANDLE_ID (val
));
930 print_value_set (outfile
, VALUE_HANDLE_EXPR_SET (val
), s
, 0);
936 debug_value_expressions (tree val
)
938 print_value_expressions (stderr
, val
);
942 void debug_value_set (value_set_t
, const char *, int);
945 debug_value_set (value_set_t set
, const char *setname
, int blockindex
)
947 print_value_set (stderr
, set
, setname
, blockindex
);
950 /* Return the folded version of T if T, when folded, is a gimple
951 min_invariant. Otherwise, return T. */
954 fully_constant_expression (tree t
)
958 if (folded
&& is_gimple_min_invariant (folded
))
963 /* Return a copy of a chain of nodes, chained through the TREE_CHAIN field.
964 For example, this can copy a list made of TREE_LIST nodes.
965 Allocates the nodes in list_node_pool*/
968 pool_copy_list (tree list
)
975 head
= (tree
) pool_alloc (list_node_pool
);
977 memcpy (head
, list
, tree_size (list
));
980 next
= TREE_CHAIN (list
);
983 TREE_CHAIN (prev
) = (tree
) pool_alloc (list_node_pool
);
984 memcpy (TREE_CHAIN (prev
), next
, tree_size (next
));
985 prev
= TREE_CHAIN (prev
);
986 next
= TREE_CHAIN (next
);
991 /* Translate the vuses in the VUSES vector backwards through phi
992 nodes, so that they have the value they would have in BLOCK. */
994 static VEC(tree
, gc
) *
995 translate_vuses_through_block (VEC (tree
, gc
) *vuses
, basic_block block
)
998 VEC(tree
, gc
) *result
= NULL
;
1001 for (i
= 0; VEC_iterate (tree
, vuses
, i
, oldvuse
); i
++)
1003 tree phi
= SSA_NAME_DEF_STMT (oldvuse
);
1004 if (TREE_CODE (phi
) == PHI_NODE
)
1006 edge e
= find_edge (block
, bb_for_stmt (phi
));
1009 tree def
= PHI_ARG_DEF (phi
, e
->dest_idx
);
1013 result
= VEC_copy (tree
, gc
, vuses
);
1014 VEC_replace (tree
, result
, i
, def
);
1021 sort_vuses (result
);
1027 /* Translate EXPR using phis in PHIBLOCK, so that it has the values of
1028 the phis in PRED. Return NULL if we can't find a leader for each
1029 part of the translated expression. */
1032 phi_translate (tree expr
, value_set_t set
, basic_block pred
,
1033 basic_block phiblock
)
1035 tree phitrans
= NULL
;
1036 tree oldexpr
= expr
;
1040 if (is_gimple_min_invariant (expr
))
1043 /* Phi translations of a given expression don't change. */
1048 vh
= get_value_handle (expr
);
1049 if (vh
&& TREE_CODE (vh
) == VALUE_HANDLE
)
1050 phitrans
= phi_trans_lookup (expr
, pred
, VALUE_HANDLE_VUSES (vh
));
1052 phitrans
= phi_trans_lookup (expr
, pred
, NULL
);
1055 phitrans
= phi_trans_lookup (expr
, pred
, NULL
);
1060 switch (TREE_CODE_CLASS (TREE_CODE (expr
)))
1062 case tcc_expression
:
1064 if (TREE_CODE (expr
) != CALL_EXPR
)
1068 tree oldop0
= TREE_OPERAND (expr
, 0);
1069 tree oldarglist
= TREE_OPERAND (expr
, 1);
1070 tree oldop2
= TREE_OPERAND (expr
, 2);
1077 tree vh
= get_value_handle (expr
);
1078 bool listchanged
= false;
1079 VEC (tree
, gc
) *vuses
= VALUE_HANDLE_VUSES (vh
);
1080 VEC (tree
, gc
) *tvuses
;
1082 /* Call expressions are kind of weird because they have an
1083 argument list. We don't want to value number the list
1084 as one value number, because that doesn't make much
1085 sense, and just breaks the support functions we call,
1086 which expect TREE_OPERAND (call_expr, 2) to be a
1089 newop0
= phi_translate (find_leader (set
, oldop0
),
1090 set
, pred
, phiblock
);
1095 newop2
= phi_translate (find_leader (set
, oldop2
),
1096 set
, pred
, phiblock
);
1101 /* phi translate the argument list piece by piece.
1103 We could actually build the list piece by piece here,
1104 but it's likely to not be worth the memory we will save,
1105 unless you have millions of call arguments. */
1107 newarglist
= pool_copy_list (oldarglist
);
1108 for (oldwalker
= oldarglist
, newwalker
= newarglist
;
1109 oldwalker
&& newwalker
;
1110 oldwalker
= TREE_CHAIN (oldwalker
),
1111 newwalker
= TREE_CHAIN (newwalker
))
1114 tree oldval
= TREE_VALUE (oldwalker
);
1118 /* This may seem like a weird place for this
1119 check, but it's actually the easiest place to
1120 do it. We can't do it lower on in the
1121 recursion because it's valid for pieces of a
1122 component ref to be of AGGREGATE_TYPE, as long
1123 as the outermost one is not.
1124 To avoid *that* case, we have a check for
1125 AGGREGATE_TYPE_P in insert_aux. However, that
1126 check will *not* catch this case because here
1127 it occurs in the argument list. */
1128 if (AGGREGATE_TYPE_P (TREE_TYPE (oldval
)))
1130 newval
= phi_translate (find_leader (set
, oldval
),
1131 set
, pred
, phiblock
);
1134 if (newval
!= oldval
)
1137 TREE_VALUE (newwalker
) = get_value_handle (newval
);
1142 vn_lookup_or_add (newarglist
, NULL
);
1144 tvuses
= translate_vuses_through_block (vuses
, pred
);
1146 if (listchanged
|| (newop0
!= oldop0
) || (oldop2
!= newop2
)
1149 newexpr
= (tree
) pool_alloc (expression_node_pool
);
1150 memcpy (newexpr
, expr
, tree_size (expr
));
1151 TREE_OPERAND (newexpr
, 0) = newop0
== oldop0
? oldop0
: get_value_handle (newop0
);
1152 TREE_OPERAND (newexpr
, 1) = listchanged
? newarglist
: oldarglist
;
1153 TREE_OPERAND (newexpr
, 2) = newop2
== oldop2
? oldop2
: get_value_handle (newop2
);
1154 newexpr
->common
.ann
= NULL
;
1155 vn_lookup_or_add_with_vuses (newexpr
, tvuses
);
1157 phi_trans_add (oldexpr
, newexpr
, pred
, tvuses
);
1163 case tcc_declaration
:
1165 VEC (tree
, gc
) * oldvuses
= NULL
;
1166 VEC (tree
, gc
) * newvuses
= NULL
;
1168 oldvuses
= VALUE_HANDLE_VUSES (get_value_handle (expr
));
1170 newvuses
= translate_vuses_through_block (oldvuses
, pred
);
1172 if (oldvuses
!= newvuses
)
1173 vn_lookup_or_add_with_vuses (expr
, newvuses
);
1175 phi_trans_add (oldexpr
, expr
, pred
, newvuses
);
1181 tree oldop0
= TREE_OPERAND (expr
, 0);
1190 VEC (tree
, gc
) * oldvuses
= NULL
;
1191 VEC (tree
, gc
) * newvuses
= NULL
;
1193 if (TREE_CODE (expr
) != INDIRECT_REF
1194 && TREE_CODE (expr
) != COMPONENT_REF
1195 && TREE_CODE (expr
) != ARRAY_REF
)
1198 newop0
= phi_translate (find_leader (set
, oldop0
),
1199 set
, pred
, phiblock
);
1203 if (TREE_CODE (expr
) == ARRAY_REF
)
1205 oldop1
= TREE_OPERAND (expr
, 1);
1206 newop1
= phi_translate (find_leader (set
, oldop1
),
1207 set
, pred
, phiblock
);
1211 oldop2
= TREE_OPERAND (expr
, 2);
1214 newop2
= phi_translate (find_leader (set
, oldop2
),
1215 set
, pred
, phiblock
);
1220 oldop3
= TREE_OPERAND (expr
, 3);
1223 newop3
= phi_translate (find_leader (set
, oldop3
),
1224 set
, pred
, phiblock
);
1231 oldvuses
= VALUE_HANDLE_VUSES (get_value_handle (expr
));
1233 newvuses
= translate_vuses_through_block (oldvuses
, pred
);
1235 if (newop0
!= oldop0
|| newvuses
!= oldvuses
1238 || newop3
!= oldop3
)
1242 newexpr
= pool_alloc (reference_node_pool
);
1243 memcpy (newexpr
, expr
, tree_size (expr
));
1244 TREE_OPERAND (newexpr
, 0) = get_value_handle (newop0
);
1245 if (TREE_CODE (expr
) == ARRAY_REF
)
1247 TREE_OPERAND (newexpr
, 1) = get_value_handle (newop1
);
1249 TREE_OPERAND (newexpr
, 2) = get_value_handle (newop2
);
1251 TREE_OPERAND (newexpr
, 3) = get_value_handle (newop3
);
1254 t
= fully_constant_expression (newexpr
);
1258 pool_free (reference_node_pool
, newexpr
);
1263 newexpr
->common
.ann
= NULL
;
1264 vn_lookup_or_add_with_vuses (newexpr
, newvuses
);
1267 phi_trans_add (oldexpr
, newexpr
, pred
, newvuses
);
1274 case tcc_comparison
:
1276 tree oldop1
= TREE_OPERAND (expr
, 0);
1277 tree oldop2
= TREE_OPERAND (expr
, 1);
1282 newop1
= phi_translate (find_leader (set
, oldop1
),
1283 set
, pred
, phiblock
);
1286 newop2
= phi_translate (find_leader (set
, oldop2
),
1287 set
, pred
, phiblock
);
1290 if (newop1
!= oldop1
|| newop2
!= oldop2
)
1293 newexpr
= (tree
) pool_alloc (binary_node_pool
);
1294 memcpy (newexpr
, expr
, tree_size (expr
));
1295 TREE_OPERAND (newexpr
, 0) = newop1
== oldop1
? oldop1
: get_value_handle (newop1
);
1296 TREE_OPERAND (newexpr
, 1) = newop2
== oldop2
? oldop2
: get_value_handle (newop2
);
1297 t
= fully_constant_expression (newexpr
);
1300 pool_free (binary_node_pool
, newexpr
);
1305 newexpr
->common
.ann
= NULL
;
1306 vn_lookup_or_add (newexpr
, NULL
);
1309 phi_trans_add (oldexpr
, newexpr
, pred
, NULL
);
1316 tree oldop1
= TREE_OPERAND (expr
, 0);
1320 newop1
= phi_translate (find_leader (set
, oldop1
),
1321 set
, pred
, phiblock
);
1324 if (newop1
!= oldop1
)
1327 newexpr
= (tree
) pool_alloc (unary_node_pool
);
1328 memcpy (newexpr
, expr
, tree_size (expr
));
1329 TREE_OPERAND (newexpr
, 0) = get_value_handle (newop1
);
1330 t
= fully_constant_expression (newexpr
);
1333 pool_free (unary_node_pool
, newexpr
);
1338 newexpr
->common
.ann
= NULL
;
1339 vn_lookup_or_add (newexpr
, NULL
);
1342 phi_trans_add (oldexpr
, newexpr
, pred
, NULL
);
1347 case tcc_exceptional
:
1351 gcc_assert (TREE_CODE (expr
) == SSA_NAME
);
1352 if (TREE_CODE (SSA_NAME_DEF_STMT (expr
)) == PHI_NODE
)
1353 phi
= SSA_NAME_DEF_STMT (expr
);
1357 e
= find_edge (pred
, bb_for_stmt (phi
));
1360 if (is_undefined_value (PHI_ARG_DEF (phi
, e
->dest_idx
)))
1362 vn_lookup_or_add (PHI_ARG_DEF (phi
, e
->dest_idx
), NULL
);
1363 return PHI_ARG_DEF (phi
, e
->dest_idx
);
1373 /* For each expression in SET, translate the value handles through phi nodes
1374 in PHIBLOCK using edge PHIBLOCK->PRED, and store the resulting
1375 expressions in DEST. */
1378 phi_translate_set (value_set_t dest
, value_set_t set
, basic_block pred
,
1379 basic_block phiblock
)
1381 value_set_node_t node
;
1382 for (node
= set
->head
;
1388 translated
= phi_translate (node
->expr
, set
, pred
, phiblock
);
1390 /* Don't add constants or empty translations to the cache, since
1391 we won't look them up that way, or use the result, anyway. */
1392 if (translated
&& !is_gimple_min_invariant (translated
))
1394 tree vh
= get_value_handle (translated
);
1395 VEC (tree
, gc
) *vuses
;
1397 /* The value handle itself may also be an invariant, in
1398 which case, it has no vuses. */
1399 vuses
= !is_gimple_min_invariant (vh
)
1400 ? VALUE_HANDLE_VUSES (vh
) : NULL
;
1401 phi_trans_add (node
->expr
, translated
, pred
, vuses
);
1404 if (translated
!= NULL
)
1405 value_insert_into_set (dest
, translated
);
1409 /* Find the leader for a value (i.e., the name representing that
1410 value) in a given set, and return it. Return NULL if no leader is
1414 bitmap_find_leader (bitmap_set_t set
, tree val
)
1419 if (is_gimple_min_invariant (val
))
1421 if (bitmap_set_contains_value (set
, val
))
1423 /* Rather than walk the entire bitmap of expressions, and see
1424 whether any of them has the value we are looking for, we look
1425 at the reverse mapping, which tells us the set of expressions
1426 that have a given value (IE value->expressions with that
1427 value) and see if any of those expressions are in our set.
1428 The number of expressions per value is usually significantly
1429 less than the number of expressions in the set. In fact, for
1430 large testcases, doing it this way is roughly 5-10x faster
1431 than walking the bitmap.
1432 If this is somehow a significant lose for some cases, we can
1433 choose which set to walk based on which set is smaller. */
1434 value_set_t exprset
;
1435 value_set_node_t node
;
1436 exprset
= VALUE_HANDLE_EXPR_SET (val
);
1437 for (node
= exprset
->head
; node
; node
= node
->next
)
1439 if (TREE_CODE (node
->expr
) == SSA_NAME
)
1441 if (bitmap_bit_p (set
->expressions
,
1442 SSA_NAME_VERSION (node
->expr
)))
1451 /* Find the leader for a value (i.e., the name representing that
1452 value) in a given set, and return it. Return NULL if no leader is
1456 find_leader (value_set_t set
, tree val
)
1458 value_set_node_t node
;
1463 /* Constants represent themselves. */
1464 if (is_gimple_min_invariant (val
))
1467 if (set
->length
== 0)
1470 if (value_exists_in_set_bitmap (set
, val
))
1472 for (node
= set
->head
;
1476 if (get_value_handle (node
->expr
) == val
)
1484 /* Given the vuse representative map, MAP, and an SSA version number,
1485 ID, return the bitmap of names ID represents, or NULL, if none
1489 get_representative (bitmap
*map
, int id
)
1491 if (map
[id
] != NULL
)
1496 /* A vuse is anticipable at the top of block x, from the bottom of the
1497 block, if it reaches the top of the block, and is not killed in the
1498 block. In effect, we are trying to see if the vuse is transparent
1499 backwards in the block. */
1502 vuses_dies_in_block_x (VEC (tree
, gc
) *vuses
, basic_block block
)
1507 for (i
= 0; VEC_iterate (tree
, vuses
, i
, vuse
); i
++)
1509 /* Any places where this is too conservative, are places
1510 where we created a new version and shouldn't have. */
1512 if (!bitmap_bit_p (RVUSE_IN (block
), SSA_NAME_VERSION (vuse
))
1513 || bitmap_bit_p (RVUSE_KILL (block
), SSA_NAME_VERSION (vuse
)))
1519 /* Determine if the expression EXPR is valid in SET. This means that
1520 we have a leader for each part of the expression (if it consists of
1521 values), or the expression is an SSA_NAME.
1523 NB: We never should run into a case where we have SSA_NAME +
1524 SSA_NAME or SSA_NAME + value. The sets valid_in_set is called on,
1525 the ANTIC sets, will only ever have SSA_NAME's or value expressions
1526 (IE VALUE1 + VALUE2, *VALUE1, VALUE1 < VALUE2) */
1529 valid_in_set (value_set_t set
, tree expr
, basic_block block
)
1531 tree vh
= get_value_handle (expr
);
1532 switch (TREE_CODE_CLASS (TREE_CODE (expr
)))
1535 case tcc_comparison
:
1537 tree op1
= TREE_OPERAND (expr
, 0);
1538 tree op2
= TREE_OPERAND (expr
, 1);
1539 return set_contains_value (set
, op1
) && set_contains_value (set
, op2
);
1544 tree op1
= TREE_OPERAND (expr
, 0);
1545 return set_contains_value (set
, op1
);
1548 case tcc_expression
:
1550 if (TREE_CODE (expr
) == CALL_EXPR
)
1552 tree op0
= TREE_OPERAND (expr
, 0);
1553 tree arglist
= TREE_OPERAND (expr
, 1);
1554 tree op2
= TREE_OPERAND (expr
, 2);
1556 /* Check the non-list operands first. */
1557 if (!set_contains_value (set
, op0
)
1558 || (op2
&& !set_contains_value (set
, op2
)))
1561 /* Now check the operands. */
1562 for (; arglist
; arglist
= TREE_CHAIN (arglist
))
1564 if (!set_contains_value (set
, TREE_VALUE (arglist
)))
1567 return !vuses_dies_in_block_x (VALUE_HANDLE_VUSES (vh
), block
);
1574 if (TREE_CODE (expr
) == INDIRECT_REF
1575 || TREE_CODE (expr
) == COMPONENT_REF
1576 || TREE_CODE (expr
) == ARRAY_REF
)
1578 tree op0
= TREE_OPERAND (expr
, 0);
1579 gcc_assert (is_gimple_min_invariant (op0
)
1580 || TREE_CODE (op0
) == VALUE_HANDLE
);
1581 if (!set_contains_value (set
, op0
))
1583 if (TREE_CODE (expr
) == ARRAY_REF
)
1585 tree op1
= TREE_OPERAND (expr
, 1);
1586 tree op2
= TREE_OPERAND (expr
, 2);
1587 tree op3
= TREE_OPERAND (expr
, 3);
1588 gcc_assert (is_gimple_min_invariant (op1
)
1589 || TREE_CODE (op1
) == VALUE_HANDLE
);
1590 if (!set_contains_value (set
, op1
))
1592 gcc_assert (!op2
|| is_gimple_min_invariant (op2
)
1593 || TREE_CODE (op2
) == VALUE_HANDLE
);
1595 && !set_contains_value (set
, op2
))
1597 gcc_assert (!op3
|| is_gimple_min_invariant (op3
)
1598 || TREE_CODE (op3
) == VALUE_HANDLE
);
1600 && !set_contains_value (set
, op3
))
1603 return set_contains_value (ANTIC_SAFE_LOADS (block
),
1605 || !vuses_dies_in_block_x (VALUE_HANDLE_VUSES (vh
),
1611 case tcc_exceptional
:
1612 gcc_assert (TREE_CODE (expr
) == SSA_NAME
);
1615 case tcc_declaration
:
1616 return !vuses_dies_in_block_x (VALUE_HANDLE_VUSES (vh
), block
);
1619 /* No other cases should be encountered. */
1624 /* Clean the set of expressions that are no longer valid in SET. This
1625 means expressions that are made up of values we have no leaders for
1629 clean (value_set_t set
, basic_block block
)
1631 value_set_node_t node
;
1632 value_set_node_t next
;
1637 if (!valid_in_set (set
, node
->expr
, block
))
1638 set_remove (set
, node
->expr
);
1643 static sbitmap has_abnormal_preds
;
1645 /* Compute the ANTIC set for BLOCK.
1647 If succs(BLOCK) > 1 then
1648 ANTIC_OUT[BLOCK] = intersection of ANTIC_IN[b] for all succ(BLOCK)
1649 else if succs(BLOCK) == 1 then
1650 ANTIC_OUT[BLOCK] = phi_translate (ANTIC_IN[succ(BLOCK)])
1652 ANTIC_IN[BLOCK] = clean(ANTIC_OUT[BLOCK] U EXP_GEN[BLOCK] - TMP_GEN[BLOCK])
1654 XXX: It would be nice to either write a set_clear, and use it for
1655 ANTIC_OUT, or to mark the antic_out set as deleted at the end
1656 of this routine, so that the pool can hand the same memory back out
1657 again for the next ANTIC_OUT. */
1660 compute_antic_aux (basic_block block
, bool block_has_abnormal_pred_edge
)
1663 bool changed
= false;
1664 value_set_t S
, old
, ANTIC_OUT
;
1665 value_set_node_t node
;
1667 ANTIC_OUT
= S
= NULL
;
1669 /* If any edges from predecessors are abnormal, antic_in is empty,
1671 if (block_has_abnormal_pred_edge
)
1672 goto maybe_dump_sets
;
1674 old
= set_new (false);
1675 set_copy (old
, ANTIC_IN (block
));
1676 ANTIC_OUT
= set_new (true);
1678 /* If the block has no successors, ANTIC_OUT is empty. */
1679 if (EDGE_COUNT (block
->succs
) == 0)
1681 /* If we have one successor, we could have some phi nodes to
1682 translate through. */
1683 else if (single_succ_p (block
))
1685 phi_translate_set (ANTIC_OUT
, ANTIC_IN (single_succ (block
)),
1686 block
, single_succ (block
));
1688 /* If we have multiple successors, we take the intersection of all of
1692 VEC(basic_block
, heap
) * worklist
;
1695 basic_block bprime
, first
;
1698 worklist
= VEC_alloc (basic_block
, heap
, EDGE_COUNT (block
->succs
));
1699 FOR_EACH_EDGE (e
, ei
, block
->succs
)
1700 VEC_quick_push (basic_block
, worklist
, e
->dest
);
1701 first
= VEC_index (basic_block
, worklist
, 0);
1702 set_copy (ANTIC_OUT
, ANTIC_IN (first
));
1704 for (i
= 1; VEC_iterate (basic_block
, worklist
, i
, bprime
); i
++)
1706 node
= ANTIC_OUT
->head
;
1710 value_set_node_t next
= node
->next
;
1712 val
= get_value_handle (node
->expr
);
1713 if (!set_contains_value (ANTIC_IN (bprime
), val
))
1714 set_remove (ANTIC_OUT
, node
->expr
);
1718 VEC_free (basic_block
, heap
, worklist
);
1721 /* Generate ANTIC_OUT - TMP_GEN. */
1722 S
= bitmap_set_subtract_from_value_set (ANTIC_OUT
, TMP_GEN (block
), false);
1724 /* Start ANTIC_IN with EXP_GEN - TMP_GEN */
1725 ANTIC_IN (block
) = bitmap_set_subtract_from_value_set (EXP_GEN (block
),
1729 /* Then union in the ANTIC_OUT - TMP_GEN values,
1730 to get ANTIC_OUT U EXP_GEN - TMP_GEN */
1731 for (node
= S
->head
; node
; node
= node
->next
)
1732 value_insert_into_set (ANTIC_IN (block
), node
->expr
);
1734 clean (ANTIC_IN (block
), block
);
1735 if (!set_equal (old
, ANTIC_IN (block
)))
1739 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
1742 print_value_set (dump_file
, ANTIC_OUT
, "ANTIC_OUT", block
->index
);
1744 if (ANTIC_SAFE_LOADS (block
))
1745 print_value_set (dump_file
, ANTIC_SAFE_LOADS (block
),
1746 "ANTIC_SAFE_LOADS", block
->index
);
1747 print_value_set (dump_file
, ANTIC_IN (block
), "ANTIC_IN", block
->index
);
1750 print_value_set (dump_file
, S
, "S", block
->index
);
1753 for (son
= first_dom_son (CDI_POST_DOMINATORS
, block
);
1755 son
= next_dom_son (CDI_POST_DOMINATORS
, son
))
1757 changed
|= compute_antic_aux (son
,
1758 TEST_BIT (has_abnormal_preds
, son
->index
));
1763 /* Compute ANTIC sets. */
1766 compute_antic (void)
1768 bool changed
= true;
1769 int num_iterations
= 0;
1772 /* If any predecessor edges are abnormal, we punt, so antic_in is empty.
1773 We pre-build the map of blocks with incoming abnormal edges here. */
1774 has_abnormal_preds
= sbitmap_alloc (last_basic_block
);
1775 sbitmap_zero (has_abnormal_preds
);
1781 FOR_EACH_EDGE (e
, ei
, block
->preds
)
1782 if (e
->flags
& EDGE_ABNORMAL
)
1784 SET_BIT (has_abnormal_preds
, block
->index
);
1788 /* While we are here, give empty ANTIC_IN sets to each block. */
1789 ANTIC_IN (block
) = set_new (true);
1791 /* At the exit block we anticipate nothing. */
1792 ANTIC_IN (EXIT_BLOCK_PTR
) = set_new (true);
1798 changed
= compute_antic_aux (EXIT_BLOCK_PTR
, false);
1801 sbitmap_free (has_abnormal_preds
);
1803 if (dump_file
&& (dump_flags
& TDF_STATS
))
1804 fprintf (dump_file
, "compute_antic required %d iterations\n", num_iterations
);
1807 /* Print the names represented by the bitmap NAMES, to the file OUT. */
1809 dump_bitmap_of_names (FILE *out
, bitmap names
)
1814 fprintf (out
, " { ");
1815 EXECUTE_IF_SET_IN_BITMAP (names
, 0, i
, bi
)
1817 print_generic_expr (out
, ssa_name (i
), 0);
1820 fprintf (out
, "}\n");
1823 /* Compute a set of representative vuse versions for each phi. This
1824 is so we can compute conservative kill sets in terms of all vuses
1825 that are killed, instead of continually walking chains.
1827 We also have to be able kill all names associated with a phi when
1828 the phi dies in order to ensure we don't generate overlapping
1829 live ranges, which are not allowed in virtual SSA. */
1831 static bitmap
*vuse_names
;
1833 compute_vuse_representatives (void)
1837 VEC (tree
, heap
) *phis
= NULL
;
1838 bool changed
= true;
1843 for (phi
= phi_nodes (bb
);
1845 phi
= PHI_CHAIN (phi
))
1846 if (!is_gimple_reg (PHI_RESULT (phi
)))
1847 VEC_safe_push (tree
, heap
, phis
, phi
);
1854 for (i
= 0; VEC_iterate (tree
, phis
, i
, phi
); i
++)
1856 size_t ver
= SSA_NAME_VERSION (PHI_RESULT (phi
));
1860 if (vuse_names
[ver
] == NULL
)
1862 vuse_names
[ver
] = BITMAP_ALLOC (&grand_bitmap_obstack
);
1863 bitmap_set_bit (vuse_names
[ver
], ver
);
1865 FOR_EACH_PHI_ARG (usep
, phi
, iter
, SSA_OP_ALL_USES
)
1867 tree use
= USE_FROM_PTR (usep
);
1868 bitmap usebitmap
= get_representative (vuse_names
,
1869 SSA_NAME_VERSION (use
));
1870 if (usebitmap
!= NULL
)
1872 changed
|= bitmap_ior_into (vuse_names
[ver
],
1877 changed
|= !bitmap_bit_p (vuse_names
[ver
],
1878 SSA_NAME_VERSION (use
));
1880 bitmap_set_bit (vuse_names
[ver
],
1881 SSA_NAME_VERSION (use
));
1887 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
1888 for (i
= 0; VEC_iterate (tree
, phis
, i
, phi
); i
++)
1890 bitmap reps
= get_representative (vuse_names
,
1891 SSA_NAME_VERSION (PHI_RESULT (phi
)));
1894 print_generic_expr (dump_file
, PHI_RESULT (phi
), 0);
1895 fprintf (dump_file
, " represents ");
1896 dump_bitmap_of_names (dump_file
, reps
);
1899 VEC_free (tree
, heap
, phis
);
1902 /* Compute reaching vuses and antic safe loads. RVUSE computation is
1903 is a small bit of iterative dataflow to determine what virtual uses
1904 reach what blocks. Because we can't generate overlapping virtual
1905 uses, and virtual uses *do* actually die, this ends up being faster
1906 in most cases than continually walking the virtual use/def chains
1907 to determine whether we are inside a block where a given virtual is
1908 still available to be used.
1910 ANTIC_SAFE_LOADS are those loads that actually occur before any kill to
1911 their vuses in the block,and thus, are safe at the top of the
1921 b = *a is an antic safe load because it still safe to consider it
1922 ANTIC at the top of the block.
1924 We currently compute a conservative approximation to
1925 ANTIC_SAFE_LOADS. We compute those loads that occur before *any*
1926 stores in the block. This is not because it is difficult to
1927 compute the precise answer, but because it is expensive. More
1928 testing is necessary to determine whether it is worth computing the
1932 compute_rvuse_and_antic_safe (void)
1939 bool changed
= true;
1940 unsigned int *first_store_uid
;
1942 first_store_uid
= xcalloc (n_basic_blocks
, sizeof (unsigned int));
1944 compute_vuse_representatives ();
1948 RVUSE_IN (bb
) = BITMAP_ALLOC (&grand_bitmap_obstack
);
1949 RVUSE_GEN (bb
) = BITMAP_ALLOC (&grand_bitmap_obstack
);
1950 RVUSE_KILL (bb
) = BITMAP_ALLOC (&grand_bitmap_obstack
);
1951 RVUSE_OUT (bb
) = BITMAP_ALLOC (&grand_bitmap_obstack
);
1952 ANTIC_SAFE_LOADS (bb
) = NULL
;
1955 /* Mark live on entry */
1956 for (i
= 0; i
< num_ssa_names
; i
++)
1958 tree name
= ssa_name (i
);
1959 if (name
&& !is_gimple_reg (name
)
1960 && IS_EMPTY_STMT (SSA_NAME_DEF_STMT (name
)))
1961 bitmap_set_bit (RVUSE_OUT (ENTRY_BLOCK_PTR
),
1962 SSA_NAME_VERSION (name
));
1965 /* Compute local sets for reaching vuses.
1966 GEN(block) = generated in block and not locally killed.
1967 KILL(block) = set of vuses killed in block.
1972 block_stmt_iterator bsi
;
1977 for (bsi
= bsi_start (bb
); !bsi_end_p (bsi
); bsi_next (&bsi
))
1979 tree stmt
= bsi_stmt (bsi
);
1981 if (first_store_uid
[bb
->index
] == 0
1982 && !ZERO_SSA_OPERANDS (stmt
, SSA_OP_VMAYUSE
| SSA_OP_VMAYDEF
1983 | SSA_OP_VMUSTDEF
| SSA_OP_VMUSTKILL
))
1985 first_store_uid
[bb
->index
] = stmt_ann (stmt
)->uid
;
1989 FOR_EACH_SSA_USE_OPERAND (usep
, stmt
, iter
, SSA_OP_VIRTUAL_KILLS
1992 tree use
= USE_FROM_PTR (usep
);
1993 bitmap repbit
= get_representative (vuse_names
,
1994 SSA_NAME_VERSION (use
));
1997 bitmap_and_compl_into (RVUSE_GEN (bb
), repbit
);
1998 bitmap_ior_into (RVUSE_KILL (bb
), repbit
);
2002 bitmap_set_bit (RVUSE_KILL (bb
), SSA_NAME_VERSION (use
));
2003 bitmap_clear_bit (RVUSE_GEN (bb
), SSA_NAME_VERSION (use
));
2006 FOR_EACH_SSA_DEF_OPERAND (defp
, stmt
, iter
, SSA_OP_VIRTUAL_DEFS
)
2008 tree def
= DEF_FROM_PTR (defp
);
2009 bitmap_set_bit (RVUSE_GEN (bb
), SSA_NAME_VERSION (def
));
2016 for (phi
= phi_nodes (bb
); phi
; phi
= PHI_CHAIN (phi
))
2018 if (!is_gimple_reg (PHI_RESULT (phi
)))
2023 tree def
= PHI_RESULT (phi
);
2024 /* In reality, the PHI result is generated at the end of
2025 each predecessor block. This will make the value
2026 LVUSE_IN for the bb containing the PHI, which is
2028 FOR_EACH_EDGE (e
, ei
, bb
->preds
)
2029 bitmap_set_bit (RVUSE_GEN (e
->src
), SSA_NAME_VERSION (def
));
2034 /* Solve reaching vuses.
2036 RVUSE_IN[BB] = Union of RVUSE_OUT of predecessors.
2037 RVUSE_OUT[BB] = RVUSE_GEN[BB] U (RVUSE_IN[BB] - RVUSE_KILL[BB])
2039 postorder
= XNEWVEC (int, n_basic_blocks
- NUM_FIXED_BLOCKS
);
2040 pre_and_rev_post_order_compute (NULL
, postorder
, false);
2047 for (j
= 0; j
< n_basic_blocks
- NUM_FIXED_BLOCKS
; j
++)
2051 bb
= BASIC_BLOCK (postorder
[j
]);
2053 FOR_EACH_EDGE (e
, ei
, bb
->preds
)
2054 bitmap_ior_into (RVUSE_IN (bb
), RVUSE_OUT (e
->src
));
2056 changed
|= bitmap_ior_and_compl (RVUSE_OUT (bb
),
2064 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2068 fprintf (dump_file
, "RVUSE_IN (%d) =", bb
->index
);
2069 dump_bitmap_of_names (dump_file
, RVUSE_IN (bb
));
2071 fprintf (dump_file
, "RVUSE_KILL (%d) =", bb
->index
);
2072 dump_bitmap_of_names (dump_file
, RVUSE_KILL (bb
));
2074 fprintf (dump_file
, "RVUSE_GEN (%d) =", bb
->index
);
2075 dump_bitmap_of_names (dump_file
, RVUSE_GEN (bb
));
2077 fprintf (dump_file
, "RVUSE_OUT (%d) =", bb
->index
);
2078 dump_bitmap_of_names (dump_file
, RVUSE_OUT (bb
));
2084 value_set_node_t node
;
2085 if (bitmap_empty_p (RVUSE_KILL (bb
)))
2088 for (node
= EXP_GEN (bb
)->head
; node
; node
= node
->next
)
2090 if (REFERENCE_CLASS_P (node
->expr
))
2092 tree vh
= get_value_handle (node
->expr
);
2093 tree maybe
= bitmap_find_leader (AVAIL_OUT (bb
), vh
);
2097 tree def
= SSA_NAME_DEF_STMT (maybe
);
2099 if (bb_for_stmt (def
) != bb
)
2102 if (TREE_CODE (def
) == PHI_NODE
2103 || stmt_ann (def
)->uid
< first_store_uid
[bb
->index
])
2105 if (ANTIC_SAFE_LOADS (bb
) == NULL
)
2106 ANTIC_SAFE_LOADS (bb
) = set_new (true);
2107 value_insert_into_set (ANTIC_SAFE_LOADS (bb
),
2114 free (first_store_uid
);
2117 /* Return true if we can value number the call in STMT. This is true
2118 if we have a pure or constant call. */
2121 can_value_number_call (tree stmt
)
2123 tree call
= get_call_expr_in (stmt
);
2125 if (call_expr_flags (call
) & (ECF_PURE
| ECF_CONST
))
2130 /* Return true if OP is a tree which we can perform value numbering
2134 can_value_number_operation (tree op
)
2136 return UNARY_CLASS_P (op
)
2137 || BINARY_CLASS_P (op
)
2138 || COMPARISON_CLASS_P (op
)
2139 || REFERENCE_CLASS_P (op
)
2140 || (TREE_CODE (op
) == CALL_EXPR
2141 && can_value_number_call (op
));
2145 /* Return true if OP is a tree which we can perform PRE on
2146 on. This may not match the operations we can value number, but in
2147 a perfect world would. */
2150 can_PRE_operation (tree op
)
2152 return UNARY_CLASS_P (op
)
2153 || BINARY_CLASS_P (op
)
2154 || COMPARISON_CLASS_P (op
)
2155 || TREE_CODE (op
) == INDIRECT_REF
2156 || TREE_CODE (op
) == COMPONENT_REF
2157 || TREE_CODE (op
) == CALL_EXPR
2158 || TREE_CODE (op
) == ARRAY_REF
;
2162 /* Inserted expressions are placed onto this worklist, which is used
2163 for performing quick dead code elimination of insertions we made
2164 that didn't turn out to be necessary. */
2165 static VEC(tree
,heap
) *inserted_exprs
;
2167 /* Pool allocated fake store expressions are placed onto this
2168 worklist, which, after performing dead code elimination, is walked
2169 to see which expressions need to be put into GC'able memory */
2170 static VEC(tree
, heap
) *need_creation
;
2172 /* For COMPONENT_REF's and ARRAY_REF's, we can't have any intermediates for the
2173 COMPONENT_REF or INDIRECT_REF or ARRAY_REF portion, because we'd end up with
2174 trying to rename aggregates into ssa form directly, which is a no
2177 Thus, this routine doesn't create temporaries, it just builds a
2178 single access expression for the array, calling
2179 find_or_generate_expression to build the innermost pieces.
2181 This function is a subroutine of create_expression_by_pieces, and
2182 should not be called on it's own unless you really know what you
2186 create_component_ref_by_pieces (basic_block block
, tree expr
, tree stmts
)
2191 if (TREE_CODE (genop
) == VALUE_HANDLE
)
2193 tree found
= bitmap_find_leader (AVAIL_OUT (block
), expr
);
2198 if (TREE_CODE (genop
) == VALUE_HANDLE
)
2199 genop
= VALUE_HANDLE_EXPR_SET (expr
)->head
->expr
;
2201 switch TREE_CODE (genop
)
2207 op0
= create_component_ref_by_pieces (block
,
2208 TREE_OPERAND (genop
, 0),
2210 op1
= TREE_OPERAND (genop
, 1);
2211 if (TREE_CODE (op1
) == VALUE_HANDLE
)
2212 op1
= find_or_generate_expression (block
, op1
, stmts
);
2213 op2
= TREE_OPERAND (genop
, 2);
2214 if (op2
&& TREE_CODE (op2
) == VALUE_HANDLE
)
2215 op2
= find_or_generate_expression (block
, op2
, stmts
);
2216 op3
= TREE_OPERAND (genop
, 3);
2217 if (op3
&& TREE_CODE (op3
) == VALUE_HANDLE
)
2218 op3
= find_or_generate_expression (block
, op3
, stmts
);
2219 folded
= build4 (ARRAY_REF
, TREE_TYPE (genop
), op0
, op1
,
2227 op0
= create_component_ref_by_pieces (block
,
2228 TREE_OPERAND (genop
, 0),
2230 op1
= VALUE_HANDLE_EXPR_SET (TREE_OPERAND (genop
, 1))->head
->expr
;
2231 folded
= fold_build3 (COMPONENT_REF
, TREE_TYPE (genop
), op0
, op1
,
2238 tree op1
= TREE_OPERAND (genop
, 0);
2239 tree genop1
= find_or_generate_expression (block
, op1
, stmts
);
2241 folded
= fold_build1 (TREE_CODE (genop
), TREE_TYPE (genop
),
2259 /* Find a leader for an expression, or generate one using
2260 create_expression_by_pieces if it's ANTIC but
2262 BLOCK is the basic_block we are looking for leaders in.
2263 EXPR is the expression to find a leader or generate for.
2264 STMTS is the statement list to put the inserted expressions on.
2265 Returns the SSA_NAME of the LHS of the generated expression or the
2269 find_or_generate_expression (basic_block block
, tree expr
, tree stmts
)
2271 tree genop
= bitmap_find_leader (AVAIL_OUT (block
), expr
);
2273 /* If it's still NULL, it must be a complex expression, so generate
2277 genop
= VALUE_HANDLE_EXPR_SET (expr
)->head
->expr
;
2279 gcc_assert (can_PRE_operation (genop
));
2280 genop
= create_expression_by_pieces (block
, genop
, stmts
);
2285 #define NECESSARY(stmt) stmt->common.asm_written_flag
2286 /* Create an expression in pieces, so that we can handle very complex
2287 expressions that may be ANTIC, but not necessary GIMPLE.
2288 BLOCK is the basic block the expression will be inserted into,
2289 EXPR is the expression to insert (in value form)
2290 STMTS is a statement list to append the necessary insertions into.
2292 This function will die if we hit some value that shouldn't be
2293 ANTIC but is (IE there is no leader for it, or its components).
2294 This function may also generate expressions that are themselves
2295 partially or fully redundant. Those that are will be either made
2296 fully redundant during the next iteration of insert (for partially
2297 redundant ones), or eliminated by eliminate (for fully redundant
2301 create_expression_by_pieces (basic_block block
, tree expr
, tree stmts
)
2304 tree folded
, forced_stmts
, newexpr
;
2306 tree_stmt_iterator tsi
;
2308 switch (TREE_CODE_CLASS (TREE_CODE (expr
)))
2310 case tcc_expression
:
2314 tree genop0
, genop2
;
2316 tree walker
, genwalker
;
2318 gcc_assert (TREE_CODE (expr
) == CALL_EXPR
);
2321 op0
= TREE_OPERAND (expr
, 0);
2322 arglist
= TREE_OPERAND (expr
, 1);
2323 op2
= TREE_OPERAND (expr
, 2);
2325 genop0
= find_or_generate_expression (block
, op0
, stmts
);
2326 genarglist
= copy_list (arglist
);
2327 for (walker
= arglist
, genwalker
= genarglist
;
2328 genwalker
&& walker
;
2329 genwalker
= TREE_CHAIN (genwalker
), walker
= TREE_CHAIN (walker
))
2331 TREE_VALUE (genwalker
)
2332 = find_or_generate_expression (block
, TREE_VALUE (walker
),
2337 genop2
= find_or_generate_expression (block
, op2
, stmts
);
2338 folded
= fold_build3 (TREE_CODE (expr
), TREE_TYPE (expr
),
2339 genop0
, genarglist
, genop2
);
2347 if (TREE_CODE (expr
) == COMPONENT_REF
2348 || TREE_CODE (expr
) == ARRAY_REF
)
2350 folded
= create_component_ref_by_pieces (block
, expr
, stmts
);
2354 tree op1
= TREE_OPERAND (expr
, 0);
2355 tree genop1
= find_or_generate_expression (block
, op1
, stmts
);
2357 folded
= fold_build1 (TREE_CODE (expr
), TREE_TYPE (expr
),
2364 case tcc_comparison
:
2366 tree op1
= TREE_OPERAND (expr
, 0);
2367 tree op2
= TREE_OPERAND (expr
, 1);
2368 tree genop1
= find_or_generate_expression (block
, op1
, stmts
);
2369 tree genop2
= find_or_generate_expression (block
, op2
, stmts
);
2370 folded
= fold_build2 (TREE_CODE (expr
), TREE_TYPE (expr
),
2377 tree op1
= TREE_OPERAND (expr
, 0);
2378 tree genop1
= find_or_generate_expression (block
, op1
, stmts
);
2379 folded
= fold_build1 (TREE_CODE (expr
), TREE_TYPE (expr
),
2388 /* Force the generated expression to be a sequence of GIMPLE
2390 We have to call unshare_expr because force_gimple_operand may
2391 modify the tree we pass to it. */
2392 newexpr
= force_gimple_operand (unshare_expr (folded
), &forced_stmts
,
2395 /* If we have any intermediate expressions to the value sets, add them
2396 to the value sets and chain them on in the instruction stream. */
2399 tsi
= tsi_start (forced_stmts
);
2400 for (; !tsi_end_p (tsi
); tsi_next (&tsi
))
2402 tree stmt
= tsi_stmt (tsi
);
2403 tree forcedname
= TREE_OPERAND (stmt
, 0);
2404 tree forcedexpr
= TREE_OPERAND (stmt
, 1);
2405 tree val
= vn_lookup_or_add (forcedexpr
, NULL
);
2407 VEC_safe_push (tree
, heap
, inserted_exprs
, stmt
);
2408 vn_add (forcedname
, val
);
2409 bitmap_value_replace_in_set (NEW_SETS (block
), forcedname
);
2410 bitmap_value_replace_in_set (AVAIL_OUT (block
), forcedname
);
2411 mark_new_vars_to_rename (stmt
);
2413 tsi
= tsi_last (stmts
);
2414 tsi_link_after (&tsi
, forced_stmts
, TSI_CONTINUE_LINKING
);
2417 /* Build and insert the assignment of the end result to the temporary
2418 that we will return. */
2419 if (!pretemp
|| TREE_TYPE (expr
) != TREE_TYPE (pretemp
))
2421 pretemp
= create_tmp_var (TREE_TYPE (expr
), "pretmp");
2422 get_var_ann (pretemp
);
2426 add_referenced_var (temp
);
2428 if (TREE_CODE (TREE_TYPE (expr
)) == COMPLEX_TYPE
)
2429 DECL_COMPLEX_GIMPLE_REG_P (temp
) = 1;
2431 newexpr
= build2 (MODIFY_EXPR
, TREE_TYPE (expr
), temp
, newexpr
);
2432 name
= make_ssa_name (temp
, newexpr
);
2433 TREE_OPERAND (newexpr
, 0) = name
;
2434 NECESSARY (newexpr
) = 0;
2436 tsi
= tsi_last (stmts
);
2437 tsi_link_after (&tsi
, newexpr
, TSI_CONTINUE_LINKING
);
2438 VEC_safe_push (tree
, heap
, inserted_exprs
, newexpr
);
2439 mark_new_vars_to_rename (newexpr
);
2441 /* Add a value handle to the temporary.
2442 The value may already exist in either NEW_SETS, or AVAIL_OUT, because
2443 we are creating the expression by pieces, and this particular piece of
2444 the expression may have been represented. There is no harm in replacing
2446 v
= get_value_handle (expr
);
2448 bitmap_value_replace_in_set (NEW_SETS (block
), name
);
2449 bitmap_value_replace_in_set (AVAIL_OUT (block
), name
);
2451 pre_stats
.insertions
++;
2452 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2454 fprintf (dump_file
, "Inserted ");
2455 print_generic_expr (dump_file
, newexpr
, 0);
2456 fprintf (dump_file
, " in predecessor %d\n", block
->index
);
2462 /* Insert the to-be-made-available values of NODE for each
2463 predecessor, stored in AVAIL, into the predecessors of BLOCK, and
2464 merge the result with a phi node, given the same value handle as
2465 NODE. Return true if we have inserted new stuff. */
2468 insert_into_preds_of_block (basic_block block
, value_set_node_t node
,
2471 tree val
= get_value_handle (node
->expr
);
2473 bool insertions
= false;
2478 tree type
= TREE_TYPE (avail
[EDGE_PRED (block
, 0)->src
->index
]);
2481 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2483 fprintf (dump_file
, "Found partial redundancy for expression ");
2484 print_generic_expr (dump_file
, node
->expr
, 0);
2485 fprintf (dump_file
, " (");
2486 print_generic_expr (dump_file
, val
, 0);
2487 fprintf (dump_file
, ")");
2488 fprintf (dump_file
, "\n");
2491 /* Make sure we aren't creating an induction variable. */
2492 if (block
->loop_depth
> 0 && EDGE_COUNT (block
->preds
) == 2
2493 && TREE_CODE_CLASS (TREE_CODE (node
->expr
)) != tcc_reference
)
2495 bool firstinsideloop
= false;
2496 bool secondinsideloop
= false;
2497 firstinsideloop
= flow_bb_inside_loop_p (block
->loop_father
,
2498 EDGE_PRED (block
, 0)->src
);
2499 secondinsideloop
= flow_bb_inside_loop_p (block
->loop_father
,
2500 EDGE_PRED (block
, 1)->src
);
2501 /* Induction variables only have one edge inside the loop. */
2502 if (firstinsideloop
^ secondinsideloop
)
2504 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2505 fprintf (dump_file
, "Skipping insertion of phi for partial redundancy: Looks like an induction variable\n");
2511 /* Make the necessary insertions. */
2512 FOR_EACH_EDGE (pred
, ei
, block
->preds
)
2514 tree stmts
= alloc_stmt_list ();
2517 eprime
= avail
[bprime
->index
];
2519 if (can_PRE_operation (eprime
))
2521 #ifdef ENABLE_CHECKING
2524 /* eprime may be an invariant. */
2525 vh
= TREE_CODE (eprime
) == VALUE_HANDLE
2527 : get_value_handle (eprime
);
2529 /* ensure that the virtual uses we need reach our block. */
2530 if (TREE_CODE (vh
) == VALUE_HANDLE
)
2535 VEC_iterate (tree
, VALUE_HANDLE_VUSES (vh
), i
, vuse
);
2538 size_t id
= SSA_NAME_VERSION (vuse
);
2539 gcc_assert (bitmap_bit_p (RVUSE_OUT (bprime
), id
)
2540 || IS_EMPTY_STMT (SSA_NAME_DEF_STMT (vuse
)));
2544 builtexpr
= create_expression_by_pieces (bprime
,
2547 bsi_insert_on_edge (pred
, stmts
);
2548 avail
[bprime
->index
] = builtexpr
;
2552 /* If we didn't want a phi node, and we made insertions, we still have
2553 inserted new stuff, and thus return true. If we didn't want a phi node,
2554 and didn't make insertions, we haven't added anything new, so return
2556 if (nophi
&& insertions
)
2558 else if (nophi
&& !insertions
)
2561 /* Now build a phi for the new variable. */
2562 if (!prephitemp
|| TREE_TYPE (prephitemp
) != type
)
2564 prephitemp
= create_tmp_var (type
, "prephitmp");
2565 get_var_ann (prephitemp
);
2569 add_referenced_var (temp
);
2571 if (TREE_CODE (type
) == COMPLEX_TYPE
)
2572 DECL_COMPLEX_GIMPLE_REG_P (temp
) = 1;
2573 temp
= create_phi_node (temp
, block
);
2575 NECESSARY (temp
) = 0;
2576 VEC_safe_push (tree
, heap
, inserted_exprs
, temp
);
2577 FOR_EACH_EDGE (pred
, ei
, block
->preds
)
2578 add_phi_arg (temp
, avail
[pred
->src
->index
], pred
);
2580 vn_add (PHI_RESULT (temp
), val
);
2582 /* The value should *not* exist in PHI_GEN, or else we wouldn't be doing
2583 this insertion, since we test for the existence of this value in PHI_GEN
2584 before proceeding with the partial redundancy checks in insert_aux.
2586 The value may exist in AVAIL_OUT, in particular, it could be represented
2587 by the expression we are trying to eliminate, in which case we want the
2588 replacement to occur. If it's not existing in AVAIL_OUT, we want it
2591 Similarly, to the PHI_GEN case, the value should not exist in NEW_SETS of
2592 this block, because if it did, it would have existed in our dominator's
2593 AVAIL_OUT, and would have been skipped due to the full redundancy check.
2596 bitmap_insert_into_set (PHI_GEN (block
),
2598 bitmap_value_replace_in_set (AVAIL_OUT (block
),
2600 bitmap_insert_into_set (NEW_SETS (block
),
2603 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2605 fprintf (dump_file
, "Created phi ");
2606 print_generic_expr (dump_file
, temp
, 0);
2607 fprintf (dump_file
, " in block %d\n", block
->index
);
2615 /* Perform insertion of partially redundant values.
2616 For BLOCK, do the following:
2617 1. Propagate the NEW_SETS of the dominator into the current block.
2618 If the block has multiple predecessors,
2619 2a. Iterate over the ANTIC expressions for the block to see if
2620 any of them are partially redundant.
2621 2b. If so, insert them into the necessary predecessors to make
2622 the expression fully redundant.
2623 2c. Insert a new PHI merging the values of the predecessors.
2624 2d. Insert the new PHI, and the new expressions, into the
2626 3. Recursively call ourselves on the dominator children of BLOCK.
2631 insert_aux (basic_block block
)
2634 bool new_stuff
= false;
2639 dom
= get_immediate_dominator (CDI_DOMINATORS
, block
);
2644 bitmap_set_t newset
= NEW_SETS (dom
);
2647 /* Note that we need to value_replace both NEW_SETS, and
2648 AVAIL_OUT. For both the case of NEW_SETS, the value may be
2649 represented by some non-simple expression here that we want
2650 to replace it with. */
2651 EXECUTE_IF_SET_IN_BITMAP (newset
->expressions
, 0, i
, bi
)
2653 bitmap_value_replace_in_set (NEW_SETS (block
), ssa_name (i
));
2654 bitmap_value_replace_in_set (AVAIL_OUT (block
), ssa_name (i
));
2657 if (!single_pred_p (block
))
2659 value_set_node_t node
;
2660 for (node
= ANTIC_IN (block
)->head
;
2664 if (can_PRE_operation (node
->expr
)
2665 && !AGGREGATE_TYPE_P (TREE_TYPE (node
->expr
)))
2669 bool by_some
= false;
2670 bool cant_insert
= false;
2671 bool all_same
= true;
2672 tree first_s
= NULL
;
2675 tree eprime
= NULL_TREE
;
2678 val
= get_value_handle (node
->expr
);
2679 if (bitmap_set_contains_value (PHI_GEN (block
), val
))
2681 if (bitmap_set_contains_value (AVAIL_OUT (dom
), val
))
2683 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
2684 fprintf (dump_file
, "Found fully redundant value\n");
2688 avail
= XCNEWVEC (tree
, last_basic_block
);
2689 FOR_EACH_EDGE (pred
, ei
, block
->preds
)
2694 /* This can happen in the very weird case
2695 that our fake infinite loop edges have caused a
2696 critical edge to appear. */
2697 if (EDGE_CRITICAL_P (pred
))
2703 eprime
= phi_translate (node
->expr
,
2707 /* eprime will generally only be NULL if the
2708 value of the expression, translated
2709 through the PHI for this predecessor, is
2710 undefined. If that is the case, we can't
2711 make the expression fully redundant,
2712 because its value is undefined along a
2713 predecessor path. We can thus break out
2714 early because it doesn't matter what the
2715 rest of the results are. */
2722 eprime
= fully_constant_expression (eprime
);
2723 vprime
= get_value_handle (eprime
);
2724 gcc_assert (vprime
);
2725 edoubleprime
= bitmap_find_leader (AVAIL_OUT (bprime
),
2727 if (edoubleprime
== NULL
)
2729 avail
[bprime
->index
] = eprime
;
2734 avail
[bprime
->index
] = edoubleprime
;
2736 if (first_s
== NULL
)
2737 first_s
= edoubleprime
;
2738 else if (!operand_equal_p (first_s
, edoubleprime
,
2743 /* If we can insert it, it's not the same value
2744 already existing along every predecessor, and
2745 it's defined by some predecessor, it is
2746 partially redundant. */
2747 if (!cant_insert
&& !all_same
&& by_some
)
2749 if (insert_into_preds_of_block (block
, node
, avail
))
2752 /* If all edges produce the same value and that value is
2753 an invariant, then the PHI has the same value on all
2754 edges. Note this. */
2755 else if (!cant_insert
&& all_same
&& eprime
2756 && is_gimple_min_invariant (eprime
)
2757 && !is_gimple_min_invariant (val
))
2759 value_set_t exprset
= VALUE_HANDLE_EXPR_SET (val
);
2760 value_set_node_t node
;
2762 for (node
= exprset
->head
; node
; node
= node
->next
)
2764 if (TREE_CODE (node
->expr
) == SSA_NAME
)
2766 vn_add (node
->expr
, eprime
);
2767 pre_stats
.constified
++;
2777 for (son
= first_dom_son (CDI_DOMINATORS
, block
);
2779 son
= next_dom_son (CDI_DOMINATORS
, son
))
2781 new_stuff
|= insert_aux (son
);
2787 /* Perform insertion of partially redundant values. */
2792 bool new_stuff
= true;
2794 int num_iterations
= 0;
2797 NEW_SETS (bb
) = bitmap_set_new ();
2803 new_stuff
= insert_aux (ENTRY_BLOCK_PTR
);
2805 if (num_iterations
> 2 && dump_file
&& (dump_flags
& TDF_STATS
))
2806 fprintf (dump_file
, "insert required %d iterations\n", num_iterations
);
2810 /* Return true if VAR is an SSA variable with no defining statement in
2811 this procedure, *AND* isn't a live-on-entry parameter. */
2814 is_undefined_value (tree expr
)
2816 return (TREE_CODE (expr
) == SSA_NAME
2817 && IS_EMPTY_STMT (SSA_NAME_DEF_STMT (expr
))
2818 /* PARM_DECLs and hard registers are always defined. */
2819 && TREE_CODE (SSA_NAME_VAR (expr
)) != PARM_DECL
);
2823 /* Given an SSA variable VAR and an expression EXPR, compute the value
2824 number for EXPR and create a value handle (VAL) for it. If VAR and
2825 EXPR are not the same, associate VAL with VAR. Finally, add VAR to
2826 S1 and its value handle to S2.
2828 VUSES represent the virtual use operands associated with EXPR (if
2832 add_to_sets (tree var
, tree expr
, tree stmt
, bitmap_set_t s1
,
2835 tree val
= vn_lookup_or_add (expr
, stmt
);
2837 /* VAR and EXPR may be the same when processing statements for which
2838 we are not computing value numbers (e.g., non-assignments, or
2839 statements that make aliased stores). In those cases, we are
2840 only interested in making VAR available as its own value. */
2845 bitmap_insert_into_set (s1
, var
);
2846 bitmap_value_insert_into_set (s2
, var
);
2850 /* Given a unary or binary expression EXPR, create and return a new
2851 expression with the same structure as EXPR but with its operands
2852 replaced with the value handles of each of the operands of EXPR.
2854 VUSES represent the virtual use operands associated with EXPR (if
2855 any). Insert EXPR's operands into the EXP_GEN set for BLOCK. */
2858 create_value_expr_from (tree expr
, basic_block block
, tree stmt
)
2861 enum tree_code code
= TREE_CODE (expr
);
2865 gcc_assert (TREE_CODE_CLASS (code
) == tcc_unary
2866 || TREE_CODE_CLASS (code
) == tcc_binary
2867 || TREE_CODE_CLASS (code
) == tcc_comparison
2868 || TREE_CODE_CLASS (code
) == tcc_reference
2869 || TREE_CODE_CLASS (code
) == tcc_expression
2870 || TREE_CODE_CLASS (code
) == tcc_exceptional
2871 || TREE_CODE_CLASS (code
) == tcc_declaration
);
2873 if (TREE_CODE_CLASS (code
) == tcc_unary
)
2874 pool
= unary_node_pool
;
2875 else if (TREE_CODE_CLASS (code
) == tcc_reference
)
2876 pool
= reference_node_pool
;
2877 else if (TREE_CODE_CLASS (code
) == tcc_binary
)
2878 pool
= binary_node_pool
;
2879 else if (TREE_CODE_CLASS (code
) == tcc_comparison
)
2880 pool
= comparison_node_pool
;
2881 else if (TREE_CODE_CLASS (code
) == tcc_exceptional
)
2883 gcc_assert (code
== TREE_LIST
);
2884 pool
= list_node_pool
;
2888 gcc_assert (code
== CALL_EXPR
);
2889 pool
= expression_node_pool
;
2892 vexpr
= (tree
) pool_alloc (pool
);
2893 memcpy (vexpr
, expr
, tree_size (expr
));
2895 /* This case is only for TREE_LIST's that appear as part of
2896 CALL_EXPR's. Anything else is a bug, but we can't easily verify
2897 this, hence this comment. TREE_LIST is not handled by the
2898 general case below is because they don't have a fixed length, or
2899 operands, so you can't access purpose/value/chain through
2900 TREE_OPERAND macros. */
2902 if (code
== TREE_LIST
)
2904 tree op
= NULL_TREE
;
2905 tree temp
= NULL_TREE
;
2906 if (TREE_CHAIN (vexpr
))
2907 temp
= create_value_expr_from (TREE_CHAIN (vexpr
), block
, stmt
);
2908 TREE_CHAIN (vexpr
) = temp
? temp
: TREE_CHAIN (vexpr
);
2911 /* Recursively value-numberize reference ops. */
2912 if (REFERENCE_CLASS_P (TREE_VALUE (vexpr
)))
2915 op
= TREE_VALUE (vexpr
);
2916 tempop
= create_value_expr_from (op
, block
, stmt
);
2917 op
= tempop
? tempop
: op
;
2919 TREE_VALUE (vexpr
) = vn_lookup_or_add (op
, stmt
);
2923 op
= TREE_VALUE (vexpr
);
2924 TREE_VALUE (vexpr
) = vn_lookup_or_add (TREE_VALUE (vexpr
), NULL
);
2926 /* This is the equivalent of inserting op into EXP_GEN like we
2928 if (!is_undefined_value (op
))
2929 value_insert_into_set (EXP_GEN (block
), op
);
2934 for (i
= 0; i
< TREE_CODE_LENGTH (code
); i
++)
2938 op
= TREE_OPERAND (expr
, i
);
2939 if (op
== NULL_TREE
)
2942 /* Recursively value-numberize reference ops and tree lists. */
2943 if (REFERENCE_CLASS_P (op
))
2945 tree tempop
= create_value_expr_from (op
, block
, stmt
);
2946 op
= tempop
? tempop
: op
;
2947 val
= vn_lookup_or_add (op
, stmt
);
2949 else if (TREE_CODE (op
) == TREE_LIST
)
2953 gcc_assert (TREE_CODE (expr
) == CALL_EXPR
);
2954 tempop
= create_value_expr_from (op
, block
, stmt
);
2956 op
= tempop
? tempop
: op
;
2957 vn_lookup_or_add (op
, NULL
);
2958 /* Unlike everywhere else, we do *not* want to replace the
2959 TREE_LIST itself with a value number, because support
2960 functions we call will blow up. */
2964 /* Create a value handle for OP and add it to VEXPR. */
2965 val
= vn_lookup_or_add (op
, NULL
);
2967 if (!is_undefined_value (op
) && TREE_CODE (op
) != TREE_LIST
)
2968 value_insert_into_set (EXP_GEN (block
), op
);
2970 if (TREE_CODE (val
) == VALUE_HANDLE
)
2971 TREE_TYPE (val
) = TREE_TYPE (TREE_OPERAND (vexpr
, i
));
2973 TREE_OPERAND (vexpr
, i
) = val
;
2981 /* Insert extra phis to merge values that are fully available from
2982 preds of BLOCK, but have no dominating representative coming from
2986 insert_extra_phis (basic_block block
, basic_block dom
)
2989 if (!single_pred_p (block
))
2994 bitmap_set_t tempset
= bitmap_set_new ();
2996 FOR_EACH_EDGE (e
, ei
, block
->preds
)
2998 /* We cannot handle abnormal incoming edges correctly. */
2999 if (e
->flags
& EDGE_ABNORMAL
)
3004 bitmap_set_copy (tempset
, AVAIL_OUT (e
->src
));
3008 bitmap_set_and (tempset
, AVAIL_OUT (e
->src
));
3012 bitmap_set_and_compl (tempset
, AVAIL_OUT (dom
));
3014 if (!bitmap_set_empty_p (tempset
))
3019 EXECUTE_IF_SET_IN_BITMAP (tempset
->expressions
, 0, i
, bi
)
3021 tree name
= ssa_name (i
);
3022 tree val
= get_value_handle (name
);
3025 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
))
3029 || TREE_TYPE (name
) != TREE_TYPE (mergephitemp
))
3031 mergephitemp
= create_tmp_var (TREE_TYPE (name
),
3033 get_var_ann (mergephitemp
);
3035 temp
= mergephitemp
;
3037 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3039 fprintf (dump_file
, "Creating phi ");
3040 print_generic_expr (dump_file
, temp
, 0);
3041 fprintf (dump_file
, " to merge available but not dominating values ");
3044 add_referenced_var (temp
);
3045 temp
= create_phi_node (temp
, block
);
3046 NECESSARY (temp
) = 0;
3047 VEC_safe_push (tree
, heap
, inserted_exprs
, temp
);
3049 FOR_EACH_EDGE (e
, ei
, block
->preds
)
3051 tree leader
= bitmap_find_leader (AVAIL_OUT (e
->src
), val
);
3053 gcc_assert (leader
);
3054 add_phi_arg (temp
, leader
, e
);
3056 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3058 print_generic_expr (dump_file
, leader
, 0);
3059 fprintf (dump_file
, " in block %d,", e
->src
->index
);
3063 vn_add (PHI_RESULT (temp
), val
);
3065 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3066 fprintf (dump_file
, "\n");
3072 /* Given a statement STMT and its right hand side which is a load, try
3073 to look for the expression stored in the location for the load, and
3074 return true if a useful equivalence was recorded for LHS. */
3077 try_look_through_load (tree lhs
, tree mem_ref
, tree stmt
, basic_block block
)
3079 tree store_stmt
= NULL
;
3084 FOR_EACH_SSA_TREE_OPERAND (vuse
, stmt
, i
, SSA_OP_VIRTUAL_USES
)
3088 gcc_assert (TREE_CODE (vuse
) == SSA_NAME
);
3089 def_stmt
= SSA_NAME_DEF_STMT (vuse
);
3091 /* If there is no useful statement for this VUSE, we'll not find a
3092 useful expression to return either. Likewise, if there is a
3093 statement but it is not a simple assignment or it has virtual
3094 uses, we can stop right here. Note that this means we do
3095 not look through PHI nodes, which is intentional. */
3097 || TREE_CODE (def_stmt
) != MODIFY_EXPR
3098 || !ZERO_SSA_OPERANDS (def_stmt
, SSA_OP_VIRTUAL_USES
))
3101 /* If this is not the same statement as one we have looked at for
3102 another VUSE of STMT already, we have two statements producing
3103 something that reaches our STMT. */
3104 if (store_stmt
&& store_stmt
!= def_stmt
)
3108 /* Is this a store to the exact same location as the one we are
3109 loading from in STMT? */
3110 if (!operand_equal_p (TREE_OPERAND (def_stmt
, 0), mem_ref
, 0))
3113 /* Otherwise remember this statement and see if all other VUSEs
3114 come from the same statement. */
3115 store_stmt
= def_stmt
;
3119 /* Alright then, we have visited all VUSEs of STMT and we've determined
3120 that all of them come from the same statement STORE_STMT. See if there
3121 is a useful expression we can deduce from STORE_STMT. */
3122 rhs
= TREE_OPERAND (store_stmt
, 1);
3123 if ((TREE_CODE (rhs
) == SSA_NAME
3124 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (rhs
))
3125 || is_gimple_min_invariant (rhs
)
3126 || TREE_CODE (rhs
) == ADDR_EXPR
3127 || TREE_INVARIANT (rhs
))
3130 /* Yay! Compute a value number for the RHS of the statement and
3131 add its value to the AVAIL_OUT set for the block. Add the LHS
3133 add_to_sets (lhs
, rhs
, store_stmt
, TMP_GEN (block
), AVAIL_OUT (block
));
3134 if (TREE_CODE (rhs
) == SSA_NAME
3135 && !is_undefined_value (rhs
))
3136 value_insert_into_set (EXP_GEN (block
), rhs
);
3143 /* Return a copy of NODE that is stored in the temporary alloc_pool's.
3144 This is made recursively true, so that the operands are stored in
3145 the pool as well. */
3148 poolify_tree (tree node
)
3150 switch (TREE_CODE (node
))
3154 tree temp
= pool_alloc (reference_node_pool
);
3155 memcpy (temp
, node
, tree_size (node
));
3156 TREE_OPERAND (temp
, 0) = poolify_tree (TREE_OPERAND (temp
, 0));
3162 tree temp
= pool_alloc (modify_expr_node_pool
);
3163 memcpy (temp
, node
, tree_size (node
));
3164 TREE_OPERAND (temp
, 0) = poolify_tree (TREE_OPERAND (temp
, 0));
3165 TREE_OPERAND (temp
, 1) = poolify_tree (TREE_OPERAND (temp
, 1));
3182 static tree modify_expr_template
;
3184 /* Allocate a MODIFY_EXPR with TYPE, and operands OP1, OP2 in the
3185 alloc pools and return it. */
3187 poolify_modify_expr (tree type
, tree op1
, tree op2
)
3189 if (modify_expr_template
== NULL
)
3190 modify_expr_template
= build2 (MODIFY_EXPR
, type
, op1
, op2
);
3192 TREE_OPERAND (modify_expr_template
, 0) = op1
;
3193 TREE_OPERAND (modify_expr_template
, 1) = op2
;
3194 TREE_TYPE (modify_expr_template
) = type
;
3196 return poolify_tree (modify_expr_template
);
3200 /* For each real store operation of the form
3201 *a = <value> that we see, create a corresponding fake store of the
3202 form storetmp_<version> = *a.
3204 This enables AVAIL computation to mark the results of stores as
3205 available. Without this, you'd need to do some computation to
3206 mark the result of stores as ANTIC and AVAIL at all the right
3208 To save memory, we keep the store
3209 statements pool allocated until we decide whether they are
3210 necessary or not. */
3213 insert_fake_stores (void)
3219 block_stmt_iterator bsi
;
3220 for (bsi
= bsi_start (block
); !bsi_end_p (bsi
); bsi_next (&bsi
))
3222 tree stmt
= bsi_stmt (bsi
);
3224 /* We can't generate SSA names for stores that are complex
3225 or aggregate. We also want to ignore things whose
3226 virtual uses occur in abnormal phis. */
3228 if (TREE_CODE (stmt
) == MODIFY_EXPR
3229 && TREE_CODE (TREE_OPERAND (stmt
, 0)) == INDIRECT_REF
3230 && !AGGREGATE_TYPE_P (TREE_TYPE (TREE_OPERAND (stmt
, 0)))
3231 && TREE_CODE (TREE_TYPE (TREE_OPERAND (stmt
, 0))) != COMPLEX_TYPE
)
3235 tree lhs
= TREE_OPERAND (stmt
, 0);
3236 tree rhs
= TREE_OPERAND (stmt
, 1);
3238 bool notokay
= false;
3240 FOR_EACH_SSA_DEF_OPERAND (defp
, stmt
, iter
, SSA_OP_VIRTUAL_DEFS
)
3242 tree defvar
= DEF_FROM_PTR (defp
);
3243 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (defvar
))
3253 if (!storetemp
|| TREE_TYPE (rhs
) != TREE_TYPE (storetemp
))
3255 storetemp
= create_tmp_var (TREE_TYPE (rhs
), "storetmp");
3256 get_var_ann (storetemp
);
3259 new = poolify_modify_expr (TREE_TYPE (stmt
), storetemp
, lhs
);
3261 lhs
= make_ssa_name (storetemp
, new);
3262 TREE_OPERAND (new, 0) = lhs
;
3263 create_ssa_artficial_load_stmt (new, stmt
);
3265 NECESSARY (new) = 0;
3266 VEC_safe_push (tree
, heap
, inserted_exprs
, new);
3267 VEC_safe_push (tree
, heap
, need_creation
, new);
3268 bsi_insert_after (&bsi
, new, BSI_NEW_STMT
);
3274 /* Turn the pool allocated fake stores that we created back into real
3275 GC allocated ones if they turned out to be necessary to PRE some
3279 realify_fake_stores (void)
3284 for (i
= 0; VEC_iterate (tree
, need_creation
, i
, stmt
); i
++)
3286 if (NECESSARY (stmt
))
3288 block_stmt_iterator bsi
;
3291 /* Mark the temp variable as referenced */
3292 add_referenced_var (SSA_NAME_VAR (TREE_OPERAND (stmt
, 0)));
3294 /* Put the new statement in GC memory, fix up the
3295 SSA_NAME_DEF_STMT on it, and then put it in place of
3296 the old statement before the store in the IR stream
3297 as a plain ssa name copy. */
3298 bsi
= bsi_for_stmt (stmt
);
3300 newstmt
= build2 (MODIFY_EXPR
, void_type_node
,
3301 TREE_OPERAND (stmt
, 0),
3302 TREE_OPERAND (bsi_stmt (bsi
), 1));
3303 SSA_NAME_DEF_STMT (TREE_OPERAND (newstmt
, 0)) = newstmt
;
3304 bsi_insert_before (&bsi
, newstmt
, BSI_SAME_STMT
);
3305 bsi
= bsi_for_stmt (stmt
);
3306 bsi_remove (&bsi
, true);
3309 release_defs (stmt
);
3313 /* Tree-combine a value number expression *EXPR_P that does a type
3314 conversion with the value number expression of its operand.
3315 Returns true, if *EXPR_P simplifies to a value number or
3316 gimple min-invariant expression different from EXPR_P and
3317 sets *EXPR_P to the simplified expression value number.
3318 Otherwise returns false and does not change *EXPR_P. */
3321 try_combine_conversion (tree
*expr_p
)
3323 tree expr
= *expr_p
;
3326 if (!((TREE_CODE (expr
) == NOP_EXPR
3327 || TREE_CODE (expr
) == CONVERT_EXPR
)
3328 && TREE_CODE (TREE_OPERAND (expr
, 0)) == VALUE_HANDLE
3329 && !VALUE_HANDLE_VUSES (TREE_OPERAND (expr
, 0))))
3332 t
= fold_unary (TREE_CODE (expr
), TREE_TYPE (expr
),
3333 VALUE_HANDLE_EXPR_SET (TREE_OPERAND (expr
, 0))->head
->expr
);
3337 /* Strip useless type conversions, which is safe in the optimizers but
3338 not generally in fold. */
3339 STRIP_USELESS_TYPE_CONVERSION (t
);
3341 /* Disallow value expressions we have no value number for already, as
3342 we would miss a leader for it here. */
3343 if (!(TREE_CODE (t
) == VALUE_HANDLE
3344 || is_gimple_min_invariant (t
)))
3345 t
= vn_lookup (t
, NULL
);
3355 /* Compute the AVAIL set for all basic blocks.
3357 This function performs value numbering of the statements in each basic
3358 block. The AVAIL sets are built from information we glean while doing
3359 this value numbering, since the AVAIL sets contain only one entry per
3362 AVAIL_IN[BLOCK] = AVAIL_OUT[dom(BLOCK)].
3363 AVAIL_OUT[BLOCK] = AVAIL_IN[BLOCK] U PHI_GEN[BLOCK] U TMP_GEN[BLOCK]. */
3366 compute_avail (void)
3368 basic_block block
, son
;
3369 basic_block
*worklist
;
3372 /* For arguments with default definitions, we pretend they are
3373 defined in the entry block. */
3374 for (param
= DECL_ARGUMENTS (current_function_decl
);
3376 param
= TREE_CHAIN (param
))
3378 if (default_def (param
) != NULL
)
3380 tree def
= default_def (param
);
3381 vn_lookup_or_add (def
, NULL
);
3382 bitmap_insert_into_set (TMP_GEN (ENTRY_BLOCK_PTR
), def
);
3383 bitmap_value_insert_into_set (AVAIL_OUT (ENTRY_BLOCK_PTR
), def
);
3387 /* Likewise for the static chain decl. */
3388 if (cfun
->static_chain_decl
)
3390 param
= cfun
->static_chain_decl
;
3391 if (default_def (param
) != NULL
)
3393 tree def
= default_def (param
);
3394 vn_lookup_or_add (def
, NULL
);
3395 bitmap_insert_into_set (TMP_GEN (ENTRY_BLOCK_PTR
), def
);
3396 bitmap_value_insert_into_set (AVAIL_OUT (ENTRY_BLOCK_PTR
), def
);
3400 /* Allocate the worklist. */
3401 worklist
= XNEWVEC (basic_block
, n_basic_blocks
);
3403 /* Seed the algorithm by putting the dominator children of the entry
3404 block on the worklist. */
3405 for (son
= first_dom_son (CDI_DOMINATORS
, ENTRY_BLOCK_PTR
);
3407 son
= next_dom_son (CDI_DOMINATORS
, son
))
3408 worklist
[sp
++] = son
;
3410 /* Loop until the worklist is empty. */
3413 block_stmt_iterator bsi
;
3416 unsigned int stmt_uid
= 1;
3418 /* Pick a block from the worklist. */
3419 block
= worklist
[--sp
];
3421 /* Initially, the set of available values in BLOCK is that of
3422 its immediate dominator. */
3423 dom
= get_immediate_dominator (CDI_DOMINATORS
, block
);
3425 bitmap_set_copy (AVAIL_OUT (block
), AVAIL_OUT (dom
));
3428 insert_extra_phis (block
, dom
);
3430 /* Generate values for PHI nodes. */
3431 for (phi
= phi_nodes (block
); phi
; phi
= PHI_CHAIN (phi
))
3432 /* We have no need for virtual phis, as they don't represent
3433 actual computations. */
3434 if (is_gimple_reg (PHI_RESULT (phi
)))
3435 add_to_sets (PHI_RESULT (phi
), PHI_RESULT (phi
), NULL
,
3436 PHI_GEN (block
), AVAIL_OUT (block
));
3438 /* Now compute value numbers and populate value sets with all
3439 the expressions computed in BLOCK. */
3440 for (bsi
= bsi_start (block
); !bsi_end_p (bsi
); bsi_next (&bsi
))
3446 stmt
= bsi_stmt (bsi
);
3447 ann
= stmt_ann (stmt
);
3449 ann
->uid
= stmt_uid
++;
3451 /* For regular value numbering, we are only interested in
3452 assignments of the form X_i = EXPR, where EXPR represents
3453 an "interesting" computation, it has no volatile operands
3454 and X_i doesn't flow through an abnormal edge. */
3455 if (TREE_CODE (stmt
) == MODIFY_EXPR
3456 && !ann
->has_volatile_ops
3457 && TREE_CODE (TREE_OPERAND (stmt
, 0)) == SSA_NAME
3458 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (TREE_OPERAND (stmt
, 0)))
3460 tree lhs
= TREE_OPERAND (stmt
, 0);
3461 tree rhs
= TREE_OPERAND (stmt
, 1);
3463 /* Try to look through loads. */
3464 if (TREE_CODE (lhs
) == SSA_NAME
3465 && !ZERO_SSA_OPERANDS (stmt
, SSA_OP_VIRTUAL_USES
)
3466 && try_look_through_load (lhs
, rhs
, stmt
, block
))
3469 STRIP_USELESS_TYPE_CONVERSION (rhs
);
3470 if (can_value_number_operation (rhs
))
3472 /* For value numberable operation, create a
3473 duplicate expression with the operands replaced
3474 with the value handles of the original RHS. */
3475 tree newt
= create_value_expr_from (rhs
, block
, stmt
);
3478 /* If we can combine a conversion expression
3479 with the expression for its operand just
3480 record the value number for it. */
3481 if (try_combine_conversion (&newt
))
3485 tree val
= vn_lookup_or_add (newt
, stmt
);
3487 value_insert_into_set (EXP_GEN (block
), newt
);
3489 bitmap_insert_into_set (TMP_GEN (block
), lhs
);
3490 bitmap_value_insert_into_set (AVAIL_OUT (block
), lhs
);
3494 else if ((TREE_CODE (rhs
) == SSA_NAME
3495 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (rhs
))
3496 || is_gimple_min_invariant (rhs
)
3497 || TREE_CODE (rhs
) == ADDR_EXPR
3498 || TREE_INVARIANT (rhs
)
3501 /* Compute a value number for the RHS of the statement
3502 and add its value to the AVAIL_OUT set for the block.
3503 Add the LHS to TMP_GEN. */
3504 add_to_sets (lhs
, rhs
, stmt
, TMP_GEN (block
),
3507 if (TREE_CODE (rhs
) == SSA_NAME
3508 && !is_undefined_value (rhs
))
3509 value_insert_into_set (EXP_GEN (block
), rhs
);
3514 /* For any other statement that we don't recognize, simply
3515 make the names generated by the statement available in
3516 AVAIL_OUT and TMP_GEN. */
3517 FOR_EACH_SSA_TREE_OPERAND (op
, stmt
, iter
, SSA_OP_DEF
)
3518 add_to_sets (op
, op
, NULL
, TMP_GEN (block
), AVAIL_OUT (block
));
3520 FOR_EACH_SSA_TREE_OPERAND (op
, stmt
, iter
, SSA_OP_USE
)
3521 add_to_sets (op
, op
, NULL
, NULL
, AVAIL_OUT (block
));
3524 /* Put the dominator children of BLOCK on the worklist of blocks
3525 to compute available sets for. */
3526 for (son
= first_dom_son (CDI_DOMINATORS
, block
);
3528 son
= next_dom_son (CDI_DOMINATORS
, son
))
3529 worklist
[sp
++] = son
;
3536 /* Eliminate fully redundant computations. */
3545 block_stmt_iterator i
;
3547 for (i
= bsi_start (b
); !bsi_end_p (i
); bsi_next (&i
))
3549 tree stmt
= bsi_stmt (i
);
3551 /* Lookup the RHS of the expression, see if we have an
3552 available computation for it. If so, replace the RHS with
3553 the available computation. */
3554 if (TREE_CODE (stmt
) == MODIFY_EXPR
3555 && TREE_CODE (TREE_OPERAND (stmt
, 0)) == SSA_NAME
3556 && TREE_CODE (TREE_OPERAND (stmt
,1)) != SSA_NAME
3557 && !is_gimple_min_invariant (TREE_OPERAND (stmt
, 1))
3558 && !stmt_ann (stmt
)->has_volatile_ops
)
3560 tree lhs
= TREE_OPERAND (stmt
, 0);
3561 tree
*rhs_p
= &TREE_OPERAND (stmt
, 1);
3564 sprime
= bitmap_find_leader (AVAIL_OUT (b
),
3565 vn_lookup (lhs
, NULL
));
3568 && (TREE_CODE (*rhs_p
) != SSA_NAME
3569 || may_propagate_copy (*rhs_p
, sprime
)))
3571 gcc_assert (sprime
!= *rhs_p
);
3573 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3575 fprintf (dump_file
, "Replaced ");
3576 print_generic_expr (dump_file
, *rhs_p
, 0);
3577 fprintf (dump_file
, " with ");
3578 print_generic_expr (dump_file
, sprime
, 0);
3579 fprintf (dump_file
, " in ");
3580 print_generic_stmt (dump_file
, stmt
, 0);
3583 if (TREE_CODE (sprime
) == SSA_NAME
)
3584 NECESSARY (SSA_NAME_DEF_STMT (sprime
)) = 1;
3585 /* We need to make sure the new and old types actually match,
3586 which may require adding a simple cast, which fold_convert
3588 if (TREE_CODE (*rhs_p
) != SSA_NAME
3589 && !tree_ssa_useless_type_conversion_1 (TREE_TYPE (*rhs_p
),
3590 TREE_TYPE (sprime
)))
3591 sprime
= fold_convert (TREE_TYPE (*rhs_p
), sprime
);
3593 pre_stats
.eliminations
++;
3594 propagate_tree_value (rhs_p
, sprime
);
3597 /* If we removed EH side effects from the statement, clean
3598 its EH information. */
3599 if (maybe_clean_or_replace_eh_stmt (stmt
, stmt
))
3601 bitmap_set_bit (need_eh_cleanup
,
3602 bb_for_stmt (stmt
)->index
);
3603 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3604 fprintf (dump_file
, " Removed EH side effects.\n");
3612 /* Borrow a bit of tree-ssa-dce.c for the moment.
3613 XXX: In 4.1, we should be able to just run a DCE pass after PRE, though
3614 this may be a bit faster, and we may want critical edges kept split. */
3616 /* If OP's defining statement has not already been determined to be necessary,
3617 mark that statement necessary. Return the stmt, if it is newly
3621 mark_operand_necessary (tree op
)
3627 if (TREE_CODE (op
) != SSA_NAME
)
3630 stmt
= SSA_NAME_DEF_STMT (op
);
3633 if (NECESSARY (stmt
)
3634 || IS_EMPTY_STMT (stmt
))
3637 NECESSARY (stmt
) = 1;
3641 /* Because we don't follow exactly the standard PRE algorithm, and decide not
3642 to insert PHI nodes sometimes, and because value numbering of casts isn't
3643 perfect, we sometimes end up inserting dead code. This simple DCE-like
3644 pass removes any insertions we made that weren't actually used. */
3647 remove_dead_inserted_code (void)
3649 VEC(tree
,heap
) *worklist
= NULL
;
3653 worklist
= VEC_alloc (tree
, heap
, VEC_length (tree
, inserted_exprs
));
3654 for (i
= 0; VEC_iterate (tree
, inserted_exprs
, i
, t
); i
++)
3657 VEC_quick_push (tree
, worklist
, t
);
3659 while (VEC_length (tree
, worklist
) > 0)
3661 t
= VEC_pop (tree
, worklist
);
3663 /* PHI nodes are somewhat special in that each PHI alternative has
3664 data and control dependencies. All the statements feeding the
3665 PHI node's arguments are always necessary. */
3666 if (TREE_CODE (t
) == PHI_NODE
)
3670 VEC_reserve (tree
, heap
, worklist
, PHI_NUM_ARGS (t
));
3671 for (k
= 0; k
< PHI_NUM_ARGS (t
); k
++)
3673 tree arg
= PHI_ARG_DEF (t
, k
);
3674 if (TREE_CODE (arg
) == SSA_NAME
)
3676 arg
= mark_operand_necessary (arg
);
3678 VEC_quick_push (tree
, worklist
, arg
);
3684 /* Propagate through the operands. Examine all the USE, VUSE and
3685 V_MAY_DEF operands in this statement. Mark all the statements
3686 which feed this statement's uses as necessary. */
3690 /* The operands of V_MAY_DEF expressions are also needed as they
3691 represent potential definitions that may reach this
3692 statement (V_MAY_DEF operands allow us to follow def-def
3695 FOR_EACH_SSA_TREE_OPERAND (use
, t
, iter
, SSA_OP_ALL_USES
)
3697 tree n
= mark_operand_necessary (use
);
3699 VEC_safe_push (tree
, heap
, worklist
, n
);
3704 for (i
= 0; VEC_iterate (tree
, inserted_exprs
, i
, t
); i
++)
3708 block_stmt_iterator bsi
;
3710 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3712 fprintf (dump_file
, "Removing unnecessary insertion:");
3713 print_generic_stmt (dump_file
, t
, 0);
3716 if (TREE_CODE (t
) == PHI_NODE
)
3718 remove_phi_node (t
, NULL
);
3722 bsi
= bsi_for_stmt (t
);
3723 bsi_remove (&bsi
, true);
3728 VEC_free (tree
, heap
, worklist
);
3731 /* Initialize data structures used by PRE. */
3734 init_pre (bool do_fre
)
3740 inserted_exprs
= NULL
;
3741 need_creation
= NULL
;
3742 pretemp
= NULL_TREE
;
3743 storetemp
= NULL_TREE
;
3744 mergephitemp
= NULL_TREE
;
3745 prephitemp
= NULL_TREE
;
3749 current_loops
= loop_optimizer_init (LOOPS_NORMAL
);
3751 connect_infinite_loops_to_exit ();
3752 memset (&pre_stats
, 0, sizeof (pre_stats
));
3754 /* If block 0 has more than one predecessor, it means that its PHI
3755 nodes will have arguments coming from block -1. This creates
3756 problems for several places in PRE that keep local arrays indexed
3757 by block number. To prevent this, we split the edge coming from
3758 ENTRY_BLOCK_PTR (FIXME, if ENTRY_BLOCK_PTR had an index number
3759 different than -1 we wouldn't have to hack this. tree-ssa-dce.c
3760 needs a similar change). */
3761 if (!single_pred_p (single_succ (ENTRY_BLOCK_PTR
)))
3762 if (!(single_succ_edge (ENTRY_BLOCK_PTR
)->flags
& EDGE_ABNORMAL
))
3763 split_edge (single_succ_edge (ENTRY_BLOCK_PTR
));
3766 bb
->aux
= xcalloc (1, sizeof (struct bb_value_sets
));
3768 bitmap_obstack_initialize (&grand_bitmap_obstack
);
3769 phi_translate_table
= htab_create (511, expr_pred_trans_hash
,
3770 expr_pred_trans_eq
, free
);
3771 value_set_pool
= create_alloc_pool ("Value sets",
3772 sizeof (struct value_set
), 30);
3773 bitmap_set_pool
= create_alloc_pool ("Bitmap sets",
3774 sizeof (struct bitmap_set
), 30);
3775 value_set_node_pool
= create_alloc_pool ("Value set nodes",
3776 sizeof (struct value_set_node
), 30);
3777 calculate_dominance_info (CDI_POST_DOMINATORS
);
3778 calculate_dominance_info (CDI_DOMINATORS
);
3779 binary_node_pool
= create_alloc_pool ("Binary tree nodes",
3780 tree_code_size (PLUS_EXPR
), 30);
3781 unary_node_pool
= create_alloc_pool ("Unary tree nodes",
3782 tree_code_size (NEGATE_EXPR
), 30);
3783 reference_node_pool
= create_alloc_pool ("Reference tree nodes",
3784 tree_code_size (ARRAY_REF
), 30);
3785 expression_node_pool
= create_alloc_pool ("Expression tree nodes",
3786 tree_code_size (CALL_EXPR
), 30);
3787 list_node_pool
= create_alloc_pool ("List tree nodes",
3788 tree_code_size (TREE_LIST
), 30);
3789 comparison_node_pool
= create_alloc_pool ("Comparison tree nodes",
3790 tree_code_size (EQ_EXPR
), 30);
3791 modify_expr_node_pool
= create_alloc_pool ("MODIFY_EXPR nodes",
3792 tree_code_size (MODIFY_EXPR
),
3794 modify_expr_template
= NULL
;
3798 EXP_GEN (bb
) = set_new (true);
3799 PHI_GEN (bb
) = bitmap_set_new ();
3800 TMP_GEN (bb
) = bitmap_set_new ();
3801 AVAIL_OUT (bb
) = bitmap_set_new ();
3804 need_eh_cleanup
= BITMAP_ALLOC (NULL
);
3808 /* Deallocate data structures used by PRE. */
3811 fini_pre (bool do_fre
)
3816 VEC_free (tree
, heap
, inserted_exprs
);
3817 VEC_free (tree
, heap
, need_creation
);
3818 bitmap_obstack_release (&grand_bitmap_obstack
);
3819 free_alloc_pool (value_set_pool
);
3820 free_alloc_pool (bitmap_set_pool
);
3821 free_alloc_pool (value_set_node_pool
);
3822 free_alloc_pool (binary_node_pool
);
3823 free_alloc_pool (reference_node_pool
);
3824 free_alloc_pool (unary_node_pool
);
3825 free_alloc_pool (list_node_pool
);
3826 free_alloc_pool (expression_node_pool
);
3827 free_alloc_pool (comparison_node_pool
);
3828 free_alloc_pool (modify_expr_node_pool
);
3829 htab_delete (phi_translate_table
);
3830 remove_fake_exit_edges ();
3838 free_dominance_info (CDI_POST_DOMINATORS
);
3841 if (!bitmap_empty_p (need_eh_cleanup
))
3843 tree_purge_all_dead_eh_edges (need_eh_cleanup
);
3844 cleanup_tree_cfg ();
3847 BITMAP_FREE (need_eh_cleanup
);
3849 /* Wipe out pointers to VALUE_HANDLEs. In the not terribly distant
3850 future we will want them to be persistent though. */
3851 for (i
= 0; i
< num_ssa_names
; i
++)
3853 tree name
= ssa_name (i
);
3858 if (SSA_NAME_VALUE (name
)
3859 && TREE_CODE (SSA_NAME_VALUE (name
)) == VALUE_HANDLE
)
3860 SSA_NAME_VALUE (name
) = NULL
;
3862 if (!do_fre
&& current_loops
)
3864 loop_optimizer_finalize (current_loops
);
3865 current_loops
= NULL
;
3869 /* Main entry point to the SSA-PRE pass. DO_FRE is true if the caller
3870 only wants to do full redundancy elimination. */
3873 execute_pre (bool do_fre
)
3878 insert_fake_stores ();
3880 /* Collect and value number expressions computed in each basic block. */
3883 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3889 print_value_set (dump_file
, EXP_GEN (bb
), "exp_gen", bb
->index
);
3890 bitmap_print_value_set (dump_file
, TMP_GEN (bb
), "tmp_gen",
3892 bitmap_print_value_set (dump_file
, AVAIL_OUT (bb
), "avail_out",
3897 /* Insert can get quite slow on an incredibly large number of basic
3898 blocks due to some quadratic behavior. Until this behavior is
3899 fixed, don't run it when he have an incredibly large number of
3900 bb's. If we aren't going to run insert, there is no point in
3901 computing ANTIC, either, even though it's plenty fast. */
3902 if (!do_fre
&& n_basic_blocks
< 4000)
3904 vuse_names
= XCNEWVEC (bitmap
, num_ssa_names
);
3905 compute_rvuse_and_antic_safe ();
3911 /* Remove all the redundant expressions. */
3915 if (dump_file
&& (dump_flags
& TDF_STATS
))
3917 fprintf (dump_file
, "Insertions: %d\n", pre_stats
.insertions
);
3918 fprintf (dump_file
, "New PHIs: %d\n", pre_stats
.phis
);
3919 fprintf (dump_file
, "Eliminated: %d\n", pre_stats
.eliminations
);
3920 fprintf (dump_file
, "Constified: %d\n", pre_stats
.constified
);
3923 bsi_commit_edge_inserts ();
3927 remove_dead_inserted_code ();
3928 realify_fake_stores ();
3935 /* Gate and execute functions for PRE. */
3940 execute_pre (false);
3947 return flag_tree_pre
!= 0;
3950 struct tree_opt_pass pass_pre
=
3953 gate_pre
, /* gate */
3954 do_pre
, /* execute */
3957 0, /* static_pass_number */
3958 TV_TREE_PRE
, /* tv_id */
3959 PROP_no_crit_edges
| PROP_cfg
3960 | PROP_ssa
| PROP_alias
, /* properties_required */
3961 0, /* properties_provided */
3962 0, /* properties_destroyed */
3963 0, /* todo_flags_start */
3964 TODO_update_ssa_only_virtuals
| TODO_dump_func
| TODO_ggc_collect
3965 | TODO_verify_ssa
, /* todo_flags_finish */
3970 /* Gate and execute functions for FRE. */
3982 return flag_tree_fre
!= 0;
3985 struct tree_opt_pass pass_fre
=
3988 gate_fre
, /* gate */
3989 execute_fre
, /* execute */
3992 0, /* static_pass_number */
3993 TV_TREE_FRE
, /* tv_id */
3994 PROP_cfg
| PROP_ssa
| PROP_alias
, /* properties_required */
3995 0, /* properties_provided */
3996 0, /* properties_destroyed */
3997 0, /* todo_flags_start */
3998 TODO_dump_func
| TODO_ggc_collect
| TODO_verify_ssa
, /* todo_flags_finish */