1 /* Scalar evolution detector.
2 Copyright (C) 2003-2014 Free Software Foundation, Inc.
3 Contributed by Sebastian Pop <s.pop@laposte.net>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
24 This pass analyzes the evolution of scalar variables in loop
25 structures. The algorithm is based on the SSA representation,
26 and on the loop hierarchy tree. This algorithm is not based on
27 the notion of versions of a variable, as it was the case for the
28 previous implementations of the scalar evolution algorithm, but
29 it assumes that each defined name is unique.
31 The notation used in this file is called "chains of recurrences",
32 and has been proposed by Eugene Zima, Robert Van Engelen, and
33 others for describing induction variables in programs. For example
34 "b -> {0, +, 2}_1" means that the scalar variable "b" is equal to 0
35 when entering in the loop_1 and has a step 2 in this loop, in other
36 words "for (b = 0; b < N; b+=2);". Note that the coefficients of
37 this chain of recurrence (or chrec [shrek]) can contain the name of
38 other variables, in which case they are called parametric chrecs.
39 For example, "b -> {a, +, 2}_1" means that the initial value of "b"
40 is the value of "a". In most of the cases these parametric chrecs
41 are fully instantiated before their use because symbolic names can
42 hide some difficult cases such as self-references described later
43 (see the Fibonacci example).
45 A short sketch of the algorithm is:
47 Given a scalar variable to be analyzed, follow the SSA edge to
50 - When the definition is a GIMPLE_ASSIGN: if the right hand side
51 (RHS) of the definition cannot be statically analyzed, the answer
52 of the analyzer is: "don't know".
53 Otherwise, for all the variables that are not yet analyzed in the
54 RHS, try to determine their evolution, and finally try to
55 evaluate the operation of the RHS that gives the evolution
56 function of the analyzed variable.
58 - When the definition is a condition-phi-node: determine the
59 evolution function for all the branches of the phi node, and
60 finally merge these evolutions (see chrec_merge).
62 - When the definition is a loop-phi-node: determine its initial
63 condition, that is the SSA edge defined in an outer loop, and
64 keep it symbolic. Then determine the SSA edges that are defined
65 in the body of the loop. Follow the inner edges until ending on
66 another loop-phi-node of the same analyzed loop. If the reached
67 loop-phi-node is not the starting loop-phi-node, then we keep
68 this definition under a symbolic form. If the reached
69 loop-phi-node is the same as the starting one, then we compute a
70 symbolic stride on the return path. The result is then the
71 symbolic chrec {initial_condition, +, symbolic_stride}_loop.
75 Example 1: Illustration of the basic algorithm.
81 | if (c > 10) exit_loop
84 Suppose that we want to know the number of iterations of the
85 loop_1. The exit_loop is controlled by a COND_EXPR (c > 10). We
86 ask the scalar evolution analyzer two questions: what's the
87 scalar evolution (scev) of "c", and what's the scev of "10". For
88 "10" the answer is "10" since it is a scalar constant. For the
89 scalar variable "c", it follows the SSA edge to its definition,
90 "c = b + 1", and then asks again what's the scev of "b".
91 Following the SSA edge, we end on a loop-phi-node "b = phi (a,
92 c)", where the initial condition is "a", and the inner loop edge
93 is "c". The initial condition is kept under a symbolic form (it
94 may be the case that the copy constant propagation has done its
95 work and we end with the constant "3" as one of the edges of the
96 loop-phi-node). The update edge is followed to the end of the
97 loop, and until reaching again the starting loop-phi-node: b -> c
98 -> b. At this point we have drawn a path from "b" to "b" from
99 which we compute the stride in the loop: in this example it is
100 "+1". The resulting scev for "b" is "b -> {a, +, 1}_1". Now
101 that the scev for "b" is known, it is possible to compute the
102 scev for "c", that is "c -> {a + 1, +, 1}_1". In order to
103 determine the number of iterations in the loop_1, we have to
104 instantiate_parameters (loop_1, {a + 1, +, 1}_1), that gives after some
105 more analysis the scev {4, +, 1}_1, or in other words, this is
106 the function "f (x) = x + 4", where x is the iteration count of
107 the loop_1. Now we have to solve the inequality "x + 4 > 10",
108 and take the smallest iteration number for which the loop is
109 exited: x = 7. This loop runs from x = 0 to x = 7, and in total
110 there are 8 iterations. In terms of loop normalization, we have
111 created a variable that is implicitly defined, "x" or just "_1",
112 and all the other analyzed scalars of the loop are defined in
113 function of this variable:
119 or in terms of a C program:
122 | for (x = 0; x <= 7; x++)
128 Example 2a: Illustration of the algorithm on nested loops.
139 For analyzing the scalar evolution of "a", the algorithm follows
140 the SSA edge into the loop's body: "a -> b". "b" is an inner
141 loop-phi-node, and its analysis as in Example 1, gives:
146 Following the SSA edge for the initial condition, we end on "c = a
147 + 2", and then on the starting loop-phi-node "a". From this point,
148 the loop stride is computed: back on "c = a + 2" we get a "+2" in
149 the loop_1, then on the loop-phi-node "b" we compute the overall
150 effect of the inner loop that is "b = c + 30", and we get a "+30"
151 in the loop_1. That means that the overall stride in loop_1 is
152 equal to "+32", and the result is:
157 Example 2b: Multivariate chains of recurrences.
170 Analyzing the access function of array A with
171 instantiate_parameters (loop_1, "j + k"), we obtain the
172 instantiation and the analysis of the scalar variables "j" and "k"
173 in loop_1. This leads to the scalar evolution {4, +, 1}_1: the end
174 value of loop_2 for "j" is 4, and the evolution of "k" in loop_1 is
175 {0, +, 1}_1. To obtain the evolution function in loop_3 and
176 instantiate the scalar variables up to loop_1, one has to use:
177 instantiate_scev (block_before_loop (loop_1), loop_3, "j + k").
178 The result of this call is {{0, +, 1}_1, +, 1}_2.
180 Example 3: Higher degree polynomials.
194 instantiate_parameters (loop_1, {5, +, a}_1) -> {5, +, 2, +, 1}_1
195 instantiate_parameters (loop_1, {5 + a, +, a}_1) -> {7, +, 3, +, 1}_1
197 Example 4: Lucas, Fibonacci, or mixers in general.
209 The syntax "(1, c)_1" stands for a PEELED_CHREC that has the
210 following semantics: during the first iteration of the loop_1, the
211 variable contains the value 1, and then it contains the value "c".
212 Note that this syntax is close to the syntax of the loop-phi-node:
213 "a -> (1, c)_1" vs. "a = phi (1, c)".
215 The symbolic chrec representation contains all the semantics of the
216 original code. What is more difficult is to use this information.
218 Example 5: Flip-flops, or exchangers.
230 Based on these symbolic chrecs, it is possible to refine this
231 information into the more precise PERIODIC_CHRECs:
236 This transformation is not yet implemented.
240 You can find a more detailed description of the algorithm in:
241 http://icps.u-strasbg.fr/~pop/DEA_03_Pop.pdf
242 http://icps.u-strasbg.fr/~pop/DEA_03_Pop.ps.gz. But note that
243 this is a preliminary report and some of the details of the
244 algorithm have changed. I'm working on a research report that
245 updates the description of the algorithms to reflect the design
246 choices used in this implementation.
248 A set of slides show a high level overview of the algorithm and run
249 an example through the scalar evolution analyzer:
250 http://cri.ensmp.fr/~pop/gcc/mar04/slides.pdf
252 The slides that I have presented at the GCC Summit'04 are available
253 at: http://cri.ensmp.fr/~pop/gcc/20040604/gccsummit-lno-spop.pdf
258 #include "coretypes.h"
261 #include "gimple-pretty-print.h"
262 #include "basic-block.h"
263 #include "tree-ssa-alias.h"
264 #include "internal-fn.h"
265 #include "gimple-expr.h"
268 #include "gimplify.h"
269 #include "gimple-iterator.h"
270 #include "gimplify-me.h"
271 #include "gimple-ssa.h"
272 #include "tree-cfg.h"
273 #include "tree-phinodes.h"
274 #include "stringpool.h"
275 #include "tree-ssanames.h"
276 #include "tree-ssa-loop-ivopts.h"
277 #include "tree-ssa-loop-manip.h"
278 #include "tree-ssa-loop-niter.h"
279 #include "tree-ssa-loop.h"
280 #include "tree-ssa.h"
282 #include "tree-chrec.h"
283 #include "pointer-set.h"
284 #include "tree-affine.h"
285 #include "tree-scalar-evolution.h"
286 #include "dumpfile.h"
288 #include "tree-ssa-propagate.h"
289 #include "gimple-fold.h"
290 #include "gimplify-me.h"
292 static tree
analyze_scalar_evolution_1 (struct loop
*, tree
, tree
);
293 static tree
analyze_scalar_evolution_for_address_of (struct loop
*loop
,
296 /* The cached information about an SSA name with version NAME_VERSION,
297 claiming that below basic block with index INSTANTIATED_BELOW, the
298 value of the SSA name can be expressed as CHREC. */
300 struct GTY(()) scev_info_str
{
301 unsigned int name_version
;
302 int instantiated_below
;
306 /* Counters for the scev database. */
307 static unsigned nb_set_scev
= 0;
308 static unsigned nb_get_scev
= 0;
310 /* The following trees are unique elements. Thus the comparison of
311 another element to these elements should be done on the pointer to
312 these trees, and not on their value. */
314 /* The SSA_NAMEs that are not yet analyzed are qualified with NULL_TREE. */
315 tree chrec_not_analyzed_yet
;
317 /* Reserved to the cases where the analyzer has detected an
318 undecidable property at compile time. */
319 tree chrec_dont_know
;
321 /* When the analyzer has detected that a property will never
322 happen, then it qualifies it with chrec_known. */
325 static GTY ((param_is (struct scev_info_str
))) htab_t scalar_evolution_info
;
328 /* Constructs a new SCEV_INFO_STR structure for VAR and INSTANTIATED_BELOW. */
330 static inline struct scev_info_str
*
331 new_scev_info_str (basic_block instantiated_below
, tree var
)
333 struct scev_info_str
*res
;
335 res
= ggc_alloc
<scev_info_str
> ();
336 res
->name_version
= SSA_NAME_VERSION (var
);
337 res
->chrec
= chrec_not_analyzed_yet
;
338 res
->instantiated_below
= instantiated_below
->index
;
343 /* Computes a hash function for database element ELT. */
345 static inline hashval_t
346 hash_scev_info (const void *elt_
)
348 const struct scev_info_str
*elt
= (const struct scev_info_str
*) elt_
;
349 return elt
->name_version
^ elt
->instantiated_below
;
352 /* Compares database elements E1 and E2. */
355 eq_scev_info (const void *e1
, const void *e2
)
357 const struct scev_info_str
*elt1
= (const struct scev_info_str
*) e1
;
358 const struct scev_info_str
*elt2
= (const struct scev_info_str
*) e2
;
360 return (elt1
->name_version
== elt2
->name_version
361 && elt1
->instantiated_below
== elt2
->instantiated_below
);
364 /* Deletes database element E. */
367 del_scev_info (void *e
)
373 /* Get the scalar evolution of VAR for INSTANTIATED_BELOW basic block.
374 A first query on VAR returns chrec_not_analyzed_yet. */
377 find_var_scev_info (basic_block instantiated_below
, tree var
)
379 struct scev_info_str
*res
;
380 struct scev_info_str tmp
;
383 tmp
.name_version
= SSA_NAME_VERSION (var
);
384 tmp
.instantiated_below
= instantiated_below
->index
;
385 slot
= htab_find_slot (scalar_evolution_info
, &tmp
, INSERT
);
388 *slot
= new_scev_info_str (instantiated_below
, var
);
389 res
= (struct scev_info_str
*) *slot
;
394 /* Return true when CHREC contains symbolic names defined in
398 chrec_contains_symbols_defined_in_loop (const_tree chrec
, unsigned loop_nb
)
402 if (chrec
== NULL_TREE
)
405 if (is_gimple_min_invariant (chrec
))
408 if (TREE_CODE (chrec
) == SSA_NAME
)
411 loop_p def_loop
, loop
;
413 if (SSA_NAME_IS_DEFAULT_DEF (chrec
))
416 def
= SSA_NAME_DEF_STMT (chrec
);
417 def_loop
= loop_containing_stmt (def
);
418 loop
= get_loop (cfun
, loop_nb
);
420 if (def_loop
== NULL
)
423 if (loop
== def_loop
|| flow_loop_nested_p (loop
, def_loop
))
429 n
= TREE_OPERAND_LENGTH (chrec
);
430 for (i
= 0; i
< n
; i
++)
431 if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (chrec
, i
),
437 /* Return true when PHI is a loop-phi-node. */
440 loop_phi_node_p (gimple phi
)
442 /* The implementation of this function is based on the following
443 property: "all the loop-phi-nodes of a loop are contained in the
444 loop's header basic block". */
446 return loop_containing_stmt (phi
)->header
== gimple_bb (phi
);
449 /* Compute the scalar evolution for EVOLUTION_FN after crossing LOOP.
450 In general, in the case of multivariate evolutions we want to get
451 the evolution in different loops. LOOP specifies the level for
452 which to get the evolution.
456 | for (j = 0; j < 100; j++)
458 | for (k = 0; k < 100; k++)
460 | i = k + j; - Here the value of i is a function of j, k.
462 | ... = i - Here the value of i is a function of j.
464 | ... = i - Here the value of i is a scalar.
470 | i_1 = phi (i_0, i_2)
474 This loop has the same effect as:
475 LOOP_1 has the same effect as:
479 The overall effect of the loop, "i_0 + 20" in the previous example,
480 is obtained by passing in the parameters: LOOP = 1,
481 EVOLUTION_FN = {i_0, +, 2}_1.
485 compute_overall_effect_of_inner_loop (struct loop
*loop
, tree evolution_fn
)
489 if (evolution_fn
== chrec_dont_know
)
490 return chrec_dont_know
;
492 else if (TREE_CODE (evolution_fn
) == POLYNOMIAL_CHREC
)
494 struct loop
*inner_loop
= get_chrec_loop (evolution_fn
);
496 if (inner_loop
== loop
497 || flow_loop_nested_p (loop
, inner_loop
))
499 tree nb_iter
= number_of_latch_executions (inner_loop
);
501 if (nb_iter
== chrec_dont_know
)
502 return chrec_dont_know
;
507 /* evolution_fn is the evolution function in LOOP. Get
508 its value in the nb_iter-th iteration. */
509 res
= chrec_apply (inner_loop
->num
, evolution_fn
, nb_iter
);
511 if (chrec_contains_symbols_defined_in_loop (res
, loop
->num
))
512 res
= instantiate_parameters (loop
, res
);
514 /* Continue the computation until ending on a parent of LOOP. */
515 return compute_overall_effect_of_inner_loop (loop
, res
);
522 /* If the evolution function is an invariant, there is nothing to do. */
523 else if (no_evolution_in_loop_p (evolution_fn
, loop
->num
, &val
) && val
)
527 return chrec_dont_know
;
530 /* Associate CHREC to SCALAR. */
533 set_scalar_evolution (basic_block instantiated_below
, tree scalar
, tree chrec
)
537 if (TREE_CODE (scalar
) != SSA_NAME
)
540 scalar_info
= find_var_scev_info (instantiated_below
, scalar
);
544 if (dump_flags
& TDF_SCEV
)
546 fprintf (dump_file
, "(set_scalar_evolution \n");
547 fprintf (dump_file
, " instantiated_below = %d \n",
548 instantiated_below
->index
);
549 fprintf (dump_file
, " (scalar = ");
550 print_generic_expr (dump_file
, scalar
, 0);
551 fprintf (dump_file
, ")\n (scalar_evolution = ");
552 print_generic_expr (dump_file
, chrec
, 0);
553 fprintf (dump_file
, "))\n");
555 if (dump_flags
& TDF_STATS
)
559 *scalar_info
= chrec
;
562 /* Retrieve the chrec associated to SCALAR instantiated below
563 INSTANTIATED_BELOW block. */
566 get_scalar_evolution (basic_block instantiated_below
, tree scalar
)
572 if (dump_flags
& TDF_SCEV
)
574 fprintf (dump_file
, "(get_scalar_evolution \n");
575 fprintf (dump_file
, " (scalar = ");
576 print_generic_expr (dump_file
, scalar
, 0);
577 fprintf (dump_file
, ")\n");
579 if (dump_flags
& TDF_STATS
)
583 switch (TREE_CODE (scalar
))
586 res
= *find_var_scev_info (instantiated_below
, scalar
);
596 res
= chrec_not_analyzed_yet
;
600 if (dump_file
&& (dump_flags
& TDF_SCEV
))
602 fprintf (dump_file
, " (scalar_evolution = ");
603 print_generic_expr (dump_file
, res
, 0);
604 fprintf (dump_file
, "))\n");
610 /* Helper function for add_to_evolution. Returns the evolution
611 function for an assignment of the form "a = b + c", where "a" and
612 "b" are on the strongly connected component. CHREC_BEFORE is the
613 information that we already have collected up to this point.
614 TO_ADD is the evolution of "c".
616 When CHREC_BEFORE has an evolution part in LOOP_NB, add to this
617 evolution the expression TO_ADD, otherwise construct an evolution
618 part for this loop. */
621 add_to_evolution_1 (unsigned loop_nb
, tree chrec_before
, tree to_add
,
624 tree type
, left
, right
;
625 struct loop
*loop
= get_loop (cfun
, loop_nb
), *chloop
;
627 switch (TREE_CODE (chrec_before
))
629 case POLYNOMIAL_CHREC
:
630 chloop
= get_chrec_loop (chrec_before
);
632 || flow_loop_nested_p (chloop
, loop
))
636 type
= chrec_type (chrec_before
);
638 /* When there is no evolution part in this loop, build it. */
643 right
= SCALAR_FLOAT_TYPE_P (type
)
644 ? build_real (type
, dconst0
)
645 : build_int_cst (type
, 0);
649 var
= CHREC_VARIABLE (chrec_before
);
650 left
= CHREC_LEFT (chrec_before
);
651 right
= CHREC_RIGHT (chrec_before
);
654 to_add
= chrec_convert (type
, to_add
, at_stmt
);
655 right
= chrec_convert_rhs (type
, right
, at_stmt
);
656 right
= chrec_fold_plus (chrec_type (right
), right
, to_add
);
657 return build_polynomial_chrec (var
, left
, right
);
661 gcc_assert (flow_loop_nested_p (loop
, chloop
));
663 /* Search the evolution in LOOP_NB. */
664 left
= add_to_evolution_1 (loop_nb
, CHREC_LEFT (chrec_before
),
666 right
= CHREC_RIGHT (chrec_before
);
667 right
= chrec_convert_rhs (chrec_type (left
), right
, at_stmt
);
668 return build_polynomial_chrec (CHREC_VARIABLE (chrec_before
),
673 /* These nodes do not depend on a loop. */
674 if (chrec_before
== chrec_dont_know
)
675 return chrec_dont_know
;
678 right
= chrec_convert_rhs (chrec_type (left
), to_add
, at_stmt
);
679 return build_polynomial_chrec (loop_nb
, left
, right
);
683 /* Add TO_ADD to the evolution part of CHREC_BEFORE in the dimension
686 Description (provided for completeness, for those who read code in
687 a plane, and for my poor 62 bytes brain that would have forgotten
688 all this in the next two or three months):
690 The algorithm of translation of programs from the SSA representation
691 into the chrecs syntax is based on a pattern matching. After having
692 reconstructed the overall tree expression for a loop, there are only
693 two cases that can arise:
695 1. a = loop-phi (init, a + expr)
696 2. a = loop-phi (init, expr)
698 where EXPR is either a scalar constant with respect to the analyzed
699 loop (this is a degree 0 polynomial), or an expression containing
700 other loop-phi definitions (these are higher degree polynomials).
707 | a = phi (init, a + 5)
714 | a = phi (inita, 2 * b + 3)
715 | b = phi (initb, b + 1)
718 For the first case, the semantics of the SSA representation is:
720 | a (x) = init + \sum_{j = 0}^{x - 1} expr (j)
722 that is, there is a loop index "x" that determines the scalar value
723 of the variable during the loop execution. During the first
724 iteration, the value is that of the initial condition INIT, while
725 during the subsequent iterations, it is the sum of the initial
726 condition with the sum of all the values of EXPR from the initial
727 iteration to the before last considered iteration.
729 For the second case, the semantics of the SSA program is:
731 | a (x) = init, if x = 0;
732 | expr (x - 1), otherwise.
734 The second case corresponds to the PEELED_CHREC, whose syntax is
735 close to the syntax of a loop-phi-node:
737 | phi (init, expr) vs. (init, expr)_x
739 The proof of the translation algorithm for the first case is a
740 proof by structural induction based on the degree of EXPR.
743 When EXPR is a constant with respect to the analyzed loop, or in
744 other words when EXPR is a polynomial of degree 0, the evolution of
745 the variable A in the loop is an affine function with an initial
746 condition INIT, and a step EXPR. In order to show this, we start
747 from the semantics of the SSA representation:
749 f (x) = init + \sum_{j = 0}^{x - 1} expr (j)
751 and since "expr (j)" is a constant with respect to "j",
753 f (x) = init + x * expr
755 Finally, based on the semantics of the pure sum chrecs, by
756 identification we get the corresponding chrecs syntax:
758 f (x) = init * \binom{x}{0} + expr * \binom{x}{1}
759 f (x) -> {init, +, expr}_x
762 Suppose that EXPR is a polynomial of degree N with respect to the
763 analyzed loop_x for which we have already determined that it is
764 written under the chrecs syntax:
766 | expr (x) -> {b_0, +, b_1, +, ..., +, b_{n-1}} (x)
768 We start from the semantics of the SSA program:
770 | f (x) = init + \sum_{j = 0}^{x - 1} expr (j)
772 | f (x) = init + \sum_{j = 0}^{x - 1}
773 | (b_0 * \binom{j}{0} + ... + b_{n-1} * \binom{j}{n-1})
775 | f (x) = init + \sum_{j = 0}^{x - 1}
776 | \sum_{k = 0}^{n - 1} (b_k * \binom{j}{k})
778 | f (x) = init + \sum_{k = 0}^{n - 1}
779 | (b_k * \sum_{j = 0}^{x - 1} \binom{j}{k})
781 | f (x) = init + \sum_{k = 0}^{n - 1}
782 | (b_k * \binom{x}{k + 1})
784 | f (x) = init + b_0 * \binom{x}{1} + ...
785 | + b_{n-1} * \binom{x}{n}
787 | f (x) = init * \binom{x}{0} + b_0 * \binom{x}{1} + ...
788 | + b_{n-1} * \binom{x}{n}
791 And finally from the definition of the chrecs syntax, we identify:
792 | f (x) -> {init, +, b_0, +, ..., +, b_{n-1}}_x
794 This shows the mechanism that stands behind the add_to_evolution
795 function. An important point is that the use of symbolic
796 parameters avoids the need of an analysis schedule.
803 | a = phi (inita, a + 2 + b)
804 | b = phi (initb, b + 1)
807 When analyzing "a", the algorithm keeps "b" symbolically:
809 | a -> {inita, +, 2 + b}_1
811 Then, after instantiation, the analyzer ends on the evolution:
813 | a -> {inita, +, 2 + initb, +, 1}_1
818 add_to_evolution (unsigned loop_nb
, tree chrec_before
, enum tree_code code
,
819 tree to_add
, gimple at_stmt
)
821 tree type
= chrec_type (to_add
);
822 tree res
= NULL_TREE
;
824 if (to_add
== NULL_TREE
)
827 /* TO_ADD is either a scalar, or a parameter. TO_ADD is not
828 instantiated at this point. */
829 if (TREE_CODE (to_add
) == POLYNOMIAL_CHREC
)
830 /* This should not happen. */
831 return chrec_dont_know
;
833 if (dump_file
&& (dump_flags
& TDF_SCEV
))
835 fprintf (dump_file
, "(add_to_evolution \n");
836 fprintf (dump_file
, " (loop_nb = %d)\n", loop_nb
);
837 fprintf (dump_file
, " (chrec_before = ");
838 print_generic_expr (dump_file
, chrec_before
, 0);
839 fprintf (dump_file
, ")\n (to_add = ");
840 print_generic_expr (dump_file
, to_add
, 0);
841 fprintf (dump_file
, ")\n");
844 if (code
== MINUS_EXPR
)
845 to_add
= chrec_fold_multiply (type
, to_add
, SCALAR_FLOAT_TYPE_P (type
)
846 ? build_real (type
, dconstm1
)
847 : build_int_cst_type (type
, -1));
849 res
= add_to_evolution_1 (loop_nb
, chrec_before
, to_add
, at_stmt
);
851 if (dump_file
&& (dump_flags
& TDF_SCEV
))
853 fprintf (dump_file
, " (res = ");
854 print_generic_expr (dump_file
, res
, 0);
855 fprintf (dump_file
, "))\n");
863 /* This section selects the loops that will be good candidates for the
864 scalar evolution analysis. For the moment, greedily select all the
865 loop nests we could analyze. */
867 /* For a loop with a single exit edge, return the COND_EXPR that
868 guards the exit edge. If the expression is too difficult to
869 analyze, then give up. */
872 get_loop_exit_condition (const struct loop
*loop
)
875 edge exit_edge
= single_exit (loop
);
877 if (dump_file
&& (dump_flags
& TDF_SCEV
))
878 fprintf (dump_file
, "(get_loop_exit_condition \n ");
884 stmt
= last_stmt (exit_edge
->src
);
885 if (gimple_code (stmt
) == GIMPLE_COND
)
889 if (dump_file
&& (dump_flags
& TDF_SCEV
))
891 print_gimple_stmt (dump_file
, res
, 0, 0);
892 fprintf (dump_file
, ")\n");
899 /* Depth first search algorithm. */
901 typedef enum t_bool
{
908 static t_bool
follow_ssa_edge (struct loop
*loop
, gimple
, gimple
, tree
*, int);
910 /* Follow the ssa edge into the binary expression RHS0 CODE RHS1.
911 Return true if the strongly connected component has been found. */
914 follow_ssa_edge_binary (struct loop
*loop
, gimple at_stmt
,
915 tree type
, tree rhs0
, enum tree_code code
, tree rhs1
,
916 gimple halting_phi
, tree
*evolution_of_loop
, int limit
)
918 t_bool res
= t_false
;
923 case POINTER_PLUS_EXPR
:
925 if (TREE_CODE (rhs0
) == SSA_NAME
)
927 if (TREE_CODE (rhs1
) == SSA_NAME
)
929 /* Match an assignment under the form:
932 /* We want only assignments of form "name + name" contribute to
933 LIMIT, as the other cases do not necessarily contribute to
934 the complexity of the expression. */
937 evol
= *evolution_of_loop
;
938 res
= follow_ssa_edge
939 (loop
, SSA_NAME_DEF_STMT (rhs0
), halting_phi
, &evol
, limit
);
942 *evolution_of_loop
= add_to_evolution
944 chrec_convert (type
, evol
, at_stmt
),
945 code
, rhs1
, at_stmt
);
947 else if (res
== t_false
)
949 res
= follow_ssa_edge
950 (loop
, SSA_NAME_DEF_STMT (rhs1
), halting_phi
,
951 evolution_of_loop
, limit
);
954 *evolution_of_loop
= add_to_evolution
956 chrec_convert (type
, *evolution_of_loop
, at_stmt
),
957 code
, rhs0
, at_stmt
);
959 else if (res
== t_dont_know
)
960 *evolution_of_loop
= chrec_dont_know
;
963 else if (res
== t_dont_know
)
964 *evolution_of_loop
= chrec_dont_know
;
969 /* Match an assignment under the form:
971 res
= follow_ssa_edge
972 (loop
, SSA_NAME_DEF_STMT (rhs0
), halting_phi
,
973 evolution_of_loop
, limit
);
975 *evolution_of_loop
= add_to_evolution
976 (loop
->num
, chrec_convert (type
, *evolution_of_loop
,
978 code
, rhs1
, at_stmt
);
980 else if (res
== t_dont_know
)
981 *evolution_of_loop
= chrec_dont_know
;
985 else if (TREE_CODE (rhs1
) == SSA_NAME
)
987 /* Match an assignment under the form:
989 res
= follow_ssa_edge
990 (loop
, SSA_NAME_DEF_STMT (rhs1
), halting_phi
,
991 evolution_of_loop
, limit
);
993 *evolution_of_loop
= add_to_evolution
994 (loop
->num
, chrec_convert (type
, *evolution_of_loop
,
996 code
, rhs0
, at_stmt
);
998 else if (res
== t_dont_know
)
999 *evolution_of_loop
= chrec_dont_know
;
1003 /* Otherwise, match an assignment under the form:
1005 /* And there is nothing to do. */
1010 /* This case is under the form "opnd0 = rhs0 - rhs1". */
1011 if (TREE_CODE (rhs0
) == SSA_NAME
)
1013 /* Match an assignment under the form:
1016 /* We want only assignments of form "name - name" contribute to
1017 LIMIT, as the other cases do not necessarily contribute to
1018 the complexity of the expression. */
1019 if (TREE_CODE (rhs1
) == SSA_NAME
)
1022 res
= follow_ssa_edge (loop
, SSA_NAME_DEF_STMT (rhs0
), halting_phi
,
1023 evolution_of_loop
, limit
);
1025 *evolution_of_loop
= add_to_evolution
1026 (loop
->num
, chrec_convert (type
, *evolution_of_loop
, at_stmt
),
1027 MINUS_EXPR
, rhs1
, at_stmt
);
1029 else if (res
== t_dont_know
)
1030 *evolution_of_loop
= chrec_dont_know
;
1033 /* Otherwise, match an assignment under the form:
1035 /* And there is nothing to do. */
1046 /* Follow the ssa edge into the expression EXPR.
1047 Return true if the strongly connected component has been found. */
1050 follow_ssa_edge_expr (struct loop
*loop
, gimple at_stmt
, tree expr
,
1051 gimple halting_phi
, tree
*evolution_of_loop
, int limit
)
1053 enum tree_code code
= TREE_CODE (expr
);
1054 tree type
= TREE_TYPE (expr
), rhs0
, rhs1
;
1057 /* The EXPR is one of the following cases:
1061 - a POINTER_PLUS_EXPR,
1064 - other cases are not yet handled. */
1069 /* This assignment is under the form "a_1 = (cast) rhs. */
1070 res
= follow_ssa_edge_expr (loop
, at_stmt
, TREE_OPERAND (expr
, 0),
1071 halting_phi
, evolution_of_loop
, limit
);
1072 *evolution_of_loop
= chrec_convert (type
, *evolution_of_loop
, at_stmt
);
1076 /* This assignment is under the form "a_1 = 7". */
1081 /* This assignment is under the form: "a_1 = b_2". */
1082 res
= follow_ssa_edge
1083 (loop
, SSA_NAME_DEF_STMT (expr
), halting_phi
, evolution_of_loop
, limit
);
1086 case POINTER_PLUS_EXPR
:
1089 /* This case is under the form "rhs0 +- rhs1". */
1090 rhs0
= TREE_OPERAND (expr
, 0);
1091 rhs1
= TREE_OPERAND (expr
, 1);
1092 type
= TREE_TYPE (rhs0
);
1093 STRIP_USELESS_TYPE_CONVERSION (rhs0
);
1094 STRIP_USELESS_TYPE_CONVERSION (rhs1
);
1095 res
= follow_ssa_edge_binary (loop
, at_stmt
, type
, rhs0
, code
, rhs1
,
1096 halting_phi
, evolution_of_loop
, limit
);
1100 /* Handle &MEM[ptr + CST] which is equivalent to POINTER_PLUS_EXPR. */
1101 if (TREE_CODE (TREE_OPERAND (expr
, 0)) == MEM_REF
)
1103 expr
= TREE_OPERAND (expr
, 0);
1104 rhs0
= TREE_OPERAND (expr
, 0);
1105 rhs1
= TREE_OPERAND (expr
, 1);
1106 type
= TREE_TYPE (rhs0
);
1107 STRIP_USELESS_TYPE_CONVERSION (rhs0
);
1108 STRIP_USELESS_TYPE_CONVERSION (rhs1
);
1109 res
= follow_ssa_edge_binary (loop
, at_stmt
, type
,
1110 rhs0
, POINTER_PLUS_EXPR
, rhs1
,
1111 halting_phi
, evolution_of_loop
, limit
);
1118 /* This assignment is of the form: "a_1 = ASSERT_EXPR <a_2, ...>"
1119 It must be handled as a copy assignment of the form a_1 = a_2. */
1120 rhs0
= ASSERT_EXPR_VAR (expr
);
1121 if (TREE_CODE (rhs0
) == SSA_NAME
)
1122 res
= follow_ssa_edge (loop
, SSA_NAME_DEF_STMT (rhs0
),
1123 halting_phi
, evolution_of_loop
, limit
);
1136 /* Follow the ssa edge into the right hand side of an assignment STMT.
1137 Return true if the strongly connected component has been found. */
1140 follow_ssa_edge_in_rhs (struct loop
*loop
, gimple stmt
,
1141 gimple halting_phi
, tree
*evolution_of_loop
, int limit
)
1143 enum tree_code code
= gimple_assign_rhs_code (stmt
);
1144 tree type
= gimple_expr_type (stmt
), rhs1
, rhs2
;
1150 /* This assignment is under the form "a_1 = (cast) rhs. */
1151 res
= follow_ssa_edge_expr (loop
, stmt
, gimple_assign_rhs1 (stmt
),
1152 halting_phi
, evolution_of_loop
, limit
);
1153 *evolution_of_loop
= chrec_convert (type
, *evolution_of_loop
, stmt
);
1156 case POINTER_PLUS_EXPR
:
1159 rhs1
= gimple_assign_rhs1 (stmt
);
1160 rhs2
= gimple_assign_rhs2 (stmt
);
1161 type
= TREE_TYPE (rhs1
);
1162 res
= follow_ssa_edge_binary (loop
, stmt
, type
, rhs1
, code
, rhs2
,
1163 halting_phi
, evolution_of_loop
, limit
);
1167 if (get_gimple_rhs_class (code
) == GIMPLE_SINGLE_RHS
)
1168 res
= follow_ssa_edge_expr (loop
, stmt
, gimple_assign_rhs1 (stmt
),
1169 halting_phi
, evolution_of_loop
, limit
);
1178 /* Checks whether the I-th argument of a PHI comes from a backedge. */
1181 backedge_phi_arg_p (gimple phi
, int i
)
1183 const_edge e
= gimple_phi_arg_edge (phi
, i
);
1185 /* We would in fact like to test EDGE_DFS_BACK here, but we do not care
1186 about updating it anywhere, and this should work as well most of the
1188 if (e
->flags
& EDGE_IRREDUCIBLE_LOOP
)
1194 /* Helper function for one branch of the condition-phi-node. Return
1195 true if the strongly connected component has been found following
1198 static inline t_bool
1199 follow_ssa_edge_in_condition_phi_branch (int i
,
1201 gimple condition_phi
,
1203 tree
*evolution_of_branch
,
1204 tree init_cond
, int limit
)
1206 tree branch
= PHI_ARG_DEF (condition_phi
, i
);
1207 *evolution_of_branch
= chrec_dont_know
;
1209 /* Do not follow back edges (they must belong to an irreducible loop, which
1210 we really do not want to worry about). */
1211 if (backedge_phi_arg_p (condition_phi
, i
))
1214 if (TREE_CODE (branch
) == SSA_NAME
)
1216 *evolution_of_branch
= init_cond
;
1217 return follow_ssa_edge (loop
, SSA_NAME_DEF_STMT (branch
), halting_phi
,
1218 evolution_of_branch
, limit
);
1221 /* This case occurs when one of the condition branches sets
1222 the variable to a constant: i.e. a phi-node like
1223 "a_2 = PHI <a_7(5), 2(6)>;".
1225 FIXME: This case have to be refined correctly:
1226 in some cases it is possible to say something better than
1227 chrec_dont_know, for example using a wrap-around notation. */
1231 /* This function merges the branches of a condition-phi-node in a
1235 follow_ssa_edge_in_condition_phi (struct loop
*loop
,
1236 gimple condition_phi
,
1238 tree
*evolution_of_loop
, int limit
)
1241 tree init
= *evolution_of_loop
;
1242 tree evolution_of_branch
;
1243 t_bool res
= follow_ssa_edge_in_condition_phi_branch (0, loop
, condition_phi
,
1245 &evolution_of_branch
,
1247 if (res
== t_false
|| res
== t_dont_know
)
1250 *evolution_of_loop
= evolution_of_branch
;
1252 n
= gimple_phi_num_args (condition_phi
);
1253 for (i
= 1; i
< n
; i
++)
1255 /* Quickly give up when the evolution of one of the branches is
1257 if (*evolution_of_loop
== chrec_dont_know
)
1260 /* Increase the limit by the PHI argument number to avoid exponential
1261 time and memory complexity. */
1262 res
= follow_ssa_edge_in_condition_phi_branch (i
, loop
, condition_phi
,
1264 &evolution_of_branch
,
1266 if (res
== t_false
|| res
== t_dont_know
)
1269 *evolution_of_loop
= chrec_merge (*evolution_of_loop
,
1270 evolution_of_branch
);
1276 /* Follow an SSA edge in an inner loop. It computes the overall
1277 effect of the loop, and following the symbolic initial conditions,
1278 it follows the edges in the parent loop. The inner loop is
1279 considered as a single statement. */
1282 follow_ssa_edge_inner_loop_phi (struct loop
*outer_loop
,
1283 gimple loop_phi_node
,
1285 tree
*evolution_of_loop
, int limit
)
1287 struct loop
*loop
= loop_containing_stmt (loop_phi_node
);
1288 tree ev
= analyze_scalar_evolution (loop
, PHI_RESULT (loop_phi_node
));
1290 /* Sometimes, the inner loop is too difficult to analyze, and the
1291 result of the analysis is a symbolic parameter. */
1292 if (ev
== PHI_RESULT (loop_phi_node
))
1294 t_bool res
= t_false
;
1295 int i
, n
= gimple_phi_num_args (loop_phi_node
);
1297 for (i
= 0; i
< n
; i
++)
1299 tree arg
= PHI_ARG_DEF (loop_phi_node
, i
);
1302 /* Follow the edges that exit the inner loop. */
1303 bb
= gimple_phi_arg_edge (loop_phi_node
, i
)->src
;
1304 if (!flow_bb_inside_loop_p (loop
, bb
))
1305 res
= follow_ssa_edge_expr (outer_loop
, loop_phi_node
,
1307 evolution_of_loop
, limit
);
1312 /* If the path crosses this loop-phi, give up. */
1314 *evolution_of_loop
= chrec_dont_know
;
1319 /* Otherwise, compute the overall effect of the inner loop. */
1320 ev
= compute_overall_effect_of_inner_loop (loop
, ev
);
1321 return follow_ssa_edge_expr (outer_loop
, loop_phi_node
, ev
, halting_phi
,
1322 evolution_of_loop
, limit
);
1325 /* Follow an SSA edge from a loop-phi-node to itself, constructing a
1326 path that is analyzed on the return walk. */
1329 follow_ssa_edge (struct loop
*loop
, gimple def
, gimple halting_phi
,
1330 tree
*evolution_of_loop
, int limit
)
1332 struct loop
*def_loop
;
1334 if (gimple_nop_p (def
))
1337 /* Give up if the path is longer than the MAX that we allow. */
1338 if (limit
> PARAM_VALUE (PARAM_SCEV_MAX_EXPR_COMPLEXITY
))
1341 def_loop
= loop_containing_stmt (def
);
1343 switch (gimple_code (def
))
1346 if (!loop_phi_node_p (def
))
1347 /* DEF is a condition-phi-node. Follow the branches, and
1348 record their evolutions. Finally, merge the collected
1349 information and set the approximation to the main
1351 return follow_ssa_edge_in_condition_phi
1352 (loop
, def
, halting_phi
, evolution_of_loop
, limit
);
1354 /* When the analyzed phi is the halting_phi, the
1355 depth-first search is over: we have found a path from
1356 the halting_phi to itself in the loop. */
1357 if (def
== halting_phi
)
1360 /* Otherwise, the evolution of the HALTING_PHI depends
1361 on the evolution of another loop-phi-node, i.e. the
1362 evolution function is a higher degree polynomial. */
1363 if (def_loop
== loop
)
1367 if (flow_loop_nested_p (loop
, def_loop
))
1368 return follow_ssa_edge_inner_loop_phi
1369 (loop
, def
, halting_phi
, evolution_of_loop
, limit
+ 1);
1375 return follow_ssa_edge_in_rhs (loop
, def
, halting_phi
,
1376 evolution_of_loop
, limit
);
1379 /* At this level of abstraction, the program is just a set
1380 of GIMPLE_ASSIGNs and PHI_NODEs. In principle there is no
1381 other node to be handled. */
1387 /* Simplify PEELED_CHREC represented by (init_cond, arg) in LOOP.
1388 Handle below case and return the corresponding POLYNOMIAL_CHREC:
1390 # i_17 = PHI <i_13(5), 0(3)>
1391 # _20 = PHI <_5(5), start_4(D)(3)>
1394 _5 = start_4(D) + i_13;
1396 Though variable _20 appears as a PEELED_CHREC in the form of
1397 (start_4, _5)_LOOP, it's a POLYNOMIAL_CHREC like {start_4, 1}_LOOP.
1402 simplify_peeled_chrec (struct loop
*loop
, tree arg
, tree init_cond
)
1404 aff_tree aff1
, aff2
;
1405 tree ev
, left
, right
, type
, step_val
;
1406 pointer_map_t
*peeled_chrec_map
= NULL
;
1408 ev
= instantiate_parameters (loop
, analyze_scalar_evolution (loop
, arg
));
1409 if (ev
== NULL_TREE
|| TREE_CODE (ev
) != POLYNOMIAL_CHREC
)
1410 return chrec_dont_know
;
1412 left
= CHREC_LEFT (ev
);
1413 right
= CHREC_RIGHT (ev
);
1414 type
= TREE_TYPE (left
);
1415 step_val
= chrec_fold_plus (type
, init_cond
, right
);
1417 /* Transform (init, {left, right}_LOOP)_LOOP to {init, right}_LOOP
1418 if "left" equals to "init + right". */
1419 if (operand_equal_p (left
, step_val
, 0))
1421 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1422 fprintf (dump_file
, "Simplify PEELED_CHREC into POLYNOMIAL_CHREC.\n");
1424 return build_polynomial_chrec (loop
->num
, init_cond
, right
);
1427 /* Try harder to check if they are equal. */
1428 tree_to_aff_combination_expand (left
, type
, &aff1
, &peeled_chrec_map
);
1429 tree_to_aff_combination_expand (step_val
, type
, &aff2
, &peeled_chrec_map
);
1430 free_affine_expand_cache (&peeled_chrec_map
);
1431 aff_combination_scale (&aff2
, -1);
1432 aff_combination_add (&aff1
, &aff2
);
1434 /* Transform (init, {left, right}_LOOP)_LOOP to {init, right}_LOOP
1435 if "left" equals to "init + right". */
1436 if (aff_combination_zero_p (&aff1
))
1438 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1439 fprintf (dump_file
, "Simplify PEELED_CHREC into POLYNOMIAL_CHREC.\n");
1441 return build_polynomial_chrec (loop
->num
, init_cond
, right
);
1443 return chrec_dont_know
;
1446 /* Given a LOOP_PHI_NODE, this function determines the evolution
1447 function from LOOP_PHI_NODE to LOOP_PHI_NODE in the loop. */
1450 analyze_evolution_in_loop (gimple loop_phi_node
,
1453 int i
, n
= gimple_phi_num_args (loop_phi_node
);
1454 tree evolution_function
= chrec_not_analyzed_yet
;
1455 struct loop
*loop
= loop_containing_stmt (loop_phi_node
);
1457 static bool simplify_peeled_chrec_p
= true;
1459 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1461 fprintf (dump_file
, "(analyze_evolution_in_loop \n");
1462 fprintf (dump_file
, " (loop_phi_node = ");
1463 print_gimple_stmt (dump_file
, loop_phi_node
, 0, 0);
1464 fprintf (dump_file
, ")\n");
1467 for (i
= 0; i
< n
; i
++)
1469 tree arg
= PHI_ARG_DEF (loop_phi_node
, i
);
1474 /* Select the edges that enter the loop body. */
1475 bb
= gimple_phi_arg_edge (loop_phi_node
, i
)->src
;
1476 if (!flow_bb_inside_loop_p (loop
, bb
))
1479 if (TREE_CODE (arg
) == SSA_NAME
)
1483 ssa_chain
= SSA_NAME_DEF_STMT (arg
);
1485 /* Pass in the initial condition to the follow edge function. */
1487 res
= follow_ssa_edge (loop
, ssa_chain
, loop_phi_node
, &ev_fn
, 0);
1489 /* If ev_fn has no evolution in the inner loop, and the
1490 init_cond is not equal to ev_fn, then we have an
1491 ambiguity between two possible values, as we cannot know
1492 the number of iterations at this point. */
1493 if (TREE_CODE (ev_fn
) != POLYNOMIAL_CHREC
1494 && no_evolution_in_loop_p (ev_fn
, loop
->num
, &val
) && val
1495 && !operand_equal_p (init_cond
, ev_fn
, 0))
1496 ev_fn
= chrec_dont_know
;
1501 /* When it is impossible to go back on the same
1502 loop_phi_node by following the ssa edges, the
1503 evolution is represented by a peeled chrec, i.e. the
1504 first iteration, EV_FN has the value INIT_COND, then
1505 all the other iterations it has the value of ARG.
1506 For the moment, PEELED_CHREC nodes are not built. */
1509 ev_fn
= chrec_dont_know
;
1510 /* Try to recognize POLYNOMIAL_CHREC which appears in
1511 the form of PEELED_CHREC, but guard the process with
1512 a bool variable to keep the analyzer from infinite
1513 recurrence for real PEELED_RECs. */
1514 if (simplify_peeled_chrec_p
&& TREE_CODE (arg
) == SSA_NAME
)
1516 simplify_peeled_chrec_p
= false;
1517 ev_fn
= simplify_peeled_chrec (loop
, arg
, init_cond
);
1518 simplify_peeled_chrec_p
= true;
1522 /* When there are multiple back edges of the loop (which in fact never
1523 happens currently, but nevertheless), merge their evolutions. */
1524 evolution_function
= chrec_merge (evolution_function
, ev_fn
);
1527 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1529 fprintf (dump_file
, " (evolution_function = ");
1530 print_generic_expr (dump_file
, evolution_function
, 0);
1531 fprintf (dump_file
, "))\n");
1534 return evolution_function
;
1537 /* Given a loop-phi-node, return the initial conditions of the
1538 variable on entry of the loop. When the CCP has propagated
1539 constants into the loop-phi-node, the initial condition is
1540 instantiated, otherwise the initial condition is kept symbolic.
1541 This analyzer does not analyze the evolution outside the current
1542 loop, and leaves this task to the on-demand tree reconstructor. */
1545 analyze_initial_condition (gimple loop_phi_node
)
1548 tree init_cond
= chrec_not_analyzed_yet
;
1549 struct loop
*loop
= loop_containing_stmt (loop_phi_node
);
1551 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1553 fprintf (dump_file
, "(analyze_initial_condition \n");
1554 fprintf (dump_file
, " (loop_phi_node = \n");
1555 print_gimple_stmt (dump_file
, loop_phi_node
, 0, 0);
1556 fprintf (dump_file
, ")\n");
1559 n
= gimple_phi_num_args (loop_phi_node
);
1560 for (i
= 0; i
< n
; i
++)
1562 tree branch
= PHI_ARG_DEF (loop_phi_node
, i
);
1563 basic_block bb
= gimple_phi_arg_edge (loop_phi_node
, i
)->src
;
1565 /* When the branch is oriented to the loop's body, it does
1566 not contribute to the initial condition. */
1567 if (flow_bb_inside_loop_p (loop
, bb
))
1570 if (init_cond
== chrec_not_analyzed_yet
)
1576 if (TREE_CODE (branch
) == SSA_NAME
)
1578 init_cond
= chrec_dont_know
;
1582 init_cond
= chrec_merge (init_cond
, branch
);
1585 /* Ooops -- a loop without an entry??? */
1586 if (init_cond
== chrec_not_analyzed_yet
)
1587 init_cond
= chrec_dont_know
;
1589 /* During early loop unrolling we do not have fully constant propagated IL.
1590 Handle degenerate PHIs here to not miss important unrollings. */
1591 if (TREE_CODE (init_cond
) == SSA_NAME
)
1593 gimple def
= SSA_NAME_DEF_STMT (init_cond
);
1595 if (gimple_code (def
) == GIMPLE_PHI
1596 && (res
= degenerate_phi_result (def
)) != NULL_TREE
1597 /* Only allow invariants here, otherwise we may break
1598 loop-closed SSA form. */
1599 && is_gimple_min_invariant (res
))
1603 if (dump_file
&& (dump_flags
& TDF_SCEV
))
1605 fprintf (dump_file
, " (init_cond = ");
1606 print_generic_expr (dump_file
, init_cond
, 0);
1607 fprintf (dump_file
, "))\n");
1613 /* Analyze the scalar evolution for LOOP_PHI_NODE. */
1616 interpret_loop_phi (struct loop
*loop
, gimple loop_phi_node
)
1619 struct loop
*phi_loop
= loop_containing_stmt (loop_phi_node
);
1622 if (phi_loop
!= loop
)
1624 struct loop
*subloop
;
1625 tree evolution_fn
= analyze_scalar_evolution
1626 (phi_loop
, PHI_RESULT (loop_phi_node
));
1628 /* Dive one level deeper. */
1629 subloop
= superloop_at_depth (phi_loop
, loop_depth (loop
) + 1);
1631 /* Interpret the subloop. */
1632 res
= compute_overall_effect_of_inner_loop (subloop
, evolution_fn
);
1636 /* Otherwise really interpret the loop phi. */
1637 init_cond
= analyze_initial_condition (loop_phi_node
);
1638 res
= analyze_evolution_in_loop (loop_phi_node
, init_cond
);
1640 /* Verify we maintained the correct initial condition throughout
1641 possible conversions in the SSA chain. */
1642 if (res
!= chrec_dont_know
)
1644 tree new_init
= res
;
1645 if (CONVERT_EXPR_P (res
)
1646 && TREE_CODE (TREE_OPERAND (res
, 0)) == POLYNOMIAL_CHREC
)
1647 new_init
= fold_convert (TREE_TYPE (res
),
1648 CHREC_LEFT (TREE_OPERAND (res
, 0)));
1649 else if (TREE_CODE (res
) == POLYNOMIAL_CHREC
)
1650 new_init
= CHREC_LEFT (res
);
1651 STRIP_USELESS_TYPE_CONVERSION (new_init
);
1652 if (TREE_CODE (new_init
) == POLYNOMIAL_CHREC
1653 || !operand_equal_p (init_cond
, new_init
, 0))
1654 return chrec_dont_know
;
1660 /* This function merges the branches of a condition-phi-node,
1661 contained in the outermost loop, and whose arguments are already
1665 interpret_condition_phi (struct loop
*loop
, gimple condition_phi
)
1667 int i
, n
= gimple_phi_num_args (condition_phi
);
1668 tree res
= chrec_not_analyzed_yet
;
1670 for (i
= 0; i
< n
; i
++)
1674 if (backedge_phi_arg_p (condition_phi
, i
))
1676 res
= chrec_dont_know
;
1680 branch_chrec
= analyze_scalar_evolution
1681 (loop
, PHI_ARG_DEF (condition_phi
, i
));
1683 res
= chrec_merge (res
, branch_chrec
);
1689 /* Interpret the operation RHS1 OP RHS2. If we didn't
1690 analyze this node before, follow the definitions until ending
1691 either on an analyzed GIMPLE_ASSIGN, or on a loop-phi-node. On the
1692 return path, this function propagates evolutions (ala constant copy
1693 propagation). OPND1 is not a GIMPLE expression because we could
1694 analyze the effect of an inner loop: see interpret_loop_phi. */
1697 interpret_rhs_expr (struct loop
*loop
, gimple at_stmt
,
1698 tree type
, tree rhs1
, enum tree_code code
, tree rhs2
)
1700 tree res
, chrec1
, chrec2
;
1703 if (get_gimple_rhs_class (code
) == GIMPLE_SINGLE_RHS
)
1705 if (is_gimple_min_invariant (rhs1
))
1706 return chrec_convert (type
, rhs1
, at_stmt
);
1708 if (code
== SSA_NAME
)
1709 return chrec_convert (type
, analyze_scalar_evolution (loop
, rhs1
),
1712 if (code
== ASSERT_EXPR
)
1714 rhs1
= ASSERT_EXPR_VAR (rhs1
);
1715 return chrec_convert (type
, analyze_scalar_evolution (loop
, rhs1
),
1723 if (TREE_CODE (TREE_OPERAND (rhs1
, 0)) == MEM_REF
1724 || handled_component_p (TREE_OPERAND (rhs1
, 0)))
1726 enum machine_mode mode
;
1727 HOST_WIDE_INT bitsize
, bitpos
;
1734 base
= get_inner_reference (TREE_OPERAND (rhs1
, 0),
1735 &bitsize
, &bitpos
, &offset
,
1736 &mode
, &unsignedp
, &volatilep
, false);
1738 if (TREE_CODE (base
) == MEM_REF
)
1740 rhs2
= TREE_OPERAND (base
, 1);
1741 rhs1
= TREE_OPERAND (base
, 0);
1743 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1744 chrec2
= analyze_scalar_evolution (loop
, rhs2
);
1745 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1746 chrec2
= chrec_convert (TREE_TYPE (rhs2
), chrec2
, at_stmt
);
1747 chrec1
= instantiate_parameters (loop
, chrec1
);
1748 chrec2
= instantiate_parameters (loop
, chrec2
);
1749 res
= chrec_fold_plus (type
, chrec1
, chrec2
);
1753 chrec1
= analyze_scalar_evolution_for_address_of (loop
, base
);
1754 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1758 if (offset
!= NULL_TREE
)
1760 chrec2
= analyze_scalar_evolution (loop
, offset
);
1761 chrec2
= chrec_convert (TREE_TYPE (offset
), chrec2
, at_stmt
);
1762 chrec2
= instantiate_parameters (loop
, chrec2
);
1763 res
= chrec_fold_plus (type
, res
, chrec2
);
1768 gcc_assert ((bitpos
% BITS_PER_UNIT
) == 0);
1770 unitpos
= size_int (bitpos
/ BITS_PER_UNIT
);
1771 chrec3
= analyze_scalar_evolution (loop
, unitpos
);
1772 chrec3
= chrec_convert (TREE_TYPE (unitpos
), chrec3
, at_stmt
);
1773 chrec3
= instantiate_parameters (loop
, chrec3
);
1774 res
= chrec_fold_plus (type
, res
, chrec3
);
1778 res
= chrec_dont_know
;
1781 case POINTER_PLUS_EXPR
:
1782 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1783 chrec2
= analyze_scalar_evolution (loop
, rhs2
);
1784 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1785 chrec2
= chrec_convert (TREE_TYPE (rhs2
), chrec2
, at_stmt
);
1786 chrec1
= instantiate_parameters (loop
, chrec1
);
1787 chrec2
= instantiate_parameters (loop
, chrec2
);
1788 res
= chrec_fold_plus (type
, chrec1
, chrec2
);
1792 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1793 chrec2
= analyze_scalar_evolution (loop
, rhs2
);
1794 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1795 chrec2
= chrec_convert (type
, chrec2
, at_stmt
);
1796 chrec1
= instantiate_parameters (loop
, chrec1
);
1797 chrec2
= instantiate_parameters (loop
, chrec2
);
1798 res
= chrec_fold_plus (type
, chrec1
, chrec2
);
1802 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1803 chrec2
= analyze_scalar_evolution (loop
, rhs2
);
1804 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1805 chrec2
= chrec_convert (type
, chrec2
, at_stmt
);
1806 chrec1
= instantiate_parameters (loop
, chrec1
);
1807 chrec2
= instantiate_parameters (loop
, chrec2
);
1808 res
= chrec_fold_minus (type
, chrec1
, chrec2
);
1812 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1813 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1814 /* TYPE may be integer, real or complex, so use fold_convert. */
1815 chrec1
= instantiate_parameters (loop
, chrec1
);
1816 res
= chrec_fold_multiply (type
, chrec1
,
1817 fold_convert (type
, integer_minus_one_node
));
1821 /* Handle ~X as -1 - X. */
1822 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1823 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1824 chrec1
= instantiate_parameters (loop
, chrec1
);
1825 res
= chrec_fold_minus (type
,
1826 fold_convert (type
, integer_minus_one_node
),
1831 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1832 chrec2
= analyze_scalar_evolution (loop
, rhs2
);
1833 chrec1
= chrec_convert (type
, chrec1
, at_stmt
);
1834 chrec2
= chrec_convert (type
, chrec2
, at_stmt
);
1835 chrec1
= instantiate_parameters (loop
, chrec1
);
1836 chrec2
= instantiate_parameters (loop
, chrec2
);
1837 res
= chrec_fold_multiply (type
, chrec1
, chrec2
);
1841 /* In case we have a truncation of a widened operation that in
1842 the truncated type has undefined overflow behavior analyze
1843 the operation done in an unsigned type of the same precision
1844 as the final truncation. We cannot derive a scalar evolution
1845 for the widened operation but for the truncated result. */
1846 if (TREE_CODE (type
) == INTEGER_TYPE
1847 && TREE_CODE (TREE_TYPE (rhs1
)) == INTEGER_TYPE
1848 && TYPE_PRECISION (type
) < TYPE_PRECISION (TREE_TYPE (rhs1
))
1849 && TYPE_OVERFLOW_UNDEFINED (type
)
1850 && TREE_CODE (rhs1
) == SSA_NAME
1851 && (def
= SSA_NAME_DEF_STMT (rhs1
))
1852 && is_gimple_assign (def
)
1853 && TREE_CODE_CLASS (gimple_assign_rhs_code (def
)) == tcc_binary
1854 && TREE_CODE (gimple_assign_rhs2 (def
)) == INTEGER_CST
)
1856 tree utype
= unsigned_type_for (type
);
1857 chrec1
= interpret_rhs_expr (loop
, at_stmt
, utype
,
1858 gimple_assign_rhs1 (def
),
1859 gimple_assign_rhs_code (def
),
1860 gimple_assign_rhs2 (def
));
1863 chrec1
= analyze_scalar_evolution (loop
, rhs1
);
1864 res
= chrec_convert (type
, chrec1
, at_stmt
);
1868 res
= chrec_dont_know
;
1875 /* Interpret the expression EXPR. */
1878 interpret_expr (struct loop
*loop
, gimple at_stmt
, tree expr
)
1880 enum tree_code code
;
1881 tree type
= TREE_TYPE (expr
), op0
, op1
;
1883 if (automatically_generated_chrec_p (expr
))
1886 if (TREE_CODE (expr
) == POLYNOMIAL_CHREC
1887 || get_gimple_rhs_class (TREE_CODE (expr
)) == GIMPLE_TERNARY_RHS
)
1888 return chrec_dont_know
;
1890 extract_ops_from_tree (expr
, &code
, &op0
, &op1
);
1892 return interpret_rhs_expr (loop
, at_stmt
, type
,
1896 /* Interpret the rhs of the assignment STMT. */
1899 interpret_gimple_assign (struct loop
*loop
, gimple stmt
)
1901 tree type
= TREE_TYPE (gimple_assign_lhs (stmt
));
1902 enum tree_code code
= gimple_assign_rhs_code (stmt
);
1904 return interpret_rhs_expr (loop
, stmt
, type
,
1905 gimple_assign_rhs1 (stmt
), code
,
1906 gimple_assign_rhs2 (stmt
));
1911 /* This section contains all the entry points:
1912 - number_of_iterations_in_loop,
1913 - analyze_scalar_evolution,
1914 - instantiate_parameters.
1917 /* Compute and return the evolution function in WRTO_LOOP, the nearest
1918 common ancestor of DEF_LOOP and USE_LOOP. */
1921 compute_scalar_evolution_in_loop (struct loop
*wrto_loop
,
1922 struct loop
*def_loop
,
1928 if (def_loop
== wrto_loop
)
1931 def_loop
= superloop_at_depth (def_loop
, loop_depth (wrto_loop
) + 1);
1932 res
= compute_overall_effect_of_inner_loop (def_loop
, ev
);
1934 if (no_evolution_in_loop_p (res
, wrto_loop
->num
, &val
) && val
)
1937 return analyze_scalar_evolution_1 (wrto_loop
, res
, chrec_not_analyzed_yet
);
1940 /* Helper recursive function. */
1943 analyze_scalar_evolution_1 (struct loop
*loop
, tree var
, tree res
)
1945 tree type
= TREE_TYPE (var
);
1948 struct loop
*def_loop
;
1950 if (loop
== NULL
|| TREE_CODE (type
) == VECTOR_TYPE
)
1951 return chrec_dont_know
;
1953 if (TREE_CODE (var
) != SSA_NAME
)
1954 return interpret_expr (loop
, NULL
, var
);
1956 def
= SSA_NAME_DEF_STMT (var
);
1957 bb
= gimple_bb (def
);
1958 def_loop
= bb
? bb
->loop_father
: NULL
;
1961 || !flow_bb_inside_loop_p (loop
, bb
))
1963 /* Keep the symbolic form. */
1968 if (res
!= chrec_not_analyzed_yet
)
1970 if (loop
!= bb
->loop_father
)
1971 res
= compute_scalar_evolution_in_loop
1972 (find_common_loop (loop
, bb
->loop_father
), bb
->loop_father
, res
);
1977 if (loop
!= def_loop
)
1979 res
= analyze_scalar_evolution_1 (def_loop
, var
, chrec_not_analyzed_yet
);
1980 res
= compute_scalar_evolution_in_loop (loop
, def_loop
, res
);
1985 switch (gimple_code (def
))
1988 res
= interpret_gimple_assign (loop
, def
);
1992 if (loop_phi_node_p (def
))
1993 res
= interpret_loop_phi (loop
, def
);
1995 res
= interpret_condition_phi (loop
, def
);
1999 res
= chrec_dont_know
;
2005 /* Keep the symbolic form. */
2006 if (res
== chrec_dont_know
)
2009 if (loop
== def_loop
)
2010 set_scalar_evolution (block_before_loop (loop
), var
, res
);
2015 /* Analyzes and returns the scalar evolution of the ssa_name VAR in
2016 LOOP. LOOP is the loop in which the variable is used.
2018 Example of use: having a pointer VAR to a SSA_NAME node, STMT a
2019 pointer to the statement that uses this variable, in order to
2020 determine the evolution function of the variable, use the following
2023 loop_p loop = loop_containing_stmt (stmt);
2024 tree chrec_with_symbols = analyze_scalar_evolution (loop, var);
2025 tree chrec_instantiated = instantiate_parameters (loop, chrec_with_symbols);
2029 analyze_scalar_evolution (struct loop
*loop
, tree var
)
2033 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2035 fprintf (dump_file
, "(analyze_scalar_evolution \n");
2036 fprintf (dump_file
, " (loop_nb = %d)\n", loop
->num
);
2037 fprintf (dump_file
, " (scalar = ");
2038 print_generic_expr (dump_file
, var
, 0);
2039 fprintf (dump_file
, ")\n");
2042 res
= get_scalar_evolution (block_before_loop (loop
), var
);
2043 res
= analyze_scalar_evolution_1 (loop
, var
, res
);
2045 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2046 fprintf (dump_file
, ")\n");
2051 /* Analyzes and returns the scalar evolution of VAR address in LOOP. */
2054 analyze_scalar_evolution_for_address_of (struct loop
*loop
, tree var
)
2056 return analyze_scalar_evolution (loop
, build_fold_addr_expr (var
));
2059 /* Analyze scalar evolution of use of VERSION in USE_LOOP with respect to
2060 WRTO_LOOP (which should be a superloop of USE_LOOP)
2062 FOLDED_CASTS is set to true if resolve_mixers used
2063 chrec_convert_aggressive (TODO -- not really, we are way too conservative
2064 at the moment in order to keep things simple).
2066 To illustrate the meaning of USE_LOOP and WRTO_LOOP, consider the following
2069 for (i = 0; i < 100; i++) -- loop 1
2071 for (j = 0; j < 100; j++) -- loop 2
2078 for (t = 0; t < 100; t++) -- loop 3
2085 Both k1 and k2 are invariants in loop3, thus
2086 analyze_scalar_evolution_in_loop (loop3, loop3, k1) = k1
2087 analyze_scalar_evolution_in_loop (loop3, loop3, k2) = k2
2089 As they are invariant, it does not matter whether we consider their
2090 usage in loop 3 or loop 2, hence
2091 analyze_scalar_evolution_in_loop (loop2, loop3, k1) =
2092 analyze_scalar_evolution_in_loop (loop2, loop2, k1) = i
2093 analyze_scalar_evolution_in_loop (loop2, loop3, k2) =
2094 analyze_scalar_evolution_in_loop (loop2, loop2, k2) = [0,+,1]_2
2096 Similarly for their evolutions with respect to loop 1. The values of K2
2097 in the use in loop 2 vary independently on loop 1, thus we cannot express
2098 the evolution with respect to loop 1:
2099 analyze_scalar_evolution_in_loop (loop1, loop3, k1) =
2100 analyze_scalar_evolution_in_loop (loop1, loop2, k1) = [0,+,1]_1
2101 analyze_scalar_evolution_in_loop (loop1, loop3, k2) =
2102 analyze_scalar_evolution_in_loop (loop1, loop2, k2) = dont_know
2104 The value of k2 in the use in loop 1 is known, though:
2105 analyze_scalar_evolution_in_loop (loop1, loop1, k1) = [0,+,1]_1
2106 analyze_scalar_evolution_in_loop (loop1, loop1, k2) = 100
2110 analyze_scalar_evolution_in_loop (struct loop
*wrto_loop
, struct loop
*use_loop
,
2111 tree version
, bool *folded_casts
)
2114 tree ev
= version
, tmp
;
2116 /* We cannot just do
2118 tmp = analyze_scalar_evolution (use_loop, version);
2119 ev = resolve_mixers (wrto_loop, tmp);
2121 as resolve_mixers would query the scalar evolution with respect to
2122 wrto_loop. For example, in the situation described in the function
2123 comment, suppose that wrto_loop = loop1, use_loop = loop3 and
2126 analyze_scalar_evolution (use_loop, version) = k2
2128 and resolve_mixers (loop1, k2) finds that the value of k2 in loop 1
2129 is 100, which is a wrong result, since we are interested in the
2132 Instead, we need to proceed from use_loop to wrto_loop loop by loop,
2133 each time checking that there is no evolution in the inner loop. */
2136 *folded_casts
= false;
2139 tmp
= analyze_scalar_evolution (use_loop
, ev
);
2140 ev
= resolve_mixers (use_loop
, tmp
);
2142 if (folded_casts
&& tmp
!= ev
)
2143 *folded_casts
= true;
2145 if (use_loop
== wrto_loop
)
2148 /* If the value of the use changes in the inner loop, we cannot express
2149 its value in the outer loop (we might try to return interval chrec,
2150 but we do not have a user for it anyway) */
2151 if (!no_evolution_in_loop_p (ev
, use_loop
->num
, &val
)
2153 return chrec_dont_know
;
2155 use_loop
= loop_outer (use_loop
);
2160 /* Hashtable helpers for a temporary hash-table used when
2161 instantiating a CHREC or resolving mixers. For this use
2162 instantiated_below is always the same. */
2164 struct instantiate_cache_type
2167 vec
<scev_info_str
> entries
;
2169 instantiate_cache_type () : map (NULL
), entries (vNULL
) {}
2170 ~instantiate_cache_type ();
2171 tree
get (unsigned slot
) { return entries
[slot
].chrec
; }
2172 void set (unsigned slot
, tree chrec
) { entries
[slot
].chrec
= chrec
; }
2175 instantiate_cache_type::~instantiate_cache_type ()
2184 /* Cache to avoid infinite recursion when instantiating an SSA name.
2185 Live during the outermost instantiate_scev or resolve_mixers call. */
2186 static instantiate_cache_type
*global_cache
;
2188 /* Computes a hash function for database element ELT. */
2190 static inline hashval_t
2191 hash_idx_scev_info (const void *elt_
)
2193 unsigned idx
= ((size_t) elt_
) - 2;
2194 return hash_scev_info (&global_cache
->entries
[idx
]);
2197 /* Compares database elements E1 and E2. */
2200 eq_idx_scev_info (const void *e1
, const void *e2
)
2202 unsigned idx1
= ((size_t) e1
) - 2;
2203 return eq_scev_info (&global_cache
->entries
[idx1
], e2
);
2206 /* Returns from CACHE the slot number of the cached chrec for NAME. */
2209 get_instantiated_value_entry (instantiate_cache_type
&cache
,
2210 tree name
, basic_block instantiate_below
)
2214 cache
.map
= htab_create (10, hash_idx_scev_info
, eq_idx_scev_info
, NULL
);
2215 cache
.entries
.create (10);
2219 e
.name_version
= SSA_NAME_VERSION (name
);
2220 e
.instantiated_below
= instantiate_below
->index
;
2221 void **slot
= htab_find_slot_with_hash (cache
.map
, &e
,
2222 hash_scev_info (&e
), INSERT
);
2225 e
.chrec
= chrec_not_analyzed_yet
;
2226 *slot
= (void *)(size_t)(cache
.entries
.length () + 2);
2227 cache
.entries
.safe_push (e
);
2230 return ((size_t)*slot
) - 2;
2234 /* Return the closed_loop_phi node for VAR. If there is none, return
2238 loop_closed_phi_def (tree var
)
2243 gimple_stmt_iterator psi
;
2245 if (var
== NULL_TREE
2246 || TREE_CODE (var
) != SSA_NAME
)
2249 loop
= loop_containing_stmt (SSA_NAME_DEF_STMT (var
));
2250 exit
= single_exit (loop
);
2254 for (psi
= gsi_start_phis (exit
->dest
); !gsi_end_p (psi
); gsi_next (&psi
))
2256 phi
= gsi_stmt (psi
);
2257 if (PHI_ARG_DEF_FROM_EDGE (phi
, exit
) == var
)
2258 return PHI_RESULT (phi
);
2264 static tree
instantiate_scev_r (basic_block
, struct loop
*, struct loop
*,
2267 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2268 and EVOLUTION_LOOP, that were left under a symbolic form.
2270 CHREC is an SSA_NAME to be instantiated.
2272 CACHE is the cache of already instantiated values.
2274 FOLD_CONVERSIONS should be set to true when the conversions that
2275 may wrap in signed/pointer type are folded, as long as the value of
2276 the chrec is preserved.
2278 SIZE_EXPR is used for computing the size of the expression to be
2279 instantiated, and to stop if it exceeds some limit. */
2282 instantiate_scev_name (basic_block instantiate_below
,
2283 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2285 bool fold_conversions
,
2289 struct loop
*def_loop
;
2290 basic_block def_bb
= gimple_bb (SSA_NAME_DEF_STMT (chrec
));
2292 /* A parameter (or loop invariant and we do not want to include
2293 evolutions in outer loops), nothing to do. */
2295 || loop_depth (def_bb
->loop_father
) == 0
2296 || dominated_by_p (CDI_DOMINATORS
, instantiate_below
, def_bb
))
2299 /* We cache the value of instantiated variable to avoid exponential
2300 time complexity due to reevaluations. We also store the convenient
2301 value in the cache in order to prevent infinite recursion -- we do
2302 not want to instantiate the SSA_NAME if it is in a mixer
2303 structure. This is used for avoiding the instantiation of
2304 recursively defined functions, such as:
2306 | a_2 -> {0, +, 1, +, a_2}_1 */
2308 unsigned si
= get_instantiated_value_entry (*global_cache
,
2309 chrec
, instantiate_below
);
2310 if (global_cache
->get (si
) != chrec_not_analyzed_yet
)
2311 return global_cache
->get (si
);
2313 /* On recursion return chrec_dont_know. */
2314 global_cache
->set (si
, chrec_dont_know
);
2316 def_loop
= find_common_loop (evolution_loop
, def_bb
->loop_father
);
2318 /* If the analysis yields a parametric chrec, instantiate the
2320 res
= analyze_scalar_evolution (def_loop
, chrec
);
2322 /* Don't instantiate default definitions. */
2323 if (TREE_CODE (res
) == SSA_NAME
2324 && SSA_NAME_IS_DEFAULT_DEF (res
))
2327 /* Don't instantiate loop-closed-ssa phi nodes. */
2328 else if (TREE_CODE (res
) == SSA_NAME
2329 && loop_depth (loop_containing_stmt (SSA_NAME_DEF_STMT (res
)))
2330 > loop_depth (def_loop
))
2333 res
= loop_closed_phi_def (chrec
);
2337 /* When there is no loop_closed_phi_def, it means that the
2338 variable is not used after the loop: try to still compute the
2339 value of the variable when exiting the loop. */
2340 if (res
== NULL_TREE
)
2342 loop_p loop
= loop_containing_stmt (SSA_NAME_DEF_STMT (chrec
));
2343 res
= analyze_scalar_evolution (loop
, chrec
);
2344 res
= compute_overall_effect_of_inner_loop (loop
, res
);
2345 res
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2347 fold_conversions
, size_expr
);
2349 else if (!dominated_by_p (CDI_DOMINATORS
, instantiate_below
,
2350 gimple_bb (SSA_NAME_DEF_STMT (res
))))
2351 res
= chrec_dont_know
;
2354 else if (res
!= chrec_dont_know
)
2357 && def_bb
->loop_father
!= inner_loop
2358 && !flow_loop_nested_p (def_bb
->loop_father
, inner_loop
))
2359 /* ??? We could try to compute the overall effect of the loop here. */
2360 res
= chrec_dont_know
;
2362 res
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2364 fold_conversions
, size_expr
);
2367 /* Store the correct value to the cache. */
2368 global_cache
->set (si
, res
);
2372 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2373 and EVOLUTION_LOOP, that were left under a symbolic form.
2375 CHREC is a polynomial chain of recurrence to be instantiated.
2377 CACHE is the cache of already instantiated values.
2379 FOLD_CONVERSIONS should be set to true when the conversions that
2380 may wrap in signed/pointer type are folded, as long as the value of
2381 the chrec is preserved.
2383 SIZE_EXPR is used for computing the size of the expression to be
2384 instantiated, and to stop if it exceeds some limit. */
2387 instantiate_scev_poly (basic_block instantiate_below
,
2388 struct loop
*evolution_loop
, struct loop
*,
2389 tree chrec
, bool fold_conversions
, int size_expr
)
2392 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2393 get_chrec_loop (chrec
),
2394 CHREC_LEFT (chrec
), fold_conversions
,
2396 if (op0
== chrec_dont_know
)
2397 return chrec_dont_know
;
2399 op1
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2400 get_chrec_loop (chrec
),
2401 CHREC_RIGHT (chrec
), fold_conversions
,
2403 if (op1
== chrec_dont_know
)
2404 return chrec_dont_know
;
2406 if (CHREC_LEFT (chrec
) != op0
2407 || CHREC_RIGHT (chrec
) != op1
)
2409 op1
= chrec_convert_rhs (chrec_type (op0
), op1
, NULL
);
2410 chrec
= build_polynomial_chrec (CHREC_VARIABLE (chrec
), op0
, op1
);
2416 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2417 and EVOLUTION_LOOP, that were left under a symbolic form.
2419 "C0 CODE C1" is a binary expression of type TYPE to be instantiated.
2421 CACHE is the cache of already instantiated values.
2423 FOLD_CONVERSIONS should be set to true when the conversions that
2424 may wrap in signed/pointer type are folded, as long as the value of
2425 the chrec is preserved.
2427 SIZE_EXPR is used for computing the size of the expression to be
2428 instantiated, and to stop if it exceeds some limit. */
2431 instantiate_scev_binary (basic_block instantiate_below
,
2432 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2433 tree chrec
, enum tree_code code
,
2434 tree type
, tree c0
, tree c1
,
2435 bool fold_conversions
, int size_expr
)
2438 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
, inner_loop
,
2439 c0
, fold_conversions
, size_expr
);
2440 if (op0
== chrec_dont_know
)
2441 return chrec_dont_know
;
2443 op1
= instantiate_scev_r (instantiate_below
, evolution_loop
, inner_loop
,
2444 c1
, fold_conversions
, size_expr
);
2445 if (op1
== chrec_dont_know
)
2446 return chrec_dont_know
;
2451 op0
= chrec_convert (type
, op0
, NULL
);
2452 op1
= chrec_convert_rhs (type
, op1
, NULL
);
2456 case POINTER_PLUS_EXPR
:
2458 return chrec_fold_plus (type
, op0
, op1
);
2461 return chrec_fold_minus (type
, op0
, op1
);
2464 return chrec_fold_multiply (type
, op0
, op1
);
2471 return chrec
? chrec
: fold_build2 (code
, type
, c0
, c1
);
2474 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2475 and EVOLUTION_LOOP, that were left under a symbolic form.
2477 "CHREC" is an array reference to be instantiated.
2479 CACHE is the cache of already instantiated values.
2481 FOLD_CONVERSIONS should be set to true when the conversions that
2482 may wrap in signed/pointer type are folded, as long as the value of
2483 the chrec is preserved.
2485 SIZE_EXPR is used for computing the size of the expression to be
2486 instantiated, and to stop if it exceeds some limit. */
2489 instantiate_array_ref (basic_block instantiate_below
,
2490 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2491 tree chrec
, bool fold_conversions
, int size_expr
)
2494 tree index
= TREE_OPERAND (chrec
, 1);
2495 tree op1
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2497 fold_conversions
, size_expr
);
2499 if (op1
== chrec_dont_know
)
2500 return chrec_dont_know
;
2502 if (chrec
&& op1
== index
)
2505 res
= unshare_expr (chrec
);
2506 TREE_OPERAND (res
, 1) = op1
;
2510 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2511 and EVOLUTION_LOOP, that were left under a symbolic form.
2513 "CHREC" that stands for a convert expression "(TYPE) OP" is to be
2516 CACHE is the cache of already instantiated values.
2518 FOLD_CONVERSIONS should be set to true when the conversions that
2519 may wrap in signed/pointer type are folded, as long as the value of
2520 the chrec is preserved.
2522 SIZE_EXPR is used for computing the size of the expression to be
2523 instantiated, and to stop if it exceeds some limit. */
2526 instantiate_scev_convert (basic_block instantiate_below
,
2527 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2528 tree chrec
, tree type
, tree op
,
2529 bool fold_conversions
, int size_expr
)
2531 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2533 fold_conversions
, size_expr
);
2535 if (op0
== chrec_dont_know
)
2536 return chrec_dont_know
;
2538 if (fold_conversions
)
2540 tree tmp
= chrec_convert_aggressive (type
, op0
);
2545 if (chrec
&& op0
== op
)
2548 /* If we used chrec_convert_aggressive, we can no longer assume that
2549 signed chrecs do not overflow, as chrec_convert does, so avoid
2550 calling it in that case. */
2551 if (fold_conversions
)
2552 return fold_convert (type
, op0
);
2554 return chrec_convert (type
, op0
, NULL
);
2557 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2558 and EVOLUTION_LOOP, that were left under a symbolic form.
2560 CHREC is a BIT_NOT_EXPR or a NEGATE_EXPR expression to be instantiated.
2561 Handle ~X as -1 - X.
2562 Handle -X as -1 * X.
2564 CACHE is the cache of already instantiated values.
2566 FOLD_CONVERSIONS should be set to true when the conversions that
2567 may wrap in signed/pointer type are folded, as long as the value of
2568 the chrec is preserved.
2570 SIZE_EXPR is used for computing the size of the expression to be
2571 instantiated, and to stop if it exceeds some limit. */
2574 instantiate_scev_not (basic_block instantiate_below
,
2575 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2577 enum tree_code code
, tree type
, tree op
,
2578 bool fold_conversions
, int size_expr
)
2580 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2582 fold_conversions
, size_expr
);
2584 if (op0
== chrec_dont_know
)
2585 return chrec_dont_know
;
2589 op0
= chrec_convert (type
, op0
, NULL
);
2594 return chrec_fold_minus
2595 (type
, fold_convert (type
, integer_minus_one_node
), op0
);
2598 return chrec_fold_multiply
2599 (type
, fold_convert (type
, integer_minus_one_node
), op0
);
2606 return chrec
? chrec
: fold_build1 (code
, type
, op0
);
2609 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2610 and EVOLUTION_LOOP, that were left under a symbolic form.
2612 CHREC is an expression with 3 operands to be instantiated.
2614 CACHE is the cache of already instantiated values.
2616 FOLD_CONVERSIONS should be set to true when the conversions that
2617 may wrap in signed/pointer type are folded, as long as the value of
2618 the chrec is preserved.
2620 SIZE_EXPR is used for computing the size of the expression to be
2621 instantiated, and to stop if it exceeds some limit. */
2624 instantiate_scev_3 (basic_block instantiate_below
,
2625 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2627 bool fold_conversions
, int size_expr
)
2630 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2631 inner_loop
, TREE_OPERAND (chrec
, 0),
2632 fold_conversions
, size_expr
);
2633 if (op0
== chrec_dont_know
)
2634 return chrec_dont_know
;
2636 op1
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2637 inner_loop
, TREE_OPERAND (chrec
, 1),
2638 fold_conversions
, size_expr
);
2639 if (op1
== chrec_dont_know
)
2640 return chrec_dont_know
;
2642 op2
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2643 inner_loop
, TREE_OPERAND (chrec
, 2),
2644 fold_conversions
, size_expr
);
2645 if (op2
== chrec_dont_know
)
2646 return chrec_dont_know
;
2648 if (op0
== TREE_OPERAND (chrec
, 0)
2649 && op1
== TREE_OPERAND (chrec
, 1)
2650 && op2
== TREE_OPERAND (chrec
, 2))
2653 return fold_build3 (TREE_CODE (chrec
),
2654 TREE_TYPE (chrec
), op0
, op1
, op2
);
2657 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2658 and EVOLUTION_LOOP, that were left under a symbolic form.
2660 CHREC is an expression with 2 operands to be instantiated.
2662 CACHE is the cache of already instantiated values.
2664 FOLD_CONVERSIONS should be set to true when the conversions that
2665 may wrap in signed/pointer type are folded, as long as the value of
2666 the chrec is preserved.
2668 SIZE_EXPR is used for computing the size of the expression to be
2669 instantiated, and to stop if it exceeds some limit. */
2672 instantiate_scev_2 (basic_block instantiate_below
,
2673 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2675 bool fold_conversions
, int size_expr
)
2678 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2679 inner_loop
, TREE_OPERAND (chrec
, 0),
2680 fold_conversions
, size_expr
);
2681 if (op0
== chrec_dont_know
)
2682 return chrec_dont_know
;
2684 op1
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2685 inner_loop
, TREE_OPERAND (chrec
, 1),
2686 fold_conversions
, size_expr
);
2687 if (op1
== chrec_dont_know
)
2688 return chrec_dont_know
;
2690 if (op0
== TREE_OPERAND (chrec
, 0)
2691 && op1
== TREE_OPERAND (chrec
, 1))
2694 return fold_build2 (TREE_CODE (chrec
), TREE_TYPE (chrec
), op0
, op1
);
2697 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2698 and EVOLUTION_LOOP, that were left under a symbolic form.
2700 CHREC is an expression with 2 operands to be instantiated.
2702 CACHE is the cache of already instantiated values.
2704 FOLD_CONVERSIONS should be set to true when the conversions that
2705 may wrap in signed/pointer type are folded, as long as the value of
2706 the chrec is preserved.
2708 SIZE_EXPR is used for computing the size of the expression to be
2709 instantiated, and to stop if it exceeds some limit. */
2712 instantiate_scev_1 (basic_block instantiate_below
,
2713 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2715 bool fold_conversions
, int size_expr
)
2717 tree op0
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2718 inner_loop
, TREE_OPERAND (chrec
, 0),
2719 fold_conversions
, size_expr
);
2721 if (op0
== chrec_dont_know
)
2722 return chrec_dont_know
;
2724 if (op0
== TREE_OPERAND (chrec
, 0))
2727 return fold_build1 (TREE_CODE (chrec
), TREE_TYPE (chrec
), op0
);
2730 /* Analyze all the parameters of the chrec, between INSTANTIATE_BELOW
2731 and EVOLUTION_LOOP, that were left under a symbolic form.
2733 CHREC is the scalar evolution to instantiate.
2735 CACHE is the cache of already instantiated values.
2737 FOLD_CONVERSIONS should be set to true when the conversions that
2738 may wrap in signed/pointer type are folded, as long as the value of
2739 the chrec is preserved.
2741 SIZE_EXPR is used for computing the size of the expression to be
2742 instantiated, and to stop if it exceeds some limit. */
2745 instantiate_scev_r (basic_block instantiate_below
,
2746 struct loop
*evolution_loop
, struct loop
*inner_loop
,
2748 bool fold_conversions
, int size_expr
)
2750 /* Give up if the expression is larger than the MAX that we allow. */
2751 if (size_expr
++ > PARAM_VALUE (PARAM_SCEV_MAX_EXPR_SIZE
))
2752 return chrec_dont_know
;
2754 if (chrec
== NULL_TREE
2755 || automatically_generated_chrec_p (chrec
)
2756 || is_gimple_min_invariant (chrec
))
2759 switch (TREE_CODE (chrec
))
2762 return instantiate_scev_name (instantiate_below
, evolution_loop
,
2764 fold_conversions
, size_expr
);
2766 case POLYNOMIAL_CHREC
:
2767 return instantiate_scev_poly (instantiate_below
, evolution_loop
,
2769 fold_conversions
, size_expr
);
2771 case POINTER_PLUS_EXPR
:
2775 return instantiate_scev_binary (instantiate_below
, evolution_loop
,
2777 TREE_CODE (chrec
), chrec_type (chrec
),
2778 TREE_OPERAND (chrec
, 0),
2779 TREE_OPERAND (chrec
, 1),
2780 fold_conversions
, size_expr
);
2783 return instantiate_scev_convert (instantiate_below
, evolution_loop
,
2785 TREE_TYPE (chrec
), TREE_OPERAND (chrec
, 0),
2786 fold_conversions
, size_expr
);
2790 return instantiate_scev_not (instantiate_below
, evolution_loop
,
2792 TREE_CODE (chrec
), TREE_TYPE (chrec
),
2793 TREE_OPERAND (chrec
, 0),
2794 fold_conversions
, size_expr
);
2797 case SCEV_NOT_KNOWN
:
2798 return chrec_dont_know
;
2804 return instantiate_array_ref (instantiate_below
, evolution_loop
,
2806 fold_conversions
, size_expr
);
2812 if (VL_EXP_CLASS_P (chrec
))
2813 return chrec_dont_know
;
2815 switch (TREE_CODE_LENGTH (TREE_CODE (chrec
)))
2818 return instantiate_scev_3 (instantiate_below
, evolution_loop
,
2820 fold_conversions
, size_expr
);
2823 return instantiate_scev_2 (instantiate_below
, evolution_loop
,
2825 fold_conversions
, size_expr
);
2828 return instantiate_scev_1 (instantiate_below
, evolution_loop
,
2830 fold_conversions
, size_expr
);
2839 /* Too complicated to handle. */
2840 return chrec_dont_know
;
2843 /* Analyze all the parameters of the chrec that were left under a
2844 symbolic form. INSTANTIATE_BELOW is the basic block that stops the
2845 recursive instantiation of parameters: a parameter is a variable
2846 that is defined in a basic block that dominates INSTANTIATE_BELOW or
2847 a function parameter. */
2850 instantiate_scev (basic_block instantiate_below
, struct loop
*evolution_loop
,
2855 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2857 fprintf (dump_file
, "(instantiate_scev \n");
2858 fprintf (dump_file
, " (instantiate_below = %d)\n", instantiate_below
->index
);
2859 fprintf (dump_file
, " (evolution_loop = %d)\n", evolution_loop
->num
);
2860 fprintf (dump_file
, " (chrec = ");
2861 print_generic_expr (dump_file
, chrec
, 0);
2862 fprintf (dump_file
, ")\n");
2868 global_cache
= new instantiate_cache_type
;
2872 res
= instantiate_scev_r (instantiate_below
, evolution_loop
,
2873 NULL
, chrec
, false, 0);
2877 delete global_cache
;
2878 global_cache
= NULL
;
2881 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2883 fprintf (dump_file
, " (res = ");
2884 print_generic_expr (dump_file
, res
, 0);
2885 fprintf (dump_file
, "))\n");
2891 /* Similar to instantiate_parameters, but does not introduce the
2892 evolutions in outer loops for LOOP invariants in CHREC, and does not
2893 care about causing overflows, as long as they do not affect value
2894 of an expression. */
2897 resolve_mixers (struct loop
*loop
, tree chrec
)
2902 global_cache
= new instantiate_cache_type
;
2906 tree ret
= instantiate_scev_r (block_before_loop (loop
), loop
, NULL
,
2911 delete global_cache
;
2912 global_cache
= NULL
;
2918 /* Entry point for the analysis of the number of iterations pass.
2919 This function tries to safely approximate the number of iterations
2920 the loop will run. When this property is not decidable at compile
2921 time, the result is chrec_dont_know. Otherwise the result is a
2922 scalar or a symbolic parameter. When the number of iterations may
2923 be equal to zero and the property cannot be determined at compile
2924 time, the result is a COND_EXPR that represents in a symbolic form
2925 the conditions under which the number of iterations is not zero.
2927 Example of analysis: suppose that the loop has an exit condition:
2929 "if (b > 49) goto end_loop;"
2931 and that in a previous analysis we have determined that the
2932 variable 'b' has an evolution function:
2934 "EF = {23, +, 5}_2".
2936 When we evaluate the function at the point 5, i.e. the value of the
2937 variable 'b' after 5 iterations in the loop, we have EF (5) = 48,
2938 and EF (6) = 53. In this case the value of 'b' on exit is '53' and
2939 the loop body has been executed 6 times. */
2942 number_of_latch_executions (struct loop
*loop
)
2945 struct tree_niter_desc niter_desc
;
2949 /* Determine whether the number of iterations in loop has already
2951 res
= loop
->nb_iterations
;
2955 may_be_zero
= NULL_TREE
;
2957 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2958 fprintf (dump_file
, "(number_of_iterations_in_loop = \n");
2960 res
= chrec_dont_know
;
2961 exit
= single_exit (loop
);
2963 if (exit
&& number_of_iterations_exit (loop
, exit
, &niter_desc
, false))
2965 may_be_zero
= niter_desc
.may_be_zero
;
2966 res
= niter_desc
.niter
;
2969 if (res
== chrec_dont_know
2971 || integer_zerop (may_be_zero
))
2973 else if (integer_nonzerop (may_be_zero
))
2974 res
= build_int_cst (TREE_TYPE (res
), 0);
2976 else if (COMPARISON_CLASS_P (may_be_zero
))
2977 res
= fold_build3 (COND_EXPR
, TREE_TYPE (res
), may_be_zero
,
2978 build_int_cst (TREE_TYPE (res
), 0), res
);
2980 res
= chrec_dont_know
;
2982 if (dump_file
&& (dump_flags
& TDF_SCEV
))
2984 fprintf (dump_file
, " (set_nb_iterations_in_loop = ");
2985 print_generic_expr (dump_file
, res
, 0);
2986 fprintf (dump_file
, "))\n");
2989 loop
->nb_iterations
= res
;
2994 /* Counters for the stats. */
3000 unsigned nb_affine_multivar
;
3001 unsigned nb_higher_poly
;
3002 unsigned nb_chrec_dont_know
;
3003 unsigned nb_undetermined
;
3006 /* Reset the counters. */
3009 reset_chrecs_counters (struct chrec_stats
*stats
)
3011 stats
->nb_chrecs
= 0;
3012 stats
->nb_affine
= 0;
3013 stats
->nb_affine_multivar
= 0;
3014 stats
->nb_higher_poly
= 0;
3015 stats
->nb_chrec_dont_know
= 0;
3016 stats
->nb_undetermined
= 0;
3019 /* Dump the contents of a CHREC_STATS structure. */
3022 dump_chrecs_stats (FILE *file
, struct chrec_stats
*stats
)
3024 fprintf (file
, "\n(\n");
3025 fprintf (file
, "-----------------------------------------\n");
3026 fprintf (file
, "%d\taffine univariate chrecs\n", stats
->nb_affine
);
3027 fprintf (file
, "%d\taffine multivariate chrecs\n", stats
->nb_affine_multivar
);
3028 fprintf (file
, "%d\tdegree greater than 2 polynomials\n",
3029 stats
->nb_higher_poly
);
3030 fprintf (file
, "%d\tchrec_dont_know chrecs\n", stats
->nb_chrec_dont_know
);
3031 fprintf (file
, "-----------------------------------------\n");
3032 fprintf (file
, "%d\ttotal chrecs\n", stats
->nb_chrecs
);
3033 fprintf (file
, "%d\twith undetermined coefficients\n",
3034 stats
->nb_undetermined
);
3035 fprintf (file
, "-----------------------------------------\n");
3036 fprintf (file
, "%d\tchrecs in the scev database\n",
3037 (int) htab_elements (scalar_evolution_info
));
3038 fprintf (file
, "%d\tsets in the scev database\n", nb_set_scev
);
3039 fprintf (file
, "%d\tgets in the scev database\n", nb_get_scev
);
3040 fprintf (file
, "-----------------------------------------\n");
3041 fprintf (file
, ")\n\n");
3044 /* Gather statistics about CHREC. */
3047 gather_chrec_stats (tree chrec
, struct chrec_stats
*stats
)
3049 if (dump_file
&& (dump_flags
& TDF_STATS
))
3051 fprintf (dump_file
, "(classify_chrec ");
3052 print_generic_expr (dump_file
, chrec
, 0);
3053 fprintf (dump_file
, "\n");
3058 if (chrec
== NULL_TREE
)
3060 stats
->nb_undetermined
++;
3064 switch (TREE_CODE (chrec
))
3066 case POLYNOMIAL_CHREC
:
3067 if (evolution_function_is_affine_p (chrec
))
3069 if (dump_file
&& (dump_flags
& TDF_STATS
))
3070 fprintf (dump_file
, " affine_univariate\n");
3073 else if (evolution_function_is_affine_multivariate_p (chrec
, 0))
3075 if (dump_file
&& (dump_flags
& TDF_STATS
))
3076 fprintf (dump_file
, " affine_multivariate\n");
3077 stats
->nb_affine_multivar
++;
3081 if (dump_file
&& (dump_flags
& TDF_STATS
))
3082 fprintf (dump_file
, " higher_degree_polynomial\n");
3083 stats
->nb_higher_poly
++;
3092 if (chrec_contains_undetermined (chrec
))
3094 if (dump_file
&& (dump_flags
& TDF_STATS
))
3095 fprintf (dump_file
, " undetermined\n");
3096 stats
->nb_undetermined
++;
3099 if (dump_file
&& (dump_flags
& TDF_STATS
))
3100 fprintf (dump_file
, ")\n");
3103 /* Callback for htab_traverse, gathers information on chrecs in the
3107 gather_stats_on_scev_database_1 (void **slot
, void *stats
)
3109 struct scev_info_str
*entry
= (struct scev_info_str
*) *slot
;
3111 gather_chrec_stats (entry
->chrec
, (struct chrec_stats
*) stats
);
3116 /* Classify the chrecs of the whole database. */
3119 gather_stats_on_scev_database (void)
3121 struct chrec_stats stats
;
3126 reset_chrecs_counters (&stats
);
3128 htab_traverse (scalar_evolution_info
, gather_stats_on_scev_database_1
,
3131 dump_chrecs_stats (dump_file
, &stats
);
3139 initialize_scalar_evolutions_analyzer (void)
3141 /* The elements below are unique. */
3142 if (chrec_dont_know
== NULL_TREE
)
3144 chrec_not_analyzed_yet
= NULL_TREE
;
3145 chrec_dont_know
= make_node (SCEV_NOT_KNOWN
);
3146 chrec_known
= make_node (SCEV_KNOWN
);
3147 TREE_TYPE (chrec_dont_know
) = void_type_node
;
3148 TREE_TYPE (chrec_known
) = void_type_node
;
3152 /* Initialize the analysis of scalar evolutions for LOOPS. */
3155 scev_initialize (void)
3159 scalar_evolution_info
= htab_create_ggc (100, hash_scev_info
, eq_scev_info
,
3162 initialize_scalar_evolutions_analyzer ();
3164 FOR_EACH_LOOP (loop
, 0)
3166 loop
->nb_iterations
= NULL_TREE
;
3170 /* Return true if SCEV is initialized. */
3173 scev_initialized_p (void)
3175 return scalar_evolution_info
!= NULL
;
3178 /* Cleans up the information cached by the scalar evolutions analysis
3179 in the hash table. */
3182 scev_reset_htab (void)
3184 if (!scalar_evolution_info
)
3187 htab_empty (scalar_evolution_info
);
3190 /* Cleans up the information cached by the scalar evolutions analysis
3191 in the hash table and in the loop->nb_iterations. */
3203 FOR_EACH_LOOP (loop
, 0)
3205 loop
->nb_iterations
= NULL_TREE
;
3209 /* Checks whether use of OP in USE_LOOP behaves as a simple affine iv with
3210 respect to WRTO_LOOP and returns its base and step in IV if possible
3211 (see analyze_scalar_evolution_in_loop for more details on USE_LOOP
3212 and WRTO_LOOP). If ALLOW_NONCONSTANT_STEP is true, we want step to be
3213 invariant in LOOP. Otherwise we require it to be an integer constant.
3215 IV->no_overflow is set to true if we are sure the iv cannot overflow (e.g.
3216 because it is computed in signed arithmetics). Consequently, adding an
3219 for (i = IV->base; ; i += IV->step)
3221 is only safe if IV->no_overflow is false, or TYPE_OVERFLOW_UNDEFINED is
3222 false for the type of the induction variable, or you can prove that i does
3223 not wrap by some other argument. Otherwise, this might introduce undefined
3226 for (i = iv->base; ; i = (type) ((unsigned type) i + (unsigned type) iv->step))
3228 must be used instead. */
3231 simple_iv (struct loop
*wrto_loop
, struct loop
*use_loop
, tree op
,
3232 affine_iv
*iv
, bool allow_nonconstant_step
)
3237 iv
->base
= NULL_TREE
;
3238 iv
->step
= NULL_TREE
;
3239 iv
->no_overflow
= false;
3241 type
= TREE_TYPE (op
);
3242 if (!POINTER_TYPE_P (type
)
3243 && !INTEGRAL_TYPE_P (type
))
3246 ev
= analyze_scalar_evolution_in_loop (wrto_loop
, use_loop
, op
,
3248 if (chrec_contains_undetermined (ev
)
3249 || chrec_contains_symbols_defined_in_loop (ev
, wrto_loop
->num
))
3252 if (tree_does_not_contain_chrecs (ev
))
3255 iv
->step
= build_int_cst (TREE_TYPE (ev
), 0);
3256 iv
->no_overflow
= true;
3260 if (TREE_CODE (ev
) != POLYNOMIAL_CHREC
3261 || CHREC_VARIABLE (ev
) != (unsigned) wrto_loop
->num
)
3264 iv
->step
= CHREC_RIGHT (ev
);
3265 if ((!allow_nonconstant_step
&& TREE_CODE (iv
->step
) != INTEGER_CST
)
3266 || tree_contains_chrecs (iv
->step
, NULL
))
3269 iv
->base
= CHREC_LEFT (ev
);
3270 if (tree_contains_chrecs (iv
->base
, NULL
))
3273 iv
->no_overflow
= !folded_casts
&& TYPE_OVERFLOW_UNDEFINED (type
);
3278 /* Finalize the scalar evolution analysis. */
3281 scev_finalize (void)
3283 if (!scalar_evolution_info
)
3285 htab_delete (scalar_evolution_info
);
3286 scalar_evolution_info
= NULL
;
3289 /* Returns true if the expression EXPR is considered to be too expensive
3290 for scev_const_prop. */
3293 expression_expensive_p (tree expr
)
3295 enum tree_code code
;
3297 if (is_gimple_val (expr
))
3300 code
= TREE_CODE (expr
);
3301 if (code
== TRUNC_DIV_EXPR
3302 || code
== CEIL_DIV_EXPR
3303 || code
== FLOOR_DIV_EXPR
3304 || code
== ROUND_DIV_EXPR
3305 || code
== TRUNC_MOD_EXPR
3306 || code
== CEIL_MOD_EXPR
3307 || code
== FLOOR_MOD_EXPR
3308 || code
== ROUND_MOD_EXPR
3309 || code
== EXACT_DIV_EXPR
)
3311 /* Division by power of two is usually cheap, so we allow it.
3312 Forbid anything else. */
3313 if (!integer_pow2p (TREE_OPERAND (expr
, 1)))
3317 switch (TREE_CODE_CLASS (code
))
3320 case tcc_comparison
:
3321 if (expression_expensive_p (TREE_OPERAND (expr
, 1)))
3326 return expression_expensive_p (TREE_OPERAND (expr
, 0));
3333 /* Replace ssa names for that scev can prove they are constant by the
3334 appropriate constants. Also perform final value replacement in loops,
3335 in case the replacement expressions are cheap.
3337 We only consider SSA names defined by phi nodes; rest is left to the
3338 ordinary constant propagation pass. */
3341 scev_const_prop (void)
3344 tree name
, type
, ev
;
3346 struct loop
*loop
, *ex_loop
;
3347 bitmap ssa_names_to_remove
= NULL
;
3349 gimple_stmt_iterator psi
;
3351 if (number_of_loops (cfun
) <= 1)
3354 FOR_EACH_BB_FN (bb
, cfun
)
3356 loop
= bb
->loop_father
;
3358 for (psi
= gsi_start_phis (bb
); !gsi_end_p (psi
); gsi_next (&psi
))
3360 phi
= gsi_stmt (psi
);
3361 name
= PHI_RESULT (phi
);
3363 if (virtual_operand_p (name
))
3366 type
= TREE_TYPE (name
);
3368 if (!POINTER_TYPE_P (type
)
3369 && !INTEGRAL_TYPE_P (type
))
3372 ev
= resolve_mixers (loop
, analyze_scalar_evolution (loop
, name
));
3373 if (!is_gimple_min_invariant (ev
)
3374 || !may_propagate_copy (name
, ev
))
3377 /* Replace the uses of the name. */
3379 replace_uses_by (name
, ev
);
3381 if (!ssa_names_to_remove
)
3382 ssa_names_to_remove
= BITMAP_ALLOC (NULL
);
3383 bitmap_set_bit (ssa_names_to_remove
, SSA_NAME_VERSION (name
));
3387 /* Remove the ssa names that were replaced by constants. We do not
3388 remove them directly in the previous cycle, since this
3389 invalidates scev cache. */
3390 if (ssa_names_to_remove
)
3394 EXECUTE_IF_SET_IN_BITMAP (ssa_names_to_remove
, 0, i
, bi
)
3396 gimple_stmt_iterator psi
;
3397 name
= ssa_name (i
);
3398 phi
= SSA_NAME_DEF_STMT (name
);
3400 gcc_assert (gimple_code (phi
) == GIMPLE_PHI
);
3401 psi
= gsi_for_stmt (phi
);
3402 remove_phi_node (&psi
, true);
3405 BITMAP_FREE (ssa_names_to_remove
);
3409 /* Now the regular final value replacement. */
3410 FOR_EACH_LOOP (loop
, LI_FROM_INNERMOST
)
3413 tree def
, rslt
, niter
;
3414 gimple_stmt_iterator gsi
;
3416 /* If we do not know exact number of iterations of the loop, we cannot
3417 replace the final value. */
3418 exit
= single_exit (loop
);
3422 niter
= number_of_latch_executions (loop
);
3423 if (niter
== chrec_dont_know
)
3426 /* Ensure that it is possible to insert new statements somewhere. */
3427 if (!single_pred_p (exit
->dest
))
3428 split_loop_exit_edge (exit
);
3429 gsi
= gsi_after_labels (exit
->dest
);
3431 ex_loop
= superloop_at_depth (loop
,
3432 loop_depth (exit
->dest
->loop_father
) + 1);
3434 for (psi
= gsi_start_phis (exit
->dest
); !gsi_end_p (psi
); )
3436 phi
= gsi_stmt (psi
);
3437 rslt
= PHI_RESULT (phi
);
3438 def
= PHI_ARG_DEF_FROM_EDGE (phi
, exit
);
3439 if (virtual_operand_p (def
))
3445 if (!POINTER_TYPE_P (TREE_TYPE (def
))
3446 && !INTEGRAL_TYPE_P (TREE_TYPE (def
)))
3453 def
= analyze_scalar_evolution_in_loop (ex_loop
, loop
, def
,
3455 def
= compute_overall_effect_of_inner_loop (ex_loop
, def
);
3456 if (!tree_does_not_contain_chrecs (def
)
3457 || chrec_contains_symbols_defined_in_loop (def
, ex_loop
->num
)
3458 /* Moving the computation from the loop may prolong life range
3459 of some ssa names, which may cause problems if they appear
3460 on abnormal edges. */
3461 || contains_abnormal_ssa_name_p (def
)
3462 /* Do not emit expensive expressions. The rationale is that
3463 when someone writes a code like
3465 while (n > 45) n -= 45;
3467 he probably knows that n is not large, and does not want it
3468 to be turned into n %= 45. */
3469 || expression_expensive_p (def
))
3471 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3473 fprintf (dump_file
, "not replacing:\n ");
3474 print_gimple_stmt (dump_file
, phi
, 0, 0);
3475 fprintf (dump_file
, "\n");
3481 /* Eliminate the PHI node and replace it by a computation outside
3485 fprintf (dump_file
, "\nfinal value replacement:\n ");
3486 print_gimple_stmt (dump_file
, phi
, 0, 0);
3487 fprintf (dump_file
, " with\n ");
3489 def
= unshare_expr (def
);
3490 remove_phi_node (&psi
, false);
3492 /* If def's type has undefined overflow and there were folded
3493 casts, rewrite all stmts added for def into arithmetics
3494 with defined overflow behavior. */
3495 if (folded_casts
&& TYPE_OVERFLOW_UNDEFINED (TREE_TYPE (def
)))
3498 gimple_stmt_iterator gsi2
;
3499 def
= force_gimple_operand (def
, &stmts
, true, NULL_TREE
);
3500 gsi2
= gsi_start (stmts
);
3501 while (!gsi_end_p (gsi2
))
3503 gimple stmt
= gsi_stmt (gsi2
);
3504 gimple_stmt_iterator gsi3
= gsi2
;
3506 gsi_remove (&gsi3
, false);
3507 if (is_gimple_assign (stmt
)
3508 && arith_code_with_undefined_signed_overflow
3509 (gimple_assign_rhs_code (stmt
)))
3510 gsi_insert_seq_before (&gsi
,
3511 rewrite_to_defined_overflow (stmt
),
3514 gsi_insert_before (&gsi
, stmt
, GSI_SAME_STMT
);
3518 def
= force_gimple_operand_gsi (&gsi
, def
, false, NULL_TREE
,
3519 true, GSI_SAME_STMT
);
3521 ass
= gimple_build_assign (rslt
, def
);
3522 gsi_insert_before (&gsi
, ass
, GSI_SAME_STMT
);
3525 print_gimple_stmt (dump_file
, ass
, 0, 0);
3526 fprintf (dump_file
, "\n");
3533 #include "gt-tree-scalar-evolution.h"