1 /* Natural loop functions
2 Copyright (C) 1987-2014 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
23 #include "double-int.h"
29 /* Structure to hold decision about unrolling/peeling. */
40 struct GTY (()) lpt_decision
{
41 enum lpt_dec decision
;
45 /* The type of extend applied to an IV. */
53 /* The structure describing a bound on number of iterations of a loop. */
55 struct GTY ((chain_next ("%h.next"))) nb_iter_bound
{
56 /* The statement STMT is executed at most ... */
59 /* ... BOUND + 1 times (BOUND must be an unsigned constant).
60 The + 1 is added for the following reasons:
62 a) 0 would otherwise be unused, while we would need to care more about
63 overflows (as MAX + 1 is sometimes produced as the estimate on number
64 of executions of STMT).
65 b) it is consistent with the result of number_of_iterations_exit. */
68 /* True if the statement will cause the loop to be exited the (at most)
69 BOUND + 1-st time it is executed, that is, all the statements after it
70 are executed at most BOUND times. */
73 /* The next bound in the list. */
74 struct nb_iter_bound
*next
;
77 /* Description of the loop exit. */
79 struct GTY (()) loop_exit
{
83 /* Previous and next exit in the list of the exits of the loop. */
84 struct loop_exit
*prev
;
85 struct loop_exit
*next
;
87 /* Next element in the list of loops from which E exits. */
88 struct loop_exit
*next_e
;
91 typedef struct loop
*loop_p
;
93 /* An integer estimation of the number of iterations. Estimate_state
94 describes the state of the estimation. */
97 /* Estimate was not computed yet. */
99 /* Estimate is ready. */
104 /* Structure to hold information for each natural loop. */
105 struct GTY ((chain_next ("%h.next"))) loop
{
106 /* Index into loops array. */
109 /* Number of loop insns. */
112 /* Basic block of loop header. */
115 /* Basic block of loop latch. */
118 /* For loop unrolling/peeling decision. */
119 struct lpt_decision lpt_decision
;
121 /* Average number of executed insns per iteration. */
124 /* Number of blocks contained within the loop. */
127 /* Superloops of the loop, starting with the outermost loop. */
128 vec
<loop_p
, va_gc
> *superloops
;
130 /* The first inner (child) loop or NULL if innermost loop. */
133 /* Link to the next (sibling) loop. */
136 /* Auxiliary info specific to a pass. */
137 PTR
GTY ((skip (""))) aux
;
139 /* The number of times the latch of the loop is executed. This can be an
140 INTEGER_CST, or a symbolic expression representing the number of
141 iterations like "N - 1", or a COND_EXPR containing the runtime
142 conditions under which the number of iterations is non zero.
144 Don't access this field directly: number_of_latch_executions
145 computes and caches the computed information in this field. */
148 /* An integer guaranteed to be greater than or equal to nb_iterations. Only
149 valid if any_upper_bound is true. */
150 widest_int nb_iterations_upper_bound
;
152 /* An integer giving an estimate of nb_iterations. Unlike
153 nb_iterations_upper_bound, there is no guarantee that it is at least
154 nb_iterations. */
155 widest_int nb_iterations_estimate
;
157 bool any_upper_bound
;
160 /* True if the loop can be parallel. */
161 bool can_be_parallel
;
163 /* True if -Waggressive-loop-optimizations warned about this loop
164 already. */
165 bool warned_aggressive_loop_optimizations
;
167 /* An integer estimation of the number of iterations. Estimate_state
168 describes the state of the estimation. */
169 enum loop_estimation estimate_state
;
171 /* If > 0, an integer, where the user asserted that for any
172 I in [ 0, nb_iterations ) and for any J in
173 [ I, min ( I + safelen, nb_iterations ) ), the Ith and Jth iterations
174 of the loop can be safely evaluated concurrently. */
177 /* True if this loop should never be vectorized. */
180 /* True if we should try harder to vectorize this loop. */
181 bool force_vectorize
;
183 /* For SIMD loops, this is a unique identifier of the loop, referenced
184 by IFN_GOMP_SIMD_VF, IFN_GOMP_SIMD_LANE and IFN_GOMP_SIMD_LAST_LANE. */
188 /* Upper bound on number of iterations of a loop. */
189 struct nb_iter_bound
*bounds
;
191 /* Head of the cyclic list of the exits of the loop. */
192 struct loop_exit
*exits
;
194 /* Number of iteration analysis data for RTL. */
195 struct niter_desc
*simple_loop_desc
;
197 /* For sanity checking during loop fixup we record here the former
198 loop header for loops marked for removal. Note that this prevents
199 the basic-block from being collected but its index can still be
200 reused. */
201 basic_block former_header
;
204 /* Flags for state of loop structure. */
207 LOOPS_HAVE_PREHEADERS
= 1,
208 LOOPS_HAVE_SIMPLE_LATCHES
= 2,
209 LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS
= 4,
210 LOOPS_HAVE_RECORDED_EXITS
= 8,
211 LOOPS_MAY_HAVE_MULTIPLE_LATCHES
= 16,
212 LOOP_CLOSED_SSA
= 32,
213 LOOPS_NEED_FIXUP
= 64,
214 LOOPS_HAVE_FALLTHRU_PREHEADERS
= 128
/* LOOPS_NORMAL is the bitwise OR of three loop-state flags:
   LOOPS_HAVE_PREHEADERS, LOOPS_HAVE_SIMPLE_LATCHES and
   LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS. */
217 #define LOOPS_NORMAL (LOOPS_HAVE_PREHEADERS | LOOPS_HAVE_SIMPLE_LATCHES \
218 | LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS)
/* AVOID_CFG_MODIFICATIONS expands to the single flag
   LOOPS_MAY_HAVE_MULTIPLE_LATCHES. */
219 #define AVOID_CFG_MODIFICATIONS (LOOPS_MAY_HAVE_MULTIPLE_LATCHES)
221 /* Structure to hold CFG information about natural loops within a function. */
222 struct GTY (()) loops
{
223 /* State of loops. */
226 /* Array of the loops. */
227 vec
<loop_p
, va_gc
> *larray
;
229 /* Maps edges to the list of their descriptions as loop exits. Edges
230 whose sources or destinations have loop_father == NULL (which may
231 happen during the cfg manipulations) should not appear in EXITS. */
232 htab_t
GTY((param_is (struct loop_exit
))) exits
;
234 /* Pointer to root of loop hierarchy tree. */
235 struct loop
*tree_root
;
238 /* Loop recognition. */
239 bool bb_loop_header_p (basic_block
);
240 void init_loops_structure (struct function
*, struct loops
*, unsigned);
241 extern struct loops
*flow_loops_find (struct loops
*);
242 extern void disambiguate_loops_with_multiple_latches (void);
243 extern void flow_loops_free (struct loops
*);
244 extern void flow_loops_dump (FILE *,
245 void (*)(const struct loop
*, FILE *, int), int);
246 extern void flow_loop_dump (const struct loop
*, FILE *,
247 void (*)(const struct loop
*, FILE *, int), int);
248 struct loop
*alloc_loop (void);
249 extern void flow_loop_free (struct loop
*);
250 int flow_loop_nodes_find (basic_block
, struct loop
*);
251 unsigned fix_loop_structure (bitmap changed_bbs
);
252 bool mark_irreducible_loops (void);
253 void release_recorded_exits (void);
254 void record_loop_exits (void);
255 void rescan_loop_exit (edge
, bool, bool);
257 /* Loop data structure manipulation/querying. */
258 extern void flow_loop_tree_node_add (struct loop
*, struct loop
*);
259 extern void flow_loop_tree_node_remove (struct loop
*);
260 extern void place_new_loop (struct function
*, struct loop
*);
261 extern void add_loop (struct loop
*, struct loop
*);
262 extern bool flow_loop_nested_p (const struct loop
*, const struct loop
*);
263 extern bool flow_bb_inside_loop_p (const struct loop
*, const_basic_block
);
264 extern struct loop
* find_common_loop (struct loop
*, struct loop
*);
265 struct loop
*superloop_at_depth (struct loop
*, unsigned);
266 struct eni_weights_d
;
267 extern int num_loop_insns (const struct loop
*);
268 extern int average_num_loop_insns (const struct loop
*);
269 extern unsigned get_loop_level (const struct loop
*);
270 extern bool loop_exit_edge_p (const struct loop
*, const_edge
);
271 extern bool loop_exits_to_bb_p (struct loop
*, basic_block
);
272 extern bool loop_exits_from_bb_p (struct loop
*, basic_block
);
273 extern void mark_loop_exit_edges (void);
274 extern location_t
get_loop_location (struct loop
*loop
);
276 /* Loops & cfg manipulation. */
277 extern basic_block
*get_loop_body (const struct loop
*);
278 extern unsigned get_loop_body_with_size (const struct loop
*, basic_block
*,
280 extern basic_block
*get_loop_body_in_dom_order (const struct loop
*);
281 extern basic_block
*get_loop_body_in_bfs_order (const struct loop
*);
282 extern basic_block
*get_loop_body_in_custom_order (const struct loop
*,
283 int (*) (const void *, const void *));
285 extern vec
<edge
> get_loop_exit_edges (const struct loop
*);
286 extern edge
single_exit (const struct loop
*);
287 extern edge
single_likely_exit (struct loop
*loop
);
288 extern unsigned num_loop_branches (const struct loop
*);
290 extern edge
loop_preheader_edge (const struct loop
*);
291 extern edge
loop_latch_edge (const struct loop
*);
293 extern void add_bb_to_loop (basic_block
, struct loop
*);
294 extern void remove_bb_from_loops (basic_block
);
296 extern void cancel_loop_tree (struct loop
*);
297 extern void delete_loop (struct loop
*);
301 CP_SIMPLE_PREHEADERS
= 1,
302 CP_FALLTHRU_PREHEADERS
= 2
305 basic_block
create_preheader (struct loop
*, int);
306 extern void create_preheaders (int);
307 extern void force_single_succ_latches (void);
309 extern void verify_loop_structure (void);
312 extern bool just_once_each_iteration_p (const struct loop
*, const_basic_block
);
313 gcov_type
expected_loop_iterations_unbounded (const struct loop
*);
314 extern unsigned expected_loop_iterations (const struct loop
*);
315 extern rtx
doloop_condition_get (rtx
);
318 /* Loop manipulation. */
319 extern bool can_duplicate_loop_p (const struct loop
*loop
);
/* DLTHE_* flags.  The values 1, 2 and 4 are distinct bits, so they can be
   OR-ed together.  NOTE(review): presumably these are passed as the flags
   argument of duplicate_loop_to_header_edge -- confirm against its
   definition, which is not visible here. */
321 #define DLTHE_FLAG_UPDATE_FREQ 1 /* Update frequencies in
322 duplicate_loop_to_header_edge. */
323 #define DLTHE_RECORD_COPY_NUMBER 2 /* Record copy number in the aux
324 field of newly created BB. */
325 #define DLTHE_FLAG_COMPLETTE_PEEL 4 /* Update frequencies expecting
326 a complete peeling. */
328 extern edge
create_empty_if_region_on_edge (edge
, tree
);
329 extern struct loop
*create_empty_loop_on_edge (edge
, tree
, tree
, tree
, tree
,
330 tree
*, tree
*, struct loop
*);
331 extern struct loop
* duplicate_loop (struct loop
*, struct loop
*);
332 extern void copy_loop_info (struct loop
*loop
, struct loop
*target
);
333 extern void duplicate_subloops (struct loop
*, struct loop
*);
334 extern bool duplicate_loop_to_header_edge (struct loop
*, edge
,
335 unsigned, sbitmap
, edge
,
337 extern struct loop
*loopify (edge
, edge
,
338 basic_block
, edge
, edge
, bool,
340 struct loop
* loop_version (struct loop
*, void *,
341 basic_block
*, unsigned, unsigned, unsigned, bool);
342 extern bool remove_path (edge
);
343 extern void unloop (struct loop
*, bool *, bitmap
);
344 extern void scale_loop_frequencies (struct loop
*, int, int);
345 void mark_loop_for_removal (loop_p
);
348 /* Induction variable analysis. */
350 /* The description of an induction variable. Things are a bit complicated
351 due to the need to handle subregs and extends. The value of the object described
352 by it can be obtained as follows (all computations are done in extend_mode):
354 Value in i-th iteration is
355 delta + mult * extend_{extend_mode} (subreg_{mode} (base + i * step)).
357 If first_special is true, the value in the first iteration is
360 If extend = UNKNOWN, first_special must be false, delta 0, mult 1 and value is
361 subreg_{mode} (base + i * step)
363 The get_iv_value function can be used to obtain these expressions.
365 ??? Add a third mode field that would specify the mode in which the inner
366 computation is done, which would enable it to be different from the
371 /* Its base and step (mode of base and step is supposed to be extend_mode,
372 see the description above). */
375 /* The type of extend applied to it (IV_SIGN_EXTEND, IV_ZERO_EXTEND,
376 or IV_UNKNOWN_EXTEND). */
377 enum iv_extend_code extend
;
379 /* Operations applied in the extended mode. */
382 /* The mode it is extended to. */
383 enum machine_mode extend_mode
;
385 /* The mode the variable iterates in. */
386 enum machine_mode mode
;
388 /* Whether the first iteration needs to be handled specially. */
389 unsigned first_special
: 1;
392 /* The description of an exit from the loop and of the number of iterations
393 till we take the exit. */
395 struct GTY(()) niter_desc
397 /* The edge out of the loop. */
400 /* The other edge leading from the condition. */
403 /* True if we are able to say anything about the number of iterations of the
404 loop. */
407 /* True if the loop iterates a constant number of times. */
410 /* Number of iterations if constant. */
413 /* Assumptions under which the rest of the information is valid. */
416 /* Assumptions under which the loop ends before reaching the latch,
417 even if the value of niter_expr says otherwise. */
418 rtx noloop_assumptions
;
420 /* Condition under which the loop is infinite. */
423 /* Whether the comparison is signed. */
426 /* The mode in which niter_expr should be computed. */
427 enum machine_mode mode
;
429 /* The number of iterations of the loop. */
433 extern void iv_analysis_loop_init (struct loop
*);
434 extern bool iv_analyze (rtx_insn
*, rtx
, struct rtx_iv
*);
435 extern bool iv_analyze_result (rtx_insn
*, rtx
, struct rtx_iv
*);
436 extern bool iv_analyze_expr (rtx_insn
*, rtx
, enum machine_mode
,
438 extern rtx
get_iv_value (struct rtx_iv
*, rtx
);
439 extern bool biv_p (rtx_insn
*, rtx
);
440 extern void find_simple_exit (struct loop
*, struct niter_desc
*);
441 extern void iv_analysis_done (void);
443 extern struct niter_desc
*get_simple_loop_desc (struct loop
*loop
);
444 extern void free_simple_loop_desc (struct loop
*loop
);
446 static inline struct niter_desc
*
447 simple_loop_desc (struct loop
*loop
)
449 return loop
->simple_loop_desc
;
452 /* Accessors for the loop structures. */
454 /* Returns the loop with index NUM from FN's loop tree. */
456 static inline struct loop
*
457 get_loop (struct function
*fn
, unsigned num
)
459 return (*loops_for_fn (fn
)->larray
)[num
];
462 /* Returns the number of superloops of LOOP. */
464 static inline unsigned
465 loop_depth (const struct loop
*loop
)
467 return vec_safe_length (loop
->superloops
);
470 /* Returns the immediate superloop of LOOP, or NULL if LOOP is the outermost
471 loop. */
473 static inline struct loop
*
474 loop_outer (const struct loop
*loop
)
476 unsigned n
= vec_safe_length (loop
->superloops
);
481 return (*loop
->superloops
)[n
- 1];
484 /* Returns true if LOOP has at least one exit edge. */
487 loop_has_exit_edges (const struct loop
*loop
)
489 return loop
->exits
->next
->e
!= NULL
;
492 /* Returns the list of loops in FN. */
494 inline vec
<loop_p
, va_gc
> *
495 get_loops (struct function
*fn
)
497 struct loops
*loops
= loops_for_fn (fn
);
501 return loops
->larray
;
504 /* Returns the number of loops in FN (including the removed
505 ones and the fake loop that forms the root of the loop tree). */
507 static inline unsigned
508 number_of_loops (struct function
*fn
)
510 struct loops
*loops
= loops_for_fn (fn
);
514 return vec_safe_length (loops
->larray
);
517 /* Returns true if state of the loops satisfies all properties
518 described by FLAGS. */
521 loops_state_satisfies_p (unsigned flags
)
523 return (current_loops
->state
& flags
) == flags
;
526 /* Sets FLAGS in the loops state. */
529 loops_state_set (unsigned flags
)
531 current_loops
->state
|= flags
;
534 /* Clears FLAGS from the loops state. */
537 loops_state_clear (unsigned flags
)
541 current_loops
->state
&= ~flags
;
544 /* Loop iterators. */
546 /* Flags for loop iteration. */
550 LI_INCLUDE_ROOT
= 1, /* Include the fake root of the loop tree. */
551 LI_FROM_INNERMOST
= 2, /* Iterate over the loops in the reverse order,
552 starting from innermost ones. */
553 LI_ONLY_INNERMOST
= 4 /* Iterate only over innermost loops. */
556 /* The iterator for loops. */
560 loop_iterator (loop_p
*loop
, unsigned flags
);
563 inline loop_p
next ();
565 /* The list of loops to visit. */
568 /* The index of the actual loop. */
573 loop_iterator::next ()
577 while (this->to_visit
.iterate (this->idx
, &anum
))
580 loop_p loop
= get_loop (cfun
, anum
);
589 loop_iterator::loop_iterator (loop_p
*loop
, unsigned flags
)
598 this->to_visit
.create (0);
603 this->to_visit
.create (number_of_loops (cfun
));
604 mn
= (flags
& LI_INCLUDE_ROOT
) ? 0 : 1;
606 if (flags
& LI_ONLY_INNERMOST
)
608 for (i
= 0; vec_safe_iterate (current_loops
->larray
, i
, &aloop
); i
++)
610 && aloop
->inner
== NULL
612 this->to_visit
.quick_push (aloop
->num
);
614 else if (flags
& LI_FROM_INNERMOST
)
616 /* Push the loops to LI->TO_VISIT in postorder. */
617 for (aloop
= current_loops
->tree_root
;
618 aloop
->inner
!= NULL
;
619 aloop
= aloop
->inner
)
624 if (aloop
->num
>= mn
)
625 this->to_visit
.quick_push (aloop
->num
);
629 for (aloop
= aloop
->next
;
630 aloop
->inner
!= NULL
;
631 aloop
= aloop
->inner
)
634 else if (!loop_outer (aloop
))
637 aloop
= loop_outer (aloop
);
642 /* Push the loops to LI->TO_VISIT in preorder. */
643 aloop
= current_loops
->tree_root
;
646 if (aloop
->num
>= mn
)
647 this->to_visit
.quick_push (aloop
->num
);
649 if (aloop
->inner
!= NULL
)
650 aloop
= aloop
->inner
;
653 while (aloop
!= NULL
&& aloop
->next
== NULL
)
654 aloop
= loop_outer (aloop
);
662 *loop
= this->next ();
666 loop_iterator::~loop_iterator ()
668 this->to_visit
.release ();
671 #define FOR_EACH_LOOP(LOOP, FLAGS) \
672 for (loop_iterator li(&(LOOP), FLAGS); \
676 /* The properties of the target. */
677 struct target_cfgloop
{
678 /* Number of available registers. */
679 unsigned x_target_avail_regs
;
681 /* Number of available registers that are call-clobbered. */
682 unsigned x_target_clobbered_regs
;
684 /* Number of registers reserved for temporary expressions. */
685 unsigned x_target_res_regs
;
687 /* The cost for register when there still is some reserve, but we are
688 approaching the number of available registers. */
689 unsigned x_target_reg_cost
[2];
691 /* The cost for register when we need to spill. */
692 unsigned x_target_spill_cost
[2];
695 extern struct target_cfgloop default_target_cfgloop
;
696 #if SWITCHABLE_TARGET
697 extern struct target_cfgloop
*this_target_cfgloop
;
699 #define this_target_cfgloop (&default_target_cfgloop)
/* Shorthand accessors for the target_cfgloop fields: each macro below
   expands to the like-named x_-prefixed member reached through
   this_target_cfgloop. */
702 #define target_avail_regs \
703 (this_target_cfgloop->x_target_avail_regs)
704 #define target_clobbered_regs \
705 (this_target_cfgloop->x_target_clobbered_regs)
706 #define target_res_regs \
707 (this_target_cfgloop->x_target_res_regs)
708 #define target_reg_cost \
709 (this_target_cfgloop->x_target_reg_cost)
710 #define target_spill_cost \
711 (this_target_cfgloop->x_target_spill_cost)
713 /* Register pressure estimation for induction variable optimizations & loop
714 invariant motion. */
715 extern unsigned estimate_reg_pressure_cost (unsigned, unsigned, bool, bool);
716 extern void init_set_costs (void);
718 /* Loop optimizer initialization. */
719 extern void loop_optimizer_init (unsigned);
720 extern void loop_optimizer_finalize (void);
722 /* Optimization passes. */
725 UAP_PEEL
= 1, /* Enables loop peeling. */
726 UAP_UNROLL
= 2, /* Enables unrolling of loops if it seems profitable. */
727 UAP_UNROLL_ALL
= 4 /* Enables unrolling of all loops. */
730 extern void unroll_and_peel_loops (int);
731 extern void doloop_optimize_loops (void);
732 extern void move_loop_invariants (void);
733 extern void scale_loop_profile (struct loop
*loop
, int scale
, gcov_type iteration_bound
);
734 extern vec
<basic_block
> get_loop_hot_path (const struct loop
*loop
);
736 /* Returns the outermost loop of the loop nest that contains LOOP. */
737 static inline struct loop
*
738 loop_outermost (struct loop
*loop
)
740 unsigned n
= vec_safe_length (loop
->superloops
);
745 return (*loop
->superloops
)[1];
748 extern void record_niter_bound (struct loop
*, const widest_int
&, bool, bool);
749 extern HOST_WIDE_INT
get_estimated_loop_iterations_int (struct loop
*);
750 extern HOST_WIDE_INT
get_max_loop_iterations_int (struct loop
*);
751 extern bool get_estimated_loop_iterations (struct loop
*loop
, widest_int
*nit
);
752 extern bool get_max_loop_iterations (struct loop
*loop
, widest_int
*nit
);
753 extern int bb_loop_depth (const_basic_block
);
755 /* Converts VAL to widest_int. */
757 static inline widest_int
758 gcov_type_to_wide_int (gcov_type val
)
762 a
[0] = (unsigned HOST_WIDE_INT
) val
;
763 /* If HOST_BITS_PER_WIDE_INT == HOST_BITS_PER_WIDEST_INT, avoid shifting by
764 the full width of the type. */
765 val
>>= HOST_BITS_PER_WIDE_INT
- 1;
767 a
[1] = (unsigned HOST_WIDE_INT
) val
;
769 return widest_int::from_array (a
, 2);
771 #endif /* GCC_CFGLOOP_H */