1 /* Natural loop functions
2 Copyright (C) 1987, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
3 2005, 2006, 2007, 2008 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
24 #include "basic-block.h"
28 #include "double-int.h"
30 /* Structure to hold decision about unrolling/peeling. */
41 struct lpt_decision
GTY (())
43 enum lpt_dec decision
;
47 /* The structure describing a bound on number of iterations of a loop. */
49 struct nb_iter_bound
GTY ((chain_next ("%h.next")))
51 /* The statement STMT is executed at most ... */
54 /* ... BOUND + 1 times (BOUND must be an unsigned constant).
55 The + 1 is added for the following reasons:
57 a) 0 would otherwise be unused, while we would need to care more about
58 overflows (as MAX + 1 is sometimes produced as the estimate on number
59 of executions of STMT).
60 b) it is consistent with the result of number_of_iterations_exit. */
63 /* True if the statement will cause the loop to be exited the (at most)
64 BOUND + 1-st time it is executed, that is, all the statements after it
65 are executed at most BOUND times. */
68 /* The next bound in the list. */
69 struct nb_iter_bound
*next
;
72 /* Description of the loop exit. */
74 struct loop_exit
GTY (())
79 /* Previous and next exit in the list of the exits of the loop. */
80 struct loop_exit
*prev
;
81 struct loop_exit
*next
;
83 /* Next element in the list of loops from which E exits. */
84 struct loop_exit
*next_e
;
87 typedef struct loop
*loop_p
;
89 DEF_VEC_ALLOC_P (loop_p
, heap
);
90 DEF_VEC_ALLOC_P (loop_p
, gc
);
92 /* The possible states of the integer estimation of the number of iterations
93 of a loop (the type of the estimate_state field of struct loop). */
96 /* Estimate was not computed yet. */
98 /* Estimate is ready. */
102 /* Structure to hold information for each natural loop. */
103 struct loop
GTY ((chain_next ("%h.next")))
105 /* Index into loops array. */
108 /* Basic block of loop header. */
109 struct basic_block_def
*header
;
111 /* Basic block of loop latch. */
112 struct basic_block_def
*latch
;
114 /* For loop unrolling/peeling decision. */
115 struct lpt_decision lpt_decision
;
117 /* Number of loop insns. */
120 /* Average number of executed insns per iteration. */
123 /* Number of blocks contained within the loop. */
126 /* Superloops of the loop, starting with the outermost loop. */
127 VEC (loop_p
, gc
) *superloops
;
129 /* The first inner (child) loop or NULL if innermost loop. */
132 /* Link to the next (sibling) loop. */
135 /* Auxiliary info specific to a pass. */
136 PTR
GTY ((skip (""))) aux
;
138 /* The number of times the latch of the loop is executed.
139 This is an INTEGER_CST or an expression containing symbolic
140 names. Don't access this field directly:
141 number_of_latch_executions computes and caches the computed
142 information in this field. */
145 /* An integer estimation of the number of iterations. Estimate_state
146 describes what is the state of the estimation. */
147 enum loop_estimation estimate_state
;
149 /* An integer guaranteed to bound the number of iterations of the loop from above. */
151 bool any_upper_bound
;
152 double_int nb_iterations_upper_bound
;
154 /* An integer giving the expected number of iterations of the loop. */
156 double_int nb_iterations_estimate
;
158 /* Upper bound on number of iterations of a loop. */
159 struct nb_iter_bound
*bounds
;
161 /* Head of the cyclic list of the exits of the loop. */
162 struct loop_exit
*exits
;
165 /* Flags for state of loop structure. */
168 LOOPS_HAVE_PREHEADERS
= 1,
169 LOOPS_HAVE_SIMPLE_LATCHES
= 2,
170 LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS
= 4,
171 LOOPS_HAVE_RECORDED_EXITS
= 8,
172 LOOPS_MAY_HAVE_MULTIPLE_LATCHES
= 16,
173 LOOP_CLOSED_SSA
= 32,
174 LOOPS_NEED_FIXUP
= 64,
175 LOOPS_HAVE_FALLTHRU_PREHEADERS
= 128
178 #define LOOPS_NORMAL (LOOPS_HAVE_PREHEADERS | LOOPS_HAVE_SIMPLE_LATCHES \
179 | LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS)
180 #define AVOID_CFG_MODIFICATIONS (LOOPS_MAY_HAVE_MULTIPLE_LATCHES)
182 /* Structure to hold CFG information about natural loops within a function. */
183 struct loops
GTY (())
185 /* State of loops. */
188 /* Array of the loops. */
189 VEC (loop_p
, gc
) *larray
;
191 /* Maps edges to the list of their descriptions as loop exits. Edges
192 whose sources or destinations have loop_father == NULL (which may
193 happen during the cfg manipulations) should not appear in EXITS. */
194 htab_t
GTY((param_is (struct loop_exit
))) exits
;
196 /* Pointer to root of loop hierarchy tree. */
197 struct loop
*tree_root
;
200 /* Loop recognition. */
201 extern int flow_loops_find (struct loops
*);
202 extern void disambiguate_loops_with_multiple_latches (void);
203 extern void flow_loops_free (struct loops
*);
204 extern void flow_loops_dump (FILE *,
205 void (*)(const struct loop
*, FILE *, int), int);
206 extern void flow_loop_dump (const struct loop
*, FILE *,
207 void (*)(const struct loop
*, FILE *, int), int);
208 struct loop
*alloc_loop (void);
209 extern void flow_loop_free (struct loop
*);
210 int flow_loop_nodes_find (basic_block
, struct loop
*);
211 void fix_loop_structure (bitmap changed_bbs
);
212 void mark_irreducible_loops (void);
213 void release_recorded_exits (void);
214 void record_loop_exits (void);
215 void rescan_loop_exit (edge
, bool, bool);
217 /* Loop data structure manipulation/querying. */
218 extern void flow_loop_tree_node_add (struct loop
*, struct loop
*);
219 extern void flow_loop_tree_node_remove (struct loop
*);
220 extern void add_loop (struct loop
*, struct loop
*);
221 extern bool flow_loop_nested_p (const struct loop
*, const struct loop
*);
222 extern bool flow_bb_inside_loop_p (const struct loop
*, const_basic_block
);
223 extern struct loop
* find_common_loop (struct loop
*, struct loop
*);
224 struct loop
*superloop_at_depth (struct loop
*, unsigned);
225 struct eni_weights_d
;
226 extern unsigned tree_num_loop_insns (struct loop
*, struct eni_weights_d
*);
227 extern int num_loop_insns (const struct loop
*);
228 extern int average_num_loop_insns (const struct loop
*);
229 extern unsigned get_loop_level (const struct loop
*);
230 extern bool loop_exit_edge_p (const struct loop
*, const_edge
);
231 extern bool is_loop_exit (struct loop
*, basic_block
);
232 extern void mark_loop_exit_edges (void);
234 /* Loops & cfg manipulation. */
235 extern basic_block
*get_loop_body (const struct loop
*);
236 extern unsigned get_loop_body_with_size (const struct loop
*, basic_block
*,
238 extern basic_block
*get_loop_body_in_dom_order (const struct loop
*);
239 extern basic_block
*get_loop_body_in_bfs_order (const struct loop
*);
240 extern basic_block
*get_loop_body_in_custom_order (const struct loop
*,
241 int (*) (const void *, const void *));
243 extern VEC (edge
, heap
) *get_loop_exit_edges (const struct loop
*);
244 edge
single_exit (const struct loop
*);
245 extern unsigned num_loop_branches (const struct loop
*);
247 extern edge
loop_preheader_edge (const struct loop
*);
248 extern edge
loop_latch_edge (const struct loop
*);
250 extern void add_bb_to_loop (basic_block
, struct loop
*);
251 extern void remove_bb_from_loops (basic_block
);
253 extern void cancel_loop_tree (struct loop
*);
254 extern void delete_loop (struct loop
*);
258 CP_SIMPLE_PREHEADERS
= 1,
259 CP_FALLTHRU_PREHEADERS
= 2
262 basic_block
create_preheader (struct loop
*, int);
263 extern void create_preheaders (int);
264 extern void force_single_succ_latches (void);
266 extern void verify_loop_structure (void);
269 extern bool just_once_each_iteration_p (const struct loop
*, const_basic_block
);
270 gcov_type
expected_loop_iterations_unbounded (const struct loop
*);
271 extern unsigned expected_loop_iterations (const struct loop
*);
272 extern rtx
doloop_condition_get (rtx
);
274 void estimate_numbers_of_iterations_loop (struct loop
*);
275 HOST_WIDE_INT
estimated_loop_iterations_int (struct loop
*, bool);
276 bool estimated_loop_iterations (struct loop
*, bool, double_int
*);
278 /* Loop manipulation. */
279 extern bool can_duplicate_loop_p (const struct loop
*loop
);
281 #define DLTHE_FLAG_UPDATE_FREQ 1 /* Update frequencies in
282 duplicate_loop_to_header_edge. */
283 #define DLTHE_RECORD_COPY_NUMBER 2 /* Record copy number in the aux
284 field of newly created BB. */
285 #define DLTHE_FLAG_COMPLETTE_PEEL 4 /* Update frequencies expecting
286 a complete peeling. */
288 extern edge
create_empty_if_region_on_edge (edge
, tree
);
289 extern struct loop
*create_empty_loop_on_edge (edge
, tree
, tree
, tree
, tree
,
290 tree
*, struct loop
*);
291 extern struct loop
* duplicate_loop (struct loop
*, struct loop
*);
292 extern bool duplicate_loop_to_header_edge (struct loop
*, edge
,
293 unsigned, sbitmap
, edge
,
294 VEC (edge
, heap
) **, int);
295 extern struct loop
*loopify (edge
, edge
,
296 basic_block
, edge
, edge
, bool,
298 struct loop
* loop_version (struct loop
*, void *,
299 basic_block
*, unsigned, unsigned, unsigned, bool);
300 extern bool remove_path (edge
);
301 void scale_loop_frequencies (struct loop
*, int, int);
303 /* Induction variable analysis. */
305 /* The description of induction variable. The things are a bit complicated
306 due to the need to handle subregs and extends. The value of the object described
307 by it can be obtained as follows (all computations are done in extend_mode):
309 Value in i-th iteration is
310 delta + mult * extend_{extend_mode} (subreg_{mode} (base + i * step)).
312 If first_special is true, the value in the first iteration is
315 If extend = UNKNOWN, first_special must be false, delta 0, mult 1 and value is
316 subreg_{mode} (base + i * step)
318 The get_iv_value function can be used to obtain these expressions.
320 ??? Add a third mode field that would specify the mode in which the inner
321 computation is done, which would enable it to be different from the
326 /* Its base and step (mode of base and step is supposed to be extend_mode,
327 see the description above). */
330 /* The type of extend applied to it (SIGN_EXTEND, ZERO_EXTEND or UNKNOWN). */
331 enum rtx_code extend
;
333 /* Operations applied in the extended mode. */
336 /* The mode it is extended to. */
337 enum machine_mode extend_mode
;
339 /* The mode the variable iterates in. */
340 enum machine_mode mode
;
342 /* Whether the first iteration needs to be handled specially. */
343 unsigned first_special
: 1;
346 /* The description of an exit from the loop and of the number of iterations
347 till we take the exit. */
351 /* The edge out of the loop. */
354 /* The other edge leading from the condition. */
357 /* True if we are able to say anything about the number of iterations of the loop. */
361 /* True if the loop iterates the constant number of times. */
364 /* Number of iterations if constant. */
365 unsigned HOST_WIDEST_INT niter
;
367 /* Upper bound on the number of iterations. */
368 unsigned HOST_WIDEST_INT niter_max
;
370 /* Assumptions under which the rest of the information is valid. */
373 /* Assumptions under which the loop ends before reaching the latch,
374 even if value of niter_expr says otherwise. */
375 rtx noloop_assumptions
;
377 /* Condition under which the loop is infinite. */
380 /* Whether the comparison is signed. */
383 /* The mode in which niter_expr should be computed. */
384 enum machine_mode mode
;
386 /* The number of iterations of the loop. */
390 extern void iv_analysis_loop_init (struct loop
*);
391 extern bool iv_analyze (rtx
, rtx
, struct rtx_iv
*);
392 extern bool iv_analyze_result (rtx
, rtx
, struct rtx_iv
*);
393 extern bool iv_analyze_expr (rtx
, rtx
, enum machine_mode
, struct rtx_iv
*);
394 extern rtx
get_iv_value (struct rtx_iv
*, rtx
);
395 extern bool biv_p (rtx
, rtx
);
396 extern void find_simple_exit (struct loop
*, struct niter_desc
*);
397 extern void iv_analysis_done (void);
399 extern struct niter_desc
*get_simple_loop_desc (struct loop
*loop
);
400 extern void free_simple_loop_desc (struct loop
*loop
);
/* Returns the contents of the AUX field of LOOP, cast to
   struct niter_desc *.  No check is made here that AUX actually holds
   such a description.  */
402 static inline struct niter_desc
*
403 simple_loop_desc (struct loop
*loop
)
405 return (struct niter_desc
*) loop
->aux
;
408 /* Accessors for the loop structures. */
410 /* Returns the loop with index NUM from current_loops, i.e. element NUM
   of the current_loops->larray vector. */
412 static inline struct loop
*
413 get_loop (unsigned num
)
415 return VEC_index (loop_p
, current_loops
->larray
, num
);
418 /* Returns the number of superloops of LOOP, i.e. the length of the
   LOOP->superloops vector. */
420 static inline unsigned
421 loop_depth (const struct loop
*loop
)
423 return VEC_length (loop_p
, loop
->superloops
);
426 /* Returns the immediate superloop of LOOP, or NULL if LOOP is the outermost loop. */
429 static inline struct loop
*
430 loop_outer (const struct loop
*loop
)
432 unsigned n
= VEC_length (loop_p
, loop
->superloops
);
437 return VEC_index (loop_p
, loop
->superloops
, n
- 1);
440 /* Returns the list of loops in current_loops. */
442 static inline VEC (loop_p
, gc
) *
448 return current_loops
->larray
;
451 /* Returns the number of loops in current_loops (including the removed
452 ones and the fake loop that forms the root of the loop tree). */
454 static inline unsigned
455 number_of_loops (void)
460 return VEC_length (loop_p
, current_loops
->larray
);
463 /* Returns true if state of the loops satisfies all properties
464 described by FLAGS, that is, if every bit set in FLAGS is also set in
   current_loops->state. */
467 loops_state_satisfies_p (unsigned flags
)
469 return (current_loops
->state
& flags
) == flags
;
472 /* Sets the bits given by FLAGS in the state of current_loops.  The flags
   are ORed in, so bits that are already set are kept. */
475 loops_state_set (unsigned flags
)
477 current_loops
->state
|= flags
;
480 /* Clears the bits given by FLAGS from the state of current_loops; all
   other state bits are left unchanged. */
483 loops_state_clear (unsigned flags
)
487 current_loops
->state
&= ~flags
;
490 /* Loop iterators. */
492 /* Flags for loop iteration. */
496 LI_INCLUDE_ROOT
= 1, /* Include the fake root of the loop tree. */
497 LI_FROM_INNERMOST
= 2, /* Iterate over the loops in the reverse order,
498 starting from innermost ones. */
499 LI_ONLY_INNERMOST
= 4 /* Iterate only over innermost loops. */
502 /* The iterator for loops. */
506 /* The list of loops to visit. */
507 VEC(int,heap
) *to_visit
;
509 /* The index of the actual loop. */
514 fel_next (loop_iterator
*li
, loop_p
*loop
)
518 while (VEC_iterate (int, li
->to_visit
, li
->idx
, anum
))
521 *loop
= get_loop (anum
);
526 VEC_free (int, heap
, li
->to_visit
);
531 fel_init (loop_iterator
*li
, loop_p
*loop
, unsigned flags
)
545 li
->to_visit
= VEC_alloc (int, heap
, number_of_loops ());
546 mn
= (flags
& LI_INCLUDE_ROOT
) ? 0 : 1;
548 if (flags
& LI_ONLY_INNERMOST
)
550 for (i
= 0; VEC_iterate (loop_p
, current_loops
->larray
, i
, aloop
); i
++)
552 && aloop
->inner
== NULL
554 VEC_quick_push (int, li
->to_visit
, aloop
->num
);
556 else if (flags
& LI_FROM_INNERMOST
)
558 /* Push the loops to LI->TO_VISIT in postorder. */
559 for (aloop
= current_loops
->tree_root
;
560 aloop
->inner
!= NULL
;
561 aloop
= aloop
->inner
)
566 if (aloop
->num
>= mn
)
567 VEC_quick_push (int, li
->to_visit
, aloop
->num
);
571 for (aloop
= aloop
->next
;
572 aloop
->inner
!= NULL
;
573 aloop
= aloop
->inner
)
576 else if (!loop_outer (aloop
))
579 aloop
= loop_outer (aloop
);
584 /* Push the loops to LI->TO_VISIT in preorder. */
585 aloop
= current_loops
->tree_root
;
588 if (aloop
->num
>= mn
)
589 VEC_quick_push (int, li
->to_visit
, aloop
->num
);
591 if (aloop
->inner
!= NULL
)
592 aloop
= aloop
->inner
;
595 while (aloop
!= NULL
&& aloop
->next
== NULL
)
596 aloop
= loop_outer (aloop
);
607 #define FOR_EACH_LOOP(LI, LOOP, FLAGS) \
608 for (fel_init (&(LI), &(LOOP), FLAGS); \
610 fel_next (&(LI), &(LOOP)))
/* Releases the TO_VISIT vector of the loop iterator LI; by its name, meant
   for leaving a FOR_EACH_LOOP traversal early.  LI is the iterator object
   itself (the same thing FOR_EACH_LOOP takes the address of), so its
   member is accessed with `.' rather than `->'.  */
612 #define FOR_EACH_LOOP_BREAK(LI) \
614 VEC_free (int, heap, (LI).to_visit); \
618 /* The properties of the target. */
620 extern unsigned target_avail_regs
;
621 extern unsigned target_res_regs
;
622 extern unsigned target_reg_cost
[2];
623 extern unsigned target_spill_cost
[2];
625 /* Register pressure estimation for induction variable optimizations & loop invariant motion. */
627 extern unsigned estimate_reg_pressure_cost (unsigned, unsigned, bool);
628 extern void init_set_costs (void);
630 /* Loop optimizer initialization. */
631 extern void loop_optimizer_init (unsigned);
632 extern void loop_optimizer_finalize (void);
634 /* Optimization passes. */
635 extern void unswitch_loops (void);
639 UAP_PEEL
= 1, /* Enables loop peeling. */
640 UAP_UNROLL
= 2, /* Enables unrolling of loops if it seems profitable. */
641 UAP_UNROLL_ALL
= 4 /* Enables unrolling of all loops. */
644 extern void unroll_and_peel_loops (int);
645 extern void doloop_optimize_loops (void);
646 extern void move_loop_invariants (void);
648 #endif /* GCC_CFGLOOP_H */