Analyze niter for until-wrap condition [PR101145]
[official-gcc.git] / gcc / loop-init.c
blob04054ef6222f8bdc07f693b44bf17006ee36d430
1 /* Loop optimizer initialization routines and RTL loop optimization passes.
2 Copyright (C) 2002-2021 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "cfghooks.h"
28 #include "df.h"
29 #include "regs.h"
30 #include "cfgcleanup.h"
31 #include "cfgloop.h"
32 #include "tree-pass.h"
33 #include "tree-ssa-loop-niter.h"
34 #include "loop-unroll.h"
35 #include "tree-scalar-evolution.h"
36 #include "tree-cfgcleanup.h"
39 /* Apply FLAGS to the loop state. */
41 static void
42 apply_loop_flags (unsigned flags)
44 if (flags & LOOPS_MAY_HAVE_MULTIPLE_LATCHES)
46 /* If the loops may have multiple latches, we cannot canonicalize
47 them further (and most of the loop manipulation functions will
48 not work). However, we avoid modifying cfg, which some
49 passes may want. */
50 gcc_assert ((flags & ~(LOOPS_MAY_HAVE_MULTIPLE_LATCHES
51 | LOOPS_HAVE_RECORDED_EXITS
52 | LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS)) == 0);
53 loops_state_set (LOOPS_MAY_HAVE_MULTIPLE_LATCHES);
55 else
56 disambiguate_loops_with_multiple_latches ();
58 /* Create pre-headers. */
59 if (flags & LOOPS_HAVE_PREHEADERS)
61 int cp_flags = CP_SIMPLE_PREHEADERS;
63 if (flags & LOOPS_HAVE_FALLTHRU_PREHEADERS)
64 cp_flags |= CP_FALLTHRU_PREHEADERS;
66 create_preheaders (cp_flags);
69 /* Force all latches to have only single successor. */
70 if (flags & LOOPS_HAVE_SIMPLE_LATCHES)
71 force_single_succ_latches ();
73 /* Mark irreducible loops. */
74 if (flags & LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS)
75 mark_irreducible_loops ();
77 if (flags & LOOPS_HAVE_RECORDED_EXITS)
78 record_loop_exits ();
81 /* Initialize loop structures. This is used by the tree and RTL loop
82 optimizers. FLAGS specify what properties to compute and/or ensure for
83 loops. */
85 void
86 loop_optimizer_init (unsigned flags)
88 timevar_push (TV_LOOP_INIT);
90 if (!current_loops)
92 gcc_assert (!(cfun->curr_properties & PROP_loops));
94 /* Find the loops. */
95 current_loops = flow_loops_find (NULL);
97 else
99 bool recorded_exits = loops_state_satisfies_p (LOOPS_HAVE_RECORDED_EXITS);
100 bool needs_fixup = loops_state_satisfies_p (LOOPS_NEED_FIXUP);
102 gcc_assert (cfun->curr_properties & PROP_loops);
104 /* Ensure that the dominators are computed, like flow_loops_find does. */
105 calculate_dominance_info (CDI_DOMINATORS);
107 if (!needs_fixup)
108 checking_verify_loop_structure ();
110 /* Clear all flags. */
111 if (recorded_exits)
112 release_recorded_exits (cfun);
113 loops_state_clear (~0U);
115 if (needs_fixup)
117 /* Apply LOOPS_MAY_HAVE_MULTIPLE_LATCHES early as fix_loop_structure
118 re-applies flags. */
119 loops_state_set (flags & LOOPS_MAY_HAVE_MULTIPLE_LATCHES);
120 fix_loop_structure (NULL);
124 /* Apply flags to loops. */
125 apply_loop_flags (flags);
127 /* Dump loops. */
128 flow_loops_dump (dump_file, NULL, 1);
130 checking_verify_loop_structure ();
132 timevar_pop (TV_LOOP_INIT);
135 /* Finalize loop structures. */
137 void
138 loop_optimizer_finalize (struct function *fn, bool clean_loop_closed_phi)
140 basic_block bb;
142 timevar_push (TV_LOOP_FINI);
144 if (clean_loop_closed_phi && loops_state_satisfies_p (fn, LOOP_CLOSED_SSA))
146 clean_up_loop_closed_phi (fn);
147 loops_state_clear (fn, LOOP_CLOSED_SSA);
150 if (loops_state_satisfies_p (fn, LOOPS_HAVE_RECORDED_EXITS))
151 release_recorded_exits (fn);
153 free_numbers_of_iterations_estimates (fn);
155 /* If we should preserve loop structure, do not free it but clear
156 flags that advanced properties are there as we are not preserving
157 that in full. */
158 if (fn->curr_properties & PROP_loops)
160 loops_state_clear (fn, LOOP_CLOSED_SSA
161 | LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS
162 | LOOPS_HAVE_PREHEADERS
163 | LOOPS_HAVE_SIMPLE_LATCHES
164 | LOOPS_HAVE_FALLTHRU_PREHEADERS);
165 loops_state_set (fn, LOOPS_MAY_HAVE_MULTIPLE_LATCHES);
166 goto loop_fini_done;
169 for (auto loop : loops_list (fn, 0))
170 free_simple_loop_desc (loop);
172 /* Clean up. */
173 flow_loops_free (loops_for_fn (fn));
174 ggc_free (loops_for_fn (fn));
175 set_loops_for_fn (fn, NULL);
177 FOR_ALL_BB_FN (bb, fn)
179 bb->loop_father = NULL;
182 loop_fini_done:
183 timevar_pop (TV_LOOP_FINI);
186 /* The structure of loops might have changed. Some loops might get removed
187 (and their headers and latches were set to NULL), loop exists might get
188 removed (thus the loop nesting may be wrong), and some blocks and edges
189 were changed (so the information about bb --> loop mapping does not have
190 to be correct). But still for the remaining loops the header dominates
191 the latch, and loops did not get new subloops (new loops might possibly
192 get created, but we are not interested in them). Fix up the mess.
194 If CHANGED_BBS is not NULL, basic blocks whose loop depth has changed are
195 marked in it.
197 Returns the number of new discovered loops. */
199 unsigned
200 fix_loop_structure (bitmap changed_bbs)
202 basic_block bb;
203 int record_exits = 0;
204 class loop *loop;
205 unsigned old_nloops, i;
207 timevar_push (TV_LOOP_INIT);
209 if (dump_file && (dump_flags & TDF_DETAILS))
210 fprintf (dump_file, "fix_loop_structure: fixing up loops for function\n");
212 /* We need exact and fast dominance info to be available. */
213 gcc_assert (dom_info_state (CDI_DOMINATORS) == DOM_OK);
215 if (loops_state_satisfies_p (LOOPS_HAVE_RECORDED_EXITS))
217 release_recorded_exits (cfun);
218 record_exits = LOOPS_HAVE_RECORDED_EXITS;
221 /* Remember the depth of the blocks in the loop hierarchy, so that we can
222 recognize blocks whose loop nesting relationship has changed. */
223 if (changed_bbs)
224 FOR_EACH_BB_FN (bb, cfun)
225 bb->aux = (void *) (size_t) loop_depth (bb->loop_father);
227 /* Remove the dead loops from structures. We start from the innermost
228 loops, so that when we remove the loops, we know that the loops inside
229 are preserved, and do not waste time relinking loops that will be
230 removed later. */
231 for (auto loop : loops_list (cfun, LI_FROM_INNERMOST))
233 /* Detect the case that the loop is no longer present even though
234 it wasn't marked for removal.
235 ??? If we do that we can get away with not marking loops for
236 removal at all. And possibly avoid some spurious removals. */
237 if (loop->header
238 && bb_loop_header_p (loop->header))
239 continue;
241 if (dump_file && (dump_flags & TDF_DETAILS))
242 fprintf (dump_file, "fix_loop_structure: removing loop %d\n",
243 loop->num);
245 while (loop->inner)
247 class loop *ploop = loop->inner;
248 flow_loop_tree_node_remove (ploop);
249 flow_loop_tree_node_add (loop_outer (loop), ploop);
252 /* Remove the loop. */
253 if (loop->header)
254 loop->former_header = loop->header;
255 else
256 gcc_assert (loop->former_header != NULL);
257 loop->header = NULL;
258 flow_loop_tree_node_remove (loop);
261 /* Remember the number of loops so we can return how many new loops
262 flow_loops_find discovered. */
263 old_nloops = number_of_loops (cfun);
265 /* Re-compute loop structure in-place. */
266 flow_loops_find (current_loops);
268 /* Mark the blocks whose loop has changed. */
269 if (changed_bbs)
271 FOR_EACH_BB_FN (bb, cfun)
273 if ((void *) (size_t) loop_depth (bb->loop_father) != bb->aux)
274 bitmap_set_bit (changed_bbs, bb->index);
276 bb->aux = NULL;
280 /* Finally free deleted loops. */
281 bool any_deleted = false;
282 FOR_EACH_VEC_ELT (*get_loops (cfun), i, loop)
283 if (loop && loop->header == NULL)
285 if (dump_file
286 && ((unsigned) loop->former_header->index
287 < basic_block_info_for_fn (cfun)->length ()))
289 basic_block former_header
290 = BASIC_BLOCK_FOR_FN (cfun, loop->former_header->index);
291 /* If the old header still exists we want to check if the
292 original loop is re-discovered or the old header is now
293 part of a newly discovered loop.
294 In both cases we should have avoided removing the loop. */
295 if (former_header == loop->former_header)
297 if (former_header->loop_father->header == former_header)
298 fprintf (dump_file, "fix_loop_structure: rediscovered "
299 "removed loop %d as loop %d with old header %d\n",
300 loop->num, former_header->loop_father->num,
301 former_header->index);
302 else if ((unsigned) former_header->loop_father->num
303 >= old_nloops)
304 fprintf (dump_file, "fix_loop_structure: header %d of "
305 "removed loop %d is part of the newly "
306 "discovered loop %d with header %d\n",
307 former_header->index, loop->num,
308 former_header->loop_father->num,
309 former_header->loop_father->header->index);
312 (*get_loops (cfun))[i] = NULL;
313 flow_loop_free (loop);
314 any_deleted = true;
317 /* If we deleted loops then the cached scalar evolutions refering to
318 those loops become invalid. */
319 if (any_deleted && scev_initialized_p ())
320 scev_reset_htab ();
322 loops_state_clear (LOOPS_NEED_FIXUP);
324 /* Apply flags to loops. */
325 apply_loop_flags (current_loops->state | record_exits);
327 checking_verify_loop_structure ();
329 timevar_pop (TV_LOOP_INIT);
331 return number_of_loops (cfun) - old_nloops;
334 /* The RTL loop superpass. The actual passes are subpasses. See passes.c for
335 more on that. */
337 namespace {
339 const pass_data pass_data_loop2 =
341 RTL_PASS, /* type */
342 "loop2", /* name */
343 OPTGROUP_LOOP, /* optinfo_flags */
344 TV_LOOP, /* tv_id */
345 0, /* properties_required */
346 0, /* properties_provided */
347 0, /* properties_destroyed */
348 0, /* todo_flags_start */
349 0, /* todo_flags_finish */
352 class pass_loop2 : public rtl_opt_pass
354 public:
355 pass_loop2 (gcc::context *ctxt)
356 : rtl_opt_pass (pass_data_loop2, ctxt)
359 /* opt_pass methods: */
360 virtual bool gate (function *);
362 }; // class pass_loop2
364 bool
365 pass_loop2::gate (function *fun)
367 if (optimize > 0
368 && (flag_move_loop_invariants
369 || flag_unswitch_loops
370 || flag_unroll_loops
371 || (flag_branch_on_count_reg && targetm.have_doloop_end ())
372 || cfun->has_unroll))
373 return true;
374 else
376 /* No longer preserve loops, remove them now. */
377 fun->curr_properties &= ~PROP_loops;
378 if (current_loops)
379 loop_optimizer_finalize ();
380 return false;
384 } // anon namespace
386 rtl_opt_pass *
387 make_pass_loop2 (gcc::context *ctxt)
389 return new pass_loop2 (ctxt);
393 /* Initialization of the RTL loop passes. */
394 static unsigned int
395 rtl_loop_init (void)
397 gcc_assert (current_ir_type () == IR_RTL_CFGLAYOUT);
399 if (dump_file)
401 dump_reg_info (dump_file);
402 dump_flow_info (dump_file, dump_flags);
405 loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
406 return 0;
409 namespace {
411 const pass_data pass_data_rtl_loop_init =
413 RTL_PASS, /* type */
414 "loop2_init", /* name */
415 OPTGROUP_LOOP, /* optinfo_flags */
416 TV_LOOP, /* tv_id */
417 0, /* properties_required */
418 0, /* properties_provided */
419 0, /* properties_destroyed */
420 0, /* todo_flags_start */
421 0, /* todo_flags_finish */
424 class pass_rtl_loop_init : public rtl_opt_pass
426 public:
427 pass_rtl_loop_init (gcc::context *ctxt)
428 : rtl_opt_pass (pass_data_rtl_loop_init, ctxt)
431 /* opt_pass methods: */
432 virtual unsigned int execute (function *) { return rtl_loop_init (); }
434 }; // class pass_rtl_loop_init
436 } // anon namespace
438 rtl_opt_pass *
439 make_pass_rtl_loop_init (gcc::context *ctxt)
441 return new pass_rtl_loop_init (ctxt);
445 /* Finalization of the RTL loop passes. */
447 namespace {
449 const pass_data pass_data_rtl_loop_done =
451 RTL_PASS, /* type */
452 "loop2_done", /* name */
453 OPTGROUP_LOOP, /* optinfo_flags */
454 TV_LOOP, /* tv_id */
455 0, /* properties_required */
456 0, /* properties_provided */
457 PROP_loops, /* properties_destroyed */
458 0, /* todo_flags_start */
459 0, /* todo_flags_finish */
462 class pass_rtl_loop_done : public rtl_opt_pass
464 public:
465 pass_rtl_loop_done (gcc::context *ctxt)
466 : rtl_opt_pass (pass_data_rtl_loop_done, ctxt)
469 /* opt_pass methods: */
470 virtual unsigned int execute (function *);
472 }; // class pass_rtl_loop_done
474 unsigned int
475 pass_rtl_loop_done::execute (function *fun)
477 /* No longer preserve loops, remove them now. */
478 fun->curr_properties &= ~PROP_loops;
479 loop_optimizer_finalize ();
480 free_dominance_info (CDI_DOMINATORS);
482 cleanup_cfg (0);
483 if (dump_file)
485 dump_reg_info (dump_file);
486 dump_flow_info (dump_file, dump_flags);
489 return 0;
492 } // anon namespace
494 rtl_opt_pass *
495 make_pass_rtl_loop_done (gcc::context *ctxt)
497 return new pass_rtl_loop_done (ctxt);
501 /* Loop invariant code motion. */
503 namespace {
505 const pass_data pass_data_rtl_move_loop_invariants =
507 RTL_PASS, /* type */
508 "loop2_invariant", /* name */
509 OPTGROUP_LOOP, /* optinfo_flags */
510 TV_LOOP_MOVE_INVARIANTS, /* tv_id */
511 0, /* properties_required */
512 0, /* properties_provided */
513 0, /* properties_destroyed */
514 0, /* todo_flags_start */
515 ( TODO_df_verify | TODO_df_finish ), /* todo_flags_finish */
518 class pass_rtl_move_loop_invariants : public rtl_opt_pass
520 public:
521 pass_rtl_move_loop_invariants (gcc::context *ctxt)
522 : rtl_opt_pass (pass_data_rtl_move_loop_invariants, ctxt)
525 /* opt_pass methods: */
526 virtual bool gate (function *) { return flag_move_loop_invariants; }
527 virtual unsigned int execute (function *fun)
529 if (number_of_loops (fun) > 1)
530 move_loop_invariants ();
531 return 0;
534 }; // class pass_rtl_move_loop_invariants
536 } // anon namespace
538 rtl_opt_pass *
539 make_pass_rtl_move_loop_invariants (gcc::context *ctxt)
541 return new pass_rtl_move_loop_invariants (ctxt);
545 namespace {
547 const pass_data pass_data_rtl_unroll_loops =
549 RTL_PASS, /* type */
550 "loop2_unroll", /* name */
551 OPTGROUP_LOOP, /* optinfo_flags */
552 TV_LOOP_UNROLL, /* tv_id */
553 0, /* properties_required */
554 0, /* properties_provided */
555 0, /* properties_destroyed */
556 0, /* todo_flags_start */
557 0, /* todo_flags_finish */
560 class pass_rtl_unroll_loops : public rtl_opt_pass
562 public:
563 pass_rtl_unroll_loops (gcc::context *ctxt)
564 : rtl_opt_pass (pass_data_rtl_unroll_loops, ctxt)
567 /* opt_pass methods: */
568 virtual bool gate (function *)
570 return (flag_unroll_loops || flag_unroll_all_loops || cfun->has_unroll);
573 virtual unsigned int execute (function *);
575 }; // class pass_rtl_unroll_loops
577 unsigned int
578 pass_rtl_unroll_loops::execute (function *fun)
580 if (number_of_loops (fun) > 1)
582 int flags = 0;
583 if (dump_file)
584 df_dump (dump_file);
586 if (flag_unroll_loops)
587 flags |= UAP_UNROLL;
588 if (flag_unroll_all_loops)
589 flags |= UAP_UNROLL_ALL;
591 unroll_loops (flags);
593 return 0;
596 } // anon namespace
598 rtl_opt_pass *
599 make_pass_rtl_unroll_loops (gcc::context *ctxt)
601 return new pass_rtl_unroll_loops (ctxt);
605 namespace {
607 const pass_data pass_data_rtl_doloop =
609 RTL_PASS, /* type */
610 "loop2_doloop", /* name */
611 OPTGROUP_LOOP, /* optinfo_flags */
612 TV_LOOP_DOLOOP, /* tv_id */
613 0, /* properties_required */
614 0, /* properties_provided */
615 0, /* properties_destroyed */
616 0, /* todo_flags_start */
617 0, /* todo_flags_finish */
620 class pass_rtl_doloop : public rtl_opt_pass
622 public:
623 pass_rtl_doloop (gcc::context *ctxt)
624 : rtl_opt_pass (pass_data_rtl_doloop, ctxt)
627 /* opt_pass methods: */
628 virtual bool gate (function *);
629 virtual unsigned int execute (function *);
631 }; // class pass_rtl_doloop
633 bool
634 pass_rtl_doloop::gate (function *)
636 return (flag_branch_on_count_reg && targetm.have_doloop_end ());
639 unsigned int
640 pass_rtl_doloop::execute (function *fun)
642 if (number_of_loops (fun) > 1)
643 doloop_optimize_loops ();
644 return 0;
647 } // anon namespace
649 rtl_opt_pass *
650 make_pass_rtl_doloop (gcc::context *ctxt)
652 return new pass_rtl_doloop (ctxt);