1 /* Loop header copying on trees.
2 Copyright (C) 2004-2020 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 3, or (at your option) any
11 GCC is distributed in the hope that it will be useful, but WITHOUT
12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
22 #include "coretypes.h"
27 #include "tree-pass.h"
28 #include "gimple-ssa.h"
29 #include "gimple-iterator.h"
31 #include "tree-into-ssa.h"
33 #include "tree-inline.h"
34 #include "tree-ssa-scopedtables.h"
35 #include "tree-ssa-threadedge.h"
36 #include "tree-ssa-sccvn.h"
37 #include "tree-phinodes.h"
38 #include "ssa-iterators.h"
40 /* Duplicates headers of loops if they are small enough, so that the statements
41 in the loop body are always executed when the loop is entered. This
42 increases effectiveness of code motion optimizations, and reduces the need
43 for loop preconditioning. */
45 /* Check whether we should duplicate HEADER of LOOP. At most *LIMIT
46 instructions should be duplicated, limit is decreased by the actual
50 should_duplicate_loop_header_p (basic_block header
, class loop
*loop
,
53 gimple_stmt_iterator bsi
;
55 gcc_assert (!header
->aux
);
57 /* Loop header copying usually increases size of the code. This used not to
58 be true, since quite often it is possible to verify that the condition is
59 satisfied in the first iteration and therefore to eliminate it. Jump
60 threading handles these cases now. */
61 if (optimize_loop_for_size_p (loop
)
62 && !loop
->force_vectorize
)
64 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
66 " Not duplicating bb %i: optimizing for size.\n",
71 gcc_assert (EDGE_COUNT (header
->succs
) > 0);
72 if (single_succ_p (header
))
74 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
76 " Not duplicating bb %i: it is single succ.\n",
81 if (flow_bb_inside_loop_p (loop
, EDGE_SUCC (header
, 0)->dest
)
82 && flow_bb_inside_loop_p (loop
, EDGE_SUCC (header
, 1)->dest
))
84 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
86 " Not duplicating bb %i: both successors are in loop.\n",
91 /* If this is not the original loop header, we want it to have just
92 one predecessor in order to match the && pattern. */
93 if (header
!= loop
->header
&& !single_pred_p (header
))
95 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
97 " Not duplicating bb %i: it has mutiple predecestors.\n",
102 gcond
*last
= safe_dyn_cast
<gcond
*> (last_stmt (header
));
105 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
107 " Not duplicating bb %i: it does not end by conditional.\n",
112 for (gphi_iterator psi
= gsi_start_phis (header
); !gsi_end_p (psi
);
115 gphi
*phi
= psi
.phi ();
116 tree res
= gimple_phi_result (phi
);
117 if (INTEGRAL_TYPE_P (TREE_TYPE (res
))
118 || POINTER_TYPE_P (TREE_TYPE (res
)))
119 gimple_set_uid (phi
, 1 /* IV */);
121 gimple_set_uid (phi
, 0);
124 /* Count number of instructions and punt on calls.
125 Populate stmts INV/IV flag to later apply heuristics to the
126 kind of conditions we want to copy. */
127 for (bsi
= gsi_start_bb (header
); !gsi_end_p (bsi
); gsi_next (&bsi
))
129 gimple
*last
= gsi_stmt (bsi
);
131 if (gimple_code (last
) == GIMPLE_LABEL
)
134 if (is_gimple_debug (last
))
137 if (gimple_code (last
) == GIMPLE_CALL
138 && (!gimple_inexpensive_call_p (as_a
<gcall
*> (last
))
139 /* IFN_LOOP_DIST_ALIAS means that inner loop is distributed
140 at current loop's header. Don't copy in this case. */
141 || gimple_call_internal_p (last
, IFN_LOOP_DIST_ALIAS
)))
143 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
145 " Not duplicating bb %i: it contains call.\n",
150 *limit
-= estimate_num_insns (last
, &eni_size_weights
);
153 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
155 " Not duplicating bb %i contains too many insns.\n",
160 /* Classify the stmt based on whether its computation is based
161 on a IV or whether it is invariant in the loop. */
162 gimple_set_uid (last
, 0);
163 if (!gimple_vuse (last
))
169 FOR_EACH_SSA_TREE_OPERAND (op
, last
, i
, SSA_OP_USE
)
170 if (!SSA_NAME_IS_DEFAULT_DEF (op
)
171 && flow_bb_inside_loop_p (loop
,
172 gimple_bb (SSA_NAME_DEF_STMT (op
))))
174 if (!(gimple_uid (SSA_NAME_DEF_STMT (op
)) & 2 /* INV */))
176 if (gimple_uid (SSA_NAME_DEF_STMT (op
)) & 1 /* IV */)
179 gimple_set_uid (last
, (iv
? 1 : 0) | (inv
? 2 : 0));
183 /* If the condition tests a non-IV loop variant we do not want to rotate
184 the loop further. Unless this is the original loop header. */
185 tree lhs
= gimple_cond_lhs (last
);
186 tree rhs
= gimple_cond_rhs (last
);
187 if (header
!= loop
->header
188 && ((TREE_CODE (lhs
) == SSA_NAME
189 && !SSA_NAME_IS_DEFAULT_DEF (lhs
)
190 && flow_bb_inside_loop_p (loop
, gimple_bb (SSA_NAME_DEF_STMT (lhs
)))
191 && gimple_uid (SSA_NAME_DEF_STMT (lhs
)) == 0)
192 || (TREE_CODE (rhs
) == SSA_NAME
193 && !SSA_NAME_IS_DEFAULT_DEF (rhs
)
194 && flow_bb_inside_loop_p (loop
,
195 gimple_bb (SSA_NAME_DEF_STMT (rhs
)))
196 && gimple_uid (SSA_NAME_DEF_STMT (rhs
)) == 0)))
198 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
200 " Not duplicating bb %i: condition based on non-IV loop"
201 " variant.\n", header
->index
);
205 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
206 fprintf (dump_file
, " Will duplicate bb %i\n", header
->index
);
210 /* Checks whether LOOP is a do-while style loop. */
213 do_while_loop_p (class loop
*loop
)
215 gimple
*stmt
= last_stmt (loop
->latch
);
217 /* If the latch of the loop is not empty, it is not a do-while loop. */
219 && gimple_code (stmt
) != GIMPLE_LABEL
)
221 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
223 "Loop %i is not do-while loop: latch is not empty.\n",
228 /* If the latch does not have a single predecessor, it is not a
230 if (!single_pred_p (loop
->latch
))
232 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
234 "Loop %i is not do-while loop: latch has multiple "
235 "predecessors.\n", loop
->num
);
239 /* If the latch predecessor doesn't exit the loop, it is not a
241 if (!loop_exits_from_bb_p (loop
, single_pred (loop
->latch
)))
243 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
245 "Loop %i is not do-while loop: latch predecessor "
246 "does not exit loop.\n", loop
->num
);
250 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
251 fprintf (dump_file
, "Loop %i is do-while loop\n", loop
->num
);
258 /* Common superclass for both header-copying phases. */
259 class ch_base
: public gimple_opt_pass
262 ch_base (pass_data data
, gcc::context
*ctxt
)
263 : gimple_opt_pass (data
, ctxt
)
266 /* Copies headers of all loops in FUN for which process_loop_p is true. */
267 unsigned int copy_headers (function
*fun
);
269 /* Return true to copy headers of LOOP or false to skip. */
270 virtual bool process_loop_p (class loop
*loop
) = 0;
273 const pass_data pass_data_ch
=
275 GIMPLE_PASS
, /* type */
277 OPTGROUP_LOOP
, /* optinfo_flags */
278 TV_TREE_CH
, /* tv_id */
279 ( PROP_cfg
| PROP_ssa
), /* properties_required */
280 0, /* properties_provided */
281 0, /* properties_destroyed */
282 0, /* todo_flags_start */
283 0, /* todo_flags_finish */
286 class pass_ch
: public ch_base
289 pass_ch (gcc::context
*ctxt
)
290 : ch_base (pass_data_ch
, ctxt
)
293 /* opt_pass methods: */
294 virtual bool gate (function
*) { return flag_tree_ch
!= 0; }
296 /* Initialize and finalize loop structures, copying headers inbetween. */
297 virtual unsigned int execute (function
*);
299 opt_pass
* clone () { return new pass_ch (m_ctxt
); }
302 /* ch_base method: */
303 virtual bool process_loop_p (class loop
*loop
);
306 const pass_data pass_data_ch_vect
=
308 GIMPLE_PASS
, /* type */
309 "ch_vect", /* name */
310 OPTGROUP_LOOP
, /* optinfo_flags */
311 TV_TREE_CH
, /* tv_id */
312 ( PROP_cfg
| PROP_ssa
), /* properties_required */
313 0, /* properties_provided */
314 0, /* properties_destroyed */
315 0, /* todo_flags_start */
316 0, /* todo_flags_finish */
319 /* This is a more aggressive version of the same pass, designed to run just
320 before if-conversion and vectorization, to put more loops into the form
321 required for those phases. */
322 class pass_ch_vect
: public ch_base
325 pass_ch_vect (gcc::context
*ctxt
)
326 : ch_base (pass_data_ch_vect
, ctxt
)
329 /* opt_pass methods: */
330 virtual bool gate (function
*fun
)
332 return flag_tree_ch
!= 0
333 && (flag_tree_loop_vectorize
!= 0 || fun
->has_force_vectorize_loops
);
336 /* Just copy headers, no initialization/finalization of loop structures. */
337 virtual unsigned int execute (function
*);
340 /* ch_base method: */
341 virtual bool process_loop_p (class loop
*loop
);
342 }; // class pass_ch_vect
344 /* For all loops, copy the condition at the end of the loop body in front
345 of the loop. This is beneficial since it increases efficiency of
346 code motion optimizations. It also saves one jump on entry to the loop. */
349 ch_base::copy_headers (function
*fun
)
354 basic_block
*bbs
, *copied_bbs
;
357 bool changed
= false;
359 if (number_of_loops (fun
) <= 1)
362 bbs
= XNEWVEC (basic_block
, n_basic_blocks_for_fn (fun
));
363 copied_bbs
= XNEWVEC (basic_block
, n_basic_blocks_for_fn (fun
));
364 bbs_size
= n_basic_blocks_for_fn (fun
);
366 auto_vec
<std::pair
<edge
, loop_p
> > copied
;
368 FOR_EACH_LOOP (loop
, 0)
370 int initial_limit
= param_max_loop_header_insns
;
371 int remaining_limit
= initial_limit
;
372 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
374 "Analyzing loop %i\n", loop
->num
);
376 header
= loop
->header
;
378 /* If the loop is already a do-while style one (either because it was
379 written as such, or because jump threading transformed it into one),
380 we might be in fact peeling the first iteration of the loop. This
381 in general is not a good idea. Also avoid touching infinite loops. */
382 if (!loop_has_exit_edges (loop
)
383 || !process_loop_p (loop
))
386 /* Iterate the header copying up to limit; this takes care of the cases
387 like while (a && b) {...}, where we want to have both of the conditions
388 copied. TODO -- handle while (a || b) - like cases, by not requiring
389 the header to have just a single successor and copying up to
394 while (should_duplicate_loop_header_p (header
, loop
, &remaining_limit
))
396 /* Find a successor of header that is inside a loop; i.e. the new
397 header after the condition is copied. */
398 if (flow_bb_inside_loop_p (loop
, EDGE_SUCC (header
, 0)->dest
))
399 exit
= EDGE_SUCC (header
, 0);
401 exit
= EDGE_SUCC (header
, 1);
402 bbs
[n_bbs
++] = header
;
403 gcc_assert (bbs_size
> n_bbs
);
410 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
412 "Duplicating header of the loop %d up to edge %d->%d,"
414 loop
->num
, exit
->src
->index
, exit
->dest
->index
,
415 initial_limit
- remaining_limit
);
417 /* Ensure that the header will have just the latch as a predecessor
419 if (!single_pred_p (exit
->dest
))
420 exit
= single_pred_edge (split_edge (exit
));
422 entry
= loop_preheader_edge (loop
);
424 propagate_threaded_block_debug_into (exit
->dest
, entry
->dest
);
425 if (!gimple_duplicate_sese_region (entry
, exit
, bbs
, n_bbs
, copied_bbs
,
428 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
429 fprintf (dump_file
, "Duplication failed.\n");
432 copied
.safe_push (std::make_pair (entry
, loop
));
434 /* If the loop has the form "for (i = j; i < j + 10; i++)" then
435 this copying can introduce a case where we rely on undefined
436 signed overflow to eliminate the preheader condition, because
437 we assume that "j < j + 10" is true. We don't want to warn
438 about that case for -Wstrict-overflow, because in general we
439 don't warn about overflow involving loops. Prevent the
440 warning by setting the no_warning flag in the condition. */
441 if (warn_strict_overflow
> 0)
445 for (i
= 0; i
< n_bbs
; ++i
)
447 gimple_stmt_iterator bsi
;
449 for (bsi
= gsi_start_bb (copied_bbs
[i
]);
453 gimple
*stmt
= gsi_stmt (bsi
);
454 if (gimple_code (stmt
) == GIMPLE_COND
)
456 tree lhs
= gimple_cond_lhs (stmt
);
457 if (gimple_cond_code (stmt
) != EQ_EXPR
458 && gimple_cond_code (stmt
) != NE_EXPR
459 && INTEGRAL_TYPE_P (TREE_TYPE (lhs
))
460 && TYPE_OVERFLOW_UNDEFINED (TREE_TYPE (lhs
)))
461 gimple_set_no_warning (stmt
, true);
463 else if (is_gimple_assign (stmt
))
465 enum tree_code rhs_code
= gimple_assign_rhs_code (stmt
);
466 tree rhs1
= gimple_assign_rhs1 (stmt
);
467 if (TREE_CODE_CLASS (rhs_code
) == tcc_comparison
468 && rhs_code
!= EQ_EXPR
469 && rhs_code
!= NE_EXPR
470 && INTEGRAL_TYPE_P (TREE_TYPE (rhs1
))
471 && TYPE_OVERFLOW_UNDEFINED (TREE_TYPE (rhs1
)))
472 gimple_set_no_warning (stmt
, true);
478 /* Ensure that the latch and the preheader is simple (we know that they
479 are not now, since there was the loop exit condition. */
480 split_edge (loop_preheader_edge (loop
));
481 split_edge (loop_latch_edge (loop
));
483 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
485 if (do_while_loop_p (loop
))
486 fprintf (dump_file
, "Loop %d is now do-while loop.\n", loop
->num
);
488 fprintf (dump_file
, "Loop %d is still not do-while loop.\n",
497 update_ssa (TODO_update_ssa
);
498 /* After updating SSA form perform CSE on the loop header
499 copies. This is esp. required for the pass before
500 vectorization since nothing cleans up copied exit tests
501 that can now be simplified. CSE from the entry of the
502 region we copied till all loop exit blocks but not
503 entering the loop itself. */
504 for (unsigned i
= 0; i
< copied
.length (); ++i
)
506 edge entry
= copied
[i
].first
;
507 loop_p loop
= copied
[i
].second
;
508 auto_vec
<edge
> exit_edges
= get_loop_exit_edges (loop
);
509 bitmap exit_bbs
= BITMAP_ALLOC (NULL
);
510 for (unsigned j
= 0; j
< exit_edges
.length (); ++j
)
511 bitmap_set_bit (exit_bbs
, exit_edges
[j
]->dest
->index
);
512 bitmap_set_bit (exit_bbs
, loop
->header
->index
);
513 do_rpo_vn (cfun
, entry
, exit_bbs
);
514 BITMAP_FREE (exit_bbs
);
520 return changed
? TODO_cleanup_cfg
: 0;
523 /* Initialize the loop structures we need, and finalize after. */
526 pass_ch::execute (function
*fun
)
528 loop_optimizer_init (LOOPS_HAVE_PREHEADERS
529 | LOOPS_HAVE_SIMPLE_LATCHES
530 | LOOPS_HAVE_RECORDED_EXITS
);
532 unsigned int res
= copy_headers (fun
);
534 loop_optimizer_finalize ();
538 /* Assume an earlier phase has already initialized all the loop structures that
539 we need here (and perhaps others too), and that these will be finalized by
543 pass_ch_vect::execute (function
*fun
)
545 return copy_headers (fun
);
548 /* Apply header copying according to a very simple test of do-while shape. */
551 pass_ch::process_loop_p (class loop
*loop
)
553 return !do_while_loop_p (loop
);
556 /* Apply header-copying to loops where we might enable vectorization. */
559 pass_ch_vect::process_loop_p (class loop
*loop
)
561 if (!flag_tree_loop_vectorize
&& !loop
->force_vectorize
)
564 if (loop
->dont_vectorize
)
567 /* The vectorizer won't handle anything with multiple exits, so skip. */
568 edge exit
= single_exit (loop
);
572 if (!do_while_loop_p (loop
))
581 make_pass_ch_vect (gcc::context
*ctxt
)
583 return new pass_ch_vect (ctxt
);
587 make_pass_ch (gcc::context
*ctxt
)
589 return new pass_ch (ctxt
);