Emit SIMD moves as mov
[official-gcc.git] / gcc / tree-ssa-loop.c
blob19a0f30c525cc98a0eb9ddd7c70712e88f94180c
1 /* Loop optimizations over tree-ssa.
2 Copyright (C) 2003-2017 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 3, or (at your option) any
9 later version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT
12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "tree.h"
25 #include "gimple.h"
26 #include "tree-pass.h"
27 #include "memmodel.h"
28 #include "tm_p.h"
29 #include "fold-const.h"
30 #include "gimple-iterator.h"
31 #include "tree-ssa-loop-ivopts.h"
32 #include "tree-ssa-loop-manip.h"
33 #include "tree-ssa-loop-niter.h"
34 #include "tree-ssa-loop.h"
35 #include "cfgloop.h"
36 #include "tree-inline.h"
37 #include "tree-scalar-evolution.h"
38 #include "tree-vectorizer.h"
39 #include "omp-general.h"
40 #include "diagnostic-core.h"
43 /* A pass making sure loops are fixed up. */
45 namespace {
47 const pass_data pass_data_fix_loops =
49 GIMPLE_PASS, /* type */
50 "fix_loops", /* name */
51 OPTGROUP_LOOP, /* optinfo_flags */
52 TV_TREE_LOOP, /* tv_id */
53 PROP_cfg, /* properties_required */
54 0, /* properties_provided */
55 0, /* properties_destroyed */
56 0, /* todo_flags_start */
57 0, /* todo_flags_finish */
60 class pass_fix_loops : public gimple_opt_pass
62 public:
63 pass_fix_loops (gcc::context *ctxt)
64 : gimple_opt_pass (pass_data_fix_loops, ctxt)
67 /* opt_pass methods: */
68 virtual bool gate (function *) { return flag_tree_loop_optimize; }
70 virtual unsigned int execute (function *fn);
71 }; // class pass_fix_loops
73 unsigned int
74 pass_fix_loops::execute (function *)
76 if (loops_state_satisfies_p (LOOPS_NEED_FIXUP))
78 calculate_dominance_info (CDI_DOMINATORS);
79 fix_loop_structure (NULL);
81 return 0;
84 } // anon namespace
86 gimple_opt_pass *
87 make_pass_fix_loops (gcc::context *ctxt)
89 return new pass_fix_loops (ctxt);
93 /* Gate for loop pass group. The group is controlled by -ftree-loop-optimize
94 but we also avoid running it when the IL doesn't contain any loop. */
96 static bool
97 gate_loop (function *fn)
99 if (!flag_tree_loop_optimize)
100 return false;
102 /* For -fdump-passes which runs before loop discovery print the
103 state of -ftree-loop-optimize. */
104 if (!loops_for_fn (fn))
105 return true;
107 return number_of_loops (fn) > 1;
110 /* The loop superpass. */
112 namespace {
114 const pass_data pass_data_tree_loop =
116 GIMPLE_PASS, /* type */
117 "loop", /* name */
118 OPTGROUP_LOOP, /* optinfo_flags */
119 TV_TREE_LOOP, /* tv_id */
120 PROP_cfg, /* properties_required */
121 0, /* properties_provided */
122 0, /* properties_destroyed */
123 0, /* todo_flags_start */
124 0, /* todo_flags_finish */
127 class pass_tree_loop : public gimple_opt_pass
129 public:
130 pass_tree_loop (gcc::context *ctxt)
131 : gimple_opt_pass (pass_data_tree_loop, ctxt)
134 /* opt_pass methods: */
135 virtual bool gate (function *fn) { return gate_loop (fn); }
137 }; // class pass_tree_loop
139 } // anon namespace
141 gimple_opt_pass *
142 make_pass_tree_loop (gcc::context *ctxt)
144 return new pass_tree_loop (ctxt);
147 /* Gate for oacc kernels pass group. */
149 static bool
150 gate_oacc_kernels (function *fn)
152 if (!flag_openacc)
153 return false;
155 if (!lookup_attribute ("oacc kernels", DECL_ATTRIBUTES (fn->decl)))
156 return false;
158 struct loop *loop;
159 FOR_EACH_LOOP (loop, 0)
160 if (loop->in_oacc_kernels_region)
161 return true;
163 return false;
166 /* The oacc kernels superpass. */
168 namespace {
170 const pass_data pass_data_oacc_kernels =
172 GIMPLE_PASS, /* type */
173 "oacc_kernels", /* name */
174 OPTGROUP_LOOP, /* optinfo_flags */
175 TV_TREE_LOOP, /* tv_id */
176 PROP_cfg, /* properties_required */
177 0, /* properties_provided */
178 0, /* properties_destroyed */
179 0, /* todo_flags_start */
180 0, /* todo_flags_finish */
183 class pass_oacc_kernels : public gimple_opt_pass
185 public:
186 pass_oacc_kernels (gcc::context *ctxt)
187 : gimple_opt_pass (pass_data_oacc_kernels, ctxt)
190 /* opt_pass methods: */
191 virtual bool gate (function *fn) { return gate_oacc_kernels (fn); }
193 }; // class pass_oacc_kernels
195 } // anon namespace
197 gimple_opt_pass *
198 make_pass_oacc_kernels (gcc::context *ctxt)
200 return new pass_oacc_kernels (ctxt);
203 /* The ipa oacc superpass. */
205 namespace {
207 const pass_data pass_data_ipa_oacc =
209 SIMPLE_IPA_PASS, /* type */
210 "ipa_oacc", /* name */
211 OPTGROUP_LOOP, /* optinfo_flags */
212 TV_TREE_LOOP, /* tv_id */
213 PROP_cfg, /* properties_required */
214 0, /* properties_provided */
215 0, /* properties_destroyed */
216 0, /* todo_flags_start */
217 0, /* todo_flags_finish */
220 class pass_ipa_oacc : public simple_ipa_opt_pass
222 public:
223 pass_ipa_oacc (gcc::context *ctxt)
224 : simple_ipa_opt_pass (pass_data_ipa_oacc, ctxt)
227 /* opt_pass methods: */
228 virtual bool gate (function *)
230 return (optimize
231 && flag_openacc
232 /* Don't bother doing anything if the program has errors. */
233 && !seen_error ());
236 }; // class pass_ipa_oacc
238 } // anon namespace
240 simple_ipa_opt_pass *
241 make_pass_ipa_oacc (gcc::context *ctxt)
243 return new pass_ipa_oacc (ctxt);
246 /* The ipa oacc kernels pass. */
248 namespace {
250 const pass_data pass_data_ipa_oacc_kernels =
252 SIMPLE_IPA_PASS, /* type */
253 "ipa_oacc_kernels", /* name */
254 OPTGROUP_LOOP, /* optinfo_flags */
255 TV_TREE_LOOP, /* tv_id */
256 PROP_cfg, /* properties_required */
257 0, /* properties_provided */
258 0, /* properties_destroyed */
259 0, /* todo_flags_start */
260 0, /* todo_flags_finish */
263 class pass_ipa_oacc_kernels : public simple_ipa_opt_pass
265 public:
266 pass_ipa_oacc_kernels (gcc::context *ctxt)
267 : simple_ipa_opt_pass (pass_data_ipa_oacc_kernels, ctxt)
270 }; // class pass_ipa_oacc_kernels
272 } // anon namespace
274 simple_ipa_opt_pass *
275 make_pass_ipa_oacc_kernels (gcc::context *ctxt)
277 return new pass_ipa_oacc_kernels (ctxt);
280 /* The no-loop superpass. */
282 namespace {
284 const pass_data pass_data_tree_no_loop =
286 GIMPLE_PASS, /* type */
287 "no_loop", /* name */
288 OPTGROUP_NONE, /* optinfo_flags */
289 TV_TREE_NOLOOP, /* tv_id */
290 PROP_cfg, /* properties_required */
291 0, /* properties_provided */
292 0, /* properties_destroyed */
293 0, /* todo_flags_start */
294 0, /* todo_flags_finish */
297 class pass_tree_no_loop : public gimple_opt_pass
299 public:
300 pass_tree_no_loop (gcc::context *ctxt)
301 : gimple_opt_pass (pass_data_tree_no_loop, ctxt)
304 /* opt_pass methods: */
305 virtual bool gate (function *fn) { return !gate_loop (fn); }
307 }; // class pass_tree_no_loop
309 } // anon namespace
311 gimple_opt_pass *
312 make_pass_tree_no_loop (gcc::context *ctxt)
314 return new pass_tree_no_loop (ctxt);
318 /* Loop optimizer initialization. */
320 namespace {
322 const pass_data pass_data_tree_loop_init =
324 GIMPLE_PASS, /* type */
325 "loopinit", /* name */
326 OPTGROUP_LOOP, /* optinfo_flags */
327 TV_NONE, /* tv_id */
328 PROP_cfg, /* properties_required */
329 0, /* properties_provided */
330 0, /* properties_destroyed */
331 0, /* todo_flags_start */
332 0, /* todo_flags_finish */
335 class pass_tree_loop_init : public gimple_opt_pass
337 public:
338 pass_tree_loop_init (gcc::context *ctxt)
339 : gimple_opt_pass (pass_data_tree_loop_init, ctxt)
342 /* opt_pass methods: */
343 virtual unsigned int execute (function *);
345 }; // class pass_tree_loop_init
347 unsigned int
348 pass_tree_loop_init::execute (function *fun ATTRIBUTE_UNUSED)
350 /* When processing a loop in the loop pipeline, we should be able to assert
351 that:
352 (loops_state_satisfies_p (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS
353 | LOOP_CLOSED_SSA)
354 && scev_initialized_p ())
356 loop_optimizer_init (LOOPS_NORMAL
357 | LOOPS_HAVE_RECORDED_EXITS);
358 rewrite_into_loop_closed_ssa (NULL, TODO_update_ssa);
359 scev_initialize ();
361 return 0;
364 } // anon namespace
366 gimple_opt_pass *
367 make_pass_tree_loop_init (gcc::context *ctxt)
369 return new pass_tree_loop_init (ctxt);
372 /* Loop autovectorization. */
374 namespace {
376 const pass_data pass_data_vectorize =
378 GIMPLE_PASS, /* type */
379 "vect", /* name */
380 OPTGROUP_LOOP | OPTGROUP_VEC, /* optinfo_flags */
381 TV_TREE_VECTORIZATION, /* tv_id */
382 ( PROP_cfg | PROP_ssa ), /* properties_required */
383 0, /* properties_provided */
384 0, /* properties_destroyed */
385 0, /* todo_flags_start */
386 0, /* todo_flags_finish */
389 class pass_vectorize : public gimple_opt_pass
391 public:
392 pass_vectorize (gcc::context *ctxt)
393 : gimple_opt_pass (pass_data_vectorize, ctxt)
396 /* opt_pass methods: */
397 virtual bool gate (function *fun)
399 return flag_tree_loop_vectorize || fun->has_force_vectorize_loops;
402 virtual unsigned int execute (function *);
404 }; // class pass_vectorize
406 unsigned int
407 pass_vectorize::execute (function *fun)
409 if (number_of_loops (fun) <= 1)
410 return 0;
412 return vectorize_loops ();
415 } // anon namespace
417 gimple_opt_pass *
418 make_pass_vectorize (gcc::context *ctxt)
420 return new pass_vectorize (ctxt);
423 /* Propagation of constants using scev. */
425 namespace {
427 const pass_data pass_data_scev_cprop =
429 GIMPLE_PASS, /* type */
430 "sccp", /* name */
431 OPTGROUP_LOOP, /* optinfo_flags */
432 TV_SCEV_CONST, /* tv_id */
433 ( PROP_cfg | PROP_ssa ), /* properties_required */
434 0, /* properties_provided */
435 0, /* properties_destroyed */
436 0, /* todo_flags_start */
437 ( TODO_cleanup_cfg
438 | TODO_update_ssa_only_virtuals ), /* todo_flags_finish */
441 class pass_scev_cprop : public gimple_opt_pass
443 public:
444 pass_scev_cprop (gcc::context *ctxt)
445 : gimple_opt_pass (pass_data_scev_cprop, ctxt)
448 /* opt_pass methods: */
449 virtual bool gate (function *) { return flag_tree_scev_cprop; }
450 virtual unsigned int execute (function *) { return scev_const_prop (); }
452 }; // class pass_scev_cprop
454 } // anon namespace
456 gimple_opt_pass *
457 make_pass_scev_cprop (gcc::context *ctxt)
459 return new pass_scev_cprop (ctxt);
462 /* Induction variable optimizations. */
464 namespace {
466 const pass_data pass_data_iv_optimize =
468 GIMPLE_PASS, /* type */
469 "ivopts", /* name */
470 OPTGROUP_LOOP, /* optinfo_flags */
471 TV_TREE_LOOP_IVOPTS, /* tv_id */
472 ( PROP_cfg | PROP_ssa ), /* properties_required */
473 0, /* properties_provided */
474 0, /* properties_destroyed */
475 0, /* todo_flags_start */
476 TODO_update_ssa, /* todo_flags_finish */
479 class pass_iv_optimize : public gimple_opt_pass
481 public:
482 pass_iv_optimize (gcc::context *ctxt)
483 : gimple_opt_pass (pass_data_iv_optimize, ctxt)
486 /* opt_pass methods: */
487 virtual bool gate (function *) { return flag_ivopts != 0; }
488 virtual unsigned int execute (function *);
490 }; // class pass_iv_optimize
492 unsigned int
493 pass_iv_optimize::execute (function *fun)
495 if (number_of_loops (fun) <= 1)
496 return 0;
498 tree_ssa_iv_optimize ();
499 return 0;
502 } // anon namespace
504 gimple_opt_pass *
505 make_pass_iv_optimize (gcc::context *ctxt)
507 return new pass_iv_optimize (ctxt);
510 /* Loop optimizer finalization. */
512 static unsigned int
513 tree_ssa_loop_done (void)
515 free_numbers_of_iterations_estimates (cfun);
516 scev_finalize ();
517 loop_optimizer_finalize ();
518 return 0;
521 namespace {
523 const pass_data pass_data_tree_loop_done =
525 GIMPLE_PASS, /* type */
526 "loopdone", /* name */
527 OPTGROUP_LOOP, /* optinfo_flags */
528 TV_NONE, /* tv_id */
529 PROP_cfg, /* properties_required */
530 0, /* properties_provided */
531 0, /* properties_destroyed */
532 0, /* todo_flags_start */
533 TODO_cleanup_cfg, /* todo_flags_finish */
536 class pass_tree_loop_done : public gimple_opt_pass
538 public:
539 pass_tree_loop_done (gcc::context *ctxt)
540 : gimple_opt_pass (pass_data_tree_loop_done, ctxt)
543 /* opt_pass methods: */
544 virtual unsigned int execute (function *) { return tree_ssa_loop_done (); }
546 }; // class pass_tree_loop_done
548 } // anon namespace
550 gimple_opt_pass *
551 make_pass_tree_loop_done (gcc::context *ctxt)
553 return new pass_tree_loop_done (ctxt);
556 /* Calls CBCK for each index in memory reference ADDR_P. There are two
557 kinds situations handled; in each of these cases, the memory reference
558 and DATA are passed to the callback:
560 Access to an array: ARRAY_{RANGE_}REF (base, index). In this case we also
561 pass the pointer to the index to the callback.
563 Pointer dereference: INDIRECT_REF (addr). In this case we also pass the
564 pointer to addr to the callback.
566 If the callback returns false, the whole search stops and false is returned.
567 Otherwise the function returns true after traversing through the whole
568 reference *ADDR_P. */
570 bool
571 for_each_index (tree *addr_p, bool (*cbck) (tree, tree *, void *), void *data)
573 tree *nxt, *idx;
575 for (; ; addr_p = nxt)
577 switch (TREE_CODE (*addr_p))
579 case SSA_NAME:
580 return cbck (*addr_p, addr_p, data);
582 case MEM_REF:
583 nxt = &TREE_OPERAND (*addr_p, 0);
584 return cbck (*addr_p, nxt, data);
586 case BIT_FIELD_REF:
587 case VIEW_CONVERT_EXPR:
588 case REALPART_EXPR:
589 case IMAGPART_EXPR:
590 nxt = &TREE_OPERAND (*addr_p, 0);
591 break;
593 case COMPONENT_REF:
594 /* If the component has varying offset, it behaves like index
595 as well. */
596 idx = &TREE_OPERAND (*addr_p, 2);
597 if (*idx
598 && !cbck (*addr_p, idx, data))
599 return false;
601 nxt = &TREE_OPERAND (*addr_p, 0);
602 break;
604 case ARRAY_REF:
605 case ARRAY_RANGE_REF:
606 nxt = &TREE_OPERAND (*addr_p, 0);
607 if (!cbck (*addr_p, &TREE_OPERAND (*addr_p, 1), data))
608 return false;
609 break;
611 case VAR_DECL:
612 case PARM_DECL:
613 case CONST_DECL:
614 case STRING_CST:
615 case RESULT_DECL:
616 case VECTOR_CST:
617 case COMPLEX_CST:
618 case INTEGER_CST:
619 case REAL_CST:
620 case FIXED_CST:
621 case CONSTRUCTOR:
622 return true;
624 case ADDR_EXPR:
625 gcc_assert (is_gimple_min_invariant (*addr_p));
626 return true;
628 case TARGET_MEM_REF:
629 idx = &TMR_BASE (*addr_p);
630 if (*idx
631 && !cbck (*addr_p, idx, data))
632 return false;
633 idx = &TMR_INDEX (*addr_p);
634 if (*idx
635 && !cbck (*addr_p, idx, data))
636 return false;
637 idx = &TMR_INDEX2 (*addr_p);
638 if (*idx
639 && !cbck (*addr_p, idx, data))
640 return false;
641 return true;
643 default:
644 gcc_unreachable ();
/* The name and the length of the currently generated variable
   for lsm.  The buffer has room for MAX_LSM_NAME_LENGTH characters plus
   the terminating NUL.  */
#define MAX_LSM_NAME_LENGTH 40
static char lsm_tmp_name[MAX_LSM_NAME_LENGTH + 1];
static int lsm_tmp_name_length;

/* Adds S to lsm_tmp_name.  If the result would be longer than
   MAX_LSM_NAME_LENGTH, S is dropped as a whole (not truncated) and the
   buffer is left unchanged.  */

static void
lsm_tmp_name_add (const char *s)
{
  int new_length = lsm_tmp_name_length + strlen (s);

  if (new_length <= MAX_LSM_NAME_LENGTH)
    {
      strcpy (&lsm_tmp_name[lsm_tmp_name_length], s);
      lsm_tmp_name_length = new_length;
    }
}
669 /* Stores the name for temporary variable that replaces REF to
670 lsm_tmp_name. */
672 static void
673 gen_lsm_tmp_name (tree ref)
675 const char *name;
677 switch (TREE_CODE (ref))
679 case MEM_REF:
680 case TARGET_MEM_REF:
681 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
682 lsm_tmp_name_add ("_");
683 break;
685 case ADDR_EXPR:
686 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
687 break;
689 case BIT_FIELD_REF:
690 case VIEW_CONVERT_EXPR:
691 case ARRAY_RANGE_REF:
692 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
693 break;
695 case REALPART_EXPR:
696 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
697 lsm_tmp_name_add ("_RE");
698 break;
700 case IMAGPART_EXPR:
701 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
702 lsm_tmp_name_add ("_IM");
703 break;
705 case COMPONENT_REF:
706 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
707 lsm_tmp_name_add ("_");
708 name = get_name (TREE_OPERAND (ref, 1));
709 if (!name)
710 name = "F";
711 lsm_tmp_name_add (name);
712 break;
714 case ARRAY_REF:
715 gen_lsm_tmp_name (TREE_OPERAND (ref, 0));
716 lsm_tmp_name_add ("_I");
717 break;
719 case SSA_NAME:
720 case VAR_DECL:
721 case PARM_DECL:
722 case FUNCTION_DECL:
723 case LABEL_DECL:
724 name = get_name (ref);
725 if (!name)
726 name = "D";
727 lsm_tmp_name_add (name);
728 break;
730 case STRING_CST:
731 lsm_tmp_name_add ("S");
732 break;
734 case RESULT_DECL:
735 lsm_tmp_name_add ("R");
736 break;
738 case INTEGER_CST:
739 default:
740 /* Nothing. */
741 break;
745 /* Determines name for temporary variable that replaces REF.
746 The name is accumulated into the lsm_tmp_name variable.
747 N is added to the name of the temporary. */
749 char *
750 get_lsm_tmp_name (tree ref, unsigned n, const char *suffix)
752 char ns[2];
754 lsm_tmp_name_length = 0;
755 gen_lsm_tmp_name (ref);
756 lsm_tmp_name_add ("_lsm");
757 if (n < 10)
759 ns[0] = '0' + n;
760 ns[1] = 0;
761 lsm_tmp_name_add (ns);
763 return lsm_tmp_name;
764 if (suffix != NULL)
765 lsm_tmp_name_add (suffix);
768 /* Computes an estimated number of insns in LOOP, weighted by WEIGHTS. */
770 unsigned
771 tree_num_loop_insns (struct loop *loop, eni_weights *weights)
773 basic_block *body = get_loop_body (loop);
774 gimple_stmt_iterator gsi;
775 unsigned size = 0, i;
777 for (i = 0; i < loop->num_nodes; i++)
778 for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi); gsi_next (&gsi))
779 size += estimate_num_insns (gsi_stmt (gsi), weights);
780 free (body);
782 return size;