1 /* Conversion of SESE regions to Polyhedra.
2 Copyright (C) 2009-2014 Free Software Foundation, Inc.
3 Contributed by Sebastian Pop <sebastian.pop@amd.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
26 #include <isl/union_map.h>
27 #include <isl/constraint.h>
29 #include <cloog/cloog.h>
30 #include <cloog/cloog.h>
31 #include <cloog/isl/domain.h>
35 #include "coretypes.h"
37 #include "basic-block.h"
38 #include "tree-ssa-alias.h"
39 #include "internal-fn.h"
40 #include "gimple-expr.h"
43 #include "gimple-iterator.h"
45 #include "gimplify-me.h"
46 #include "gimple-ssa.h"
48 #include "tree-phinodes.h"
49 #include "ssa-iterators.h"
50 #include "stringpool.h"
51 #include "tree-ssanames.h"
52 #include "tree-ssa-loop-manip.h"
53 #include "tree-ssa-loop-niter.h"
54 #include "tree-ssa-loop.h"
55 #include "tree-into-ssa.h"
56 #include "tree-pass.h"
58 #include "tree-chrec.h"
59 #include "tree-data-ref.h"
60 #include "tree-scalar-evolution.h"
63 #include "tree-ssa-propagate.h"
67 #include "graphite-poly.h"
68 #include "graphite-sese-to-poly.h"
71 /* Assigns to RES the value of the INTEGER_CST T. */
74 tree_int_to_gmp (tree t
, mpz_t res
)
76 double_int di
= tree_to_double_int (t
);
77 mpz_set_double_int (res
, di
, TYPE_UNSIGNED (TREE_TYPE (t
)));
80 /* Returns the index of the PHI argument defined in the outermost
84 phi_arg_in_outermost_loop (gimple phi
)
86 loop_p loop
= gimple_bb (phi
)->loop_father
;
89 for (i
= 0; i
< gimple_phi_num_args (phi
); i
++)
90 if (!flow_bb_inside_loop_p (loop
, gimple_phi_arg_edge (phi
, i
)->src
))
92 loop
= gimple_phi_arg_edge (phi
, i
)->src
->loop_father
;
99 /* Removes a simple copy phi node "RES = phi (INIT, RES)" at position
100 PSI by inserting on the loop ENTRY edge assignment "RES = INIT". */
103 remove_simple_copy_phi (gimple_stmt_iterator
*psi
)
105 gimple phi
= gsi_stmt (*psi
);
106 tree res
= gimple_phi_result (phi
);
107 size_t entry
= phi_arg_in_outermost_loop (phi
);
108 tree init
= gimple_phi_arg_def (phi
, entry
);
109 gimple stmt
= gimple_build_assign (res
, init
);
110 edge e
= gimple_phi_arg_edge (phi
, entry
);
112 remove_phi_node (psi
, false);
113 gsi_insert_on_edge_immediate (e
, stmt
);
116 /* Removes an invariant phi node at position PSI by inserting on the
117 loop ENTRY edge the assignment RES = INIT. */
120 remove_invariant_phi (sese region
, gimple_stmt_iterator
*psi
)
122 gimple phi
= gsi_stmt (*psi
);
123 loop_p loop
= loop_containing_stmt (phi
);
124 tree res
= gimple_phi_result (phi
);
125 tree scev
= scalar_evolution_in_region (region
, loop
, res
);
126 size_t entry
= phi_arg_in_outermost_loop (phi
);
127 edge e
= gimple_phi_arg_edge (phi
, entry
);
130 gimple_seq stmts
= NULL
;
132 if (tree_contains_chrecs (scev
, NULL
))
133 scev
= gimple_phi_arg_def (phi
, entry
);
135 var
= force_gimple_operand (scev
, &stmts
, true, NULL_TREE
);
136 stmt
= gimple_build_assign (res
, var
);
137 remove_phi_node (psi
, false);
139 gimple_seq_add_stmt (&stmts
, stmt
);
140 gsi_insert_seq_on_edge (e
, stmts
);
141 gsi_commit_edge_inserts ();
142 SSA_NAME_DEF_STMT (res
) = stmt
;
145 /* Returns true when the phi node at PSI is of the form "a = phi (a, x)". */
148 simple_copy_phi_p (gimple phi
)
152 if (gimple_phi_num_args (phi
) != 2)
155 res
= gimple_phi_result (phi
);
156 return (res
== gimple_phi_arg_def (phi
, 0)
157 || res
== gimple_phi_arg_def (phi
, 1));
160 /* Returns true when the phi node at position PSI is a reduction phi
161 node in REGION. Otherwise moves the pointer PSI to the next phi to
165 reduction_phi_p (sese region
, gimple_stmt_iterator
*psi
)
168 gimple phi
= gsi_stmt (*psi
);
169 tree res
= gimple_phi_result (phi
);
171 loop
= loop_containing_stmt (phi
);
173 if (simple_copy_phi_p (phi
))
175 /* PRE introduces phi nodes like these, for an example,
176 see id-5.f in the fortran graphite testsuite:
178 # prephitmp.85_265 = PHI <prephitmp.85_258(33), prephitmp.85_265(18)>
180 remove_simple_copy_phi (psi
);
184 if (scev_analyzable_p (res
, region
))
186 tree scev
= scalar_evolution_in_region (region
, loop
, res
);
188 if (evolution_function_is_invariant_p (scev
, loop
->num
))
189 remove_invariant_phi (region
, psi
);
196 /* All the other cases are considered reductions. */
200 /* Store the GRAPHITE representation of BB. */
203 new_gimple_bb (basic_block bb
, vec
<data_reference_p
> drs
)
205 struct gimple_bb
*gbb
;
207 gbb
= XNEW (struct gimple_bb
);
210 GBB_DATA_REFS (gbb
) = drs
;
211 GBB_CONDITIONS (gbb
).create (0);
212 GBB_CONDITION_CASES (gbb
).create (0);
218 free_data_refs_aux (vec
<data_reference_p
> datarefs
)
221 struct data_reference
*dr
;
223 FOR_EACH_VEC_ELT (datarefs
, i
, dr
)
226 base_alias_pair
*bap
= (base_alias_pair
*)(dr
->aux
);
228 free (bap
->alias_set
);
237 free_gimple_bb (struct gimple_bb
*gbb
)
239 free_data_refs_aux (GBB_DATA_REFS (gbb
));
240 free_data_refs (GBB_DATA_REFS (gbb
));
242 GBB_CONDITIONS (gbb
).release ();
243 GBB_CONDITION_CASES (gbb
).release ();
244 GBB_BB (gbb
)->aux
= 0;
248 /* Deletes all gimple bbs in SCOP. */
251 remove_gbbs_in_scop (scop_p scop
)
256 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
257 free_gimple_bb (PBB_BLACK_BOX (pbb
));
260 /* Deletes all scops in SCOPS. */
263 free_scops (vec
<scop_p
> scops
)
268 FOR_EACH_VEC_ELT (scops
, i
, scop
)
270 remove_gbbs_in_scop (scop
);
271 free_sese (SCOP_REGION (scop
));
278 /* Same as outermost_loop_in_sese, returns the outermost loop
279 containing BB in REGION, but makes sure that the returned loop
280 belongs to the REGION, and so this returns the first loop in the
281 REGION when the loop containing BB does not belong to REGION. */
284 outermost_loop_in_sese_1 (sese region
, basic_block bb
)
286 loop_p nest
= outermost_loop_in_sese (region
, bb
);
288 if (loop_in_sese_p (nest
, region
))
291 /* When the basic block BB does not belong to a loop in the region,
292 return the first loop in the region. */
295 if (loop_in_sese_p (nest
, region
))
304 /* Generates a polyhedral black box only if the bb contains interesting
308 try_generate_gimple_bb (scop_p scop
, basic_block bb
)
310 vec
<data_reference_p
> drs
;
312 sese region
= SCOP_REGION (scop
);
313 loop_p nest
= outermost_loop_in_sese_1 (region
, bb
);
314 gimple_stmt_iterator gsi
;
316 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
318 gimple stmt
= gsi_stmt (gsi
);
321 if (is_gimple_debug (stmt
))
324 loop
= loop_containing_stmt (stmt
);
325 if (!loop_in_sese_p (loop
, region
))
328 graphite_find_data_references_in_stmt (nest
, loop
, stmt
, &drs
);
331 return new_gimple_bb (bb
, drs
);
334 /* Returns true if all predecessors of BB, that are not dominated by BB, are
335 marked in MAP. The predecessors dominated by BB are loop latches and will
336 be handled after BB. */
339 all_non_dominated_preds_marked_p (basic_block bb
, sbitmap map
)
344 FOR_EACH_EDGE (e
, ei
, bb
->preds
)
345 if (!bitmap_bit_p (map
, e
->src
->index
)
346 && !dominated_by_p (CDI_DOMINATORS
, e
->src
, bb
))
352 /* Compare the depth of two basic_block's P1 and P2. */
355 compare_bb_depths (const void *p1
, const void *p2
)
357 const_basic_block
const bb1
= *(const_basic_block
const*)p1
;
358 const_basic_block
const bb2
= *(const_basic_block
const*)p2
;
359 int d1
= loop_depth (bb1
->loop_father
);
360 int d2
= loop_depth (bb2
->loop_father
);
371 /* Sort the basic blocks from DOM such that the first are the ones at
372 a deepest loop level. */
375 graphite_sort_dominated_info (vec
<basic_block
> dom
)
377 dom
.qsort (compare_bb_depths
);
380 /* Recursive helper function for build_scops_bbs. */
383 build_scop_bbs_1 (scop_p scop
, sbitmap visited
, basic_block bb
)
385 sese region
= SCOP_REGION (scop
);
386 vec
<basic_block
> dom
;
389 if (bitmap_bit_p (visited
, bb
->index
)
390 || !bb_in_sese_p (bb
, region
))
393 pbb
= new_poly_bb (scop
, try_generate_gimple_bb (scop
, bb
));
394 SCOP_BBS (scop
).safe_push (pbb
);
395 bitmap_set_bit (visited
, bb
->index
);
397 dom
= get_dominated_by (CDI_DOMINATORS
, bb
);
402 graphite_sort_dominated_info (dom
);
404 while (!dom
.is_empty ())
409 FOR_EACH_VEC_ELT (dom
, i
, dom_bb
)
410 if (all_non_dominated_preds_marked_p (dom_bb
, visited
))
412 build_scop_bbs_1 (scop
, visited
, dom_bb
);
413 dom
.unordered_remove (i
);
421 /* Gather the basic blocks belonging to the SCOP. */
424 build_scop_bbs (scop_p scop
)
426 sbitmap visited
= sbitmap_alloc (last_basic_block_for_fn (cfun
));
427 sese region
= SCOP_REGION (scop
);
429 bitmap_clear (visited
);
430 build_scop_bbs_1 (scop
, visited
, SESE_ENTRY_BB (region
));
431 sbitmap_free (visited
);
434 /* Return an ISL identifier for the polyhedral basic block PBB. */
437 isl_id_for_pbb (scop_p s
, poly_bb_p pbb
)
440 snprintf (name
, sizeof (name
), "S_%d", pbb_index (pbb
));
441 return isl_id_alloc (s
->ctx
, name
, pbb
);
444 /* Converts the STATIC_SCHEDULE of PBB into a scattering polyhedron.
445 We generate SCATTERING_DIMENSIONS scattering dimensions.
447 CLooG 0.15.0 and previous versions require, that all
448 scattering functions of one CloogProgram have the same number of
449 scattering dimensions, therefore we allow to specify it. This
450 should be removed in future versions of CLooG.
452 The scattering polyhedron consists of these dimensions: scattering,
453 loop_iterators, parameters.
457 | scattering_dimensions = 5
458 | used_scattering_dimensions = 3
466 | Scattering polyhedron:
468 | scattering: {s1, s2, s3, s4, s5}
469 | loop_iterators: {i}
470 | parameters: {p1, p2}
472 | s1 s2 s3 s4 s5 i p1 p2 1
473 | 1 0 0 0 0 0 0 0 -4 = 0
474 | 0 1 0 0 0 -1 0 0 0 = 0
475 | 0 0 1 0 0 0 0 0 -5 = 0 */
478 build_pbb_scattering_polyhedrons (isl_aff
*static_sched
,
479 poly_bb_p pbb
, int scattering_dimensions
)
482 int nb_iterators
= pbb_dim_iter_domain (pbb
);
483 int used_scattering_dimensions
= nb_iterators
* 2 + 1;
487 gcc_assert (scattering_dimensions
>= used_scattering_dimensions
);
491 dc
= isl_set_get_space (pbb
->domain
);
492 dm
= isl_space_add_dims (isl_space_from_domain (dc
),
493 isl_dim_out
, scattering_dimensions
);
494 pbb
->schedule
= isl_map_universe (dm
);
496 for (i
= 0; i
< scattering_dimensions
; i
++)
498 /* Textual order inside this loop. */
501 isl_constraint
*c
= isl_equality_alloc
502 (isl_local_space_from_space (isl_map_get_space (pbb
->schedule
)));
504 if (0 != isl_aff_get_coefficient (static_sched
, isl_dim_in
,
508 isl_int_neg (val
, val
);
509 c
= isl_constraint_set_constant (c
, val
);
510 c
= isl_constraint_set_coefficient_si (c
, isl_dim_out
, i
, 1);
511 pbb
->schedule
= isl_map_add_constraint (pbb
->schedule
, c
);
514 /* Iterations of this loop. */
515 else /* if ((i % 2) == 1) */
517 int loop
= (i
- 1) / 2;
518 pbb
->schedule
= isl_map_equate (pbb
->schedule
, isl_dim_in
, loop
,
525 pbb
->transformed
= isl_map_copy (pbb
->schedule
);
528 /* Build for BB the static schedule.
530 The static schedule is a Dewey numbering of the abstract syntax
531 tree: http://en.wikipedia.org/wiki/Dewey_Decimal_Classification
533 The following example informally defines the static schedule:
552 Static schedules for A to F:
565 build_scop_scattering (scop_p scop
)
569 gimple_bb_p previous_gbb
= NULL
;
570 isl_space
*dc
= isl_set_get_space (scop
->context
);
571 isl_aff
*static_sched
;
573 dc
= isl_space_add_dims (dc
, isl_dim_set
, number_of_loops (cfun
));
574 static_sched
= isl_aff_zero_on_domain (isl_local_space_from_space (dc
));
576 /* We have to start schedules at 0 on the first component and
577 because we cannot compare_prefix_loops against a previous loop,
578 prefix will be equal to zero, and that index will be
579 incremented before copying. */
580 static_sched
= isl_aff_add_coefficient_si (static_sched
, isl_dim_in
, 0, -1);
582 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
584 gimple_bb_p gbb
= PBB_BLACK_BOX (pbb
);
586 int nb_scat_dims
= pbb_dim_iter_domain (pbb
) * 2 + 1;
589 prefix
= nb_common_loops (SCOP_REGION (scop
), previous_gbb
, gbb
);
595 static_sched
= isl_aff_add_coefficient_si (static_sched
, isl_dim_in
,
597 build_pbb_scattering_polyhedrons (static_sched
, pbb
, nb_scat_dims
);
600 isl_aff_free (static_sched
);
603 static isl_pw_aff
*extract_affine (scop_p
, tree
, __isl_take isl_space
*space
);
605 /* Extract an affine expression from the chain of recurrence E. */
608 extract_affine_chrec (scop_p s
, tree e
, __isl_take isl_space
*space
)
610 isl_pw_aff
*lhs
= extract_affine (s
, CHREC_LEFT (e
), isl_space_copy (space
));
611 isl_pw_aff
*rhs
= extract_affine (s
, CHREC_RIGHT (e
), isl_space_copy (space
));
612 isl_local_space
*ls
= isl_local_space_from_space (space
);
613 unsigned pos
= sese_loop_depth ((sese
) s
->region
, get_chrec_loop (e
)) - 1;
614 isl_aff
*loop
= isl_aff_set_coefficient_si
615 (isl_aff_zero_on_domain (ls
), isl_dim_in
, pos
, 1);
616 isl_pw_aff
*l
= isl_pw_aff_from_aff (loop
);
618 /* Before multiplying, make sure that the result is affine. */
619 gcc_assert (isl_pw_aff_is_cst (rhs
)
620 || isl_pw_aff_is_cst (l
));
622 return isl_pw_aff_add (lhs
, isl_pw_aff_mul (rhs
, l
));
625 /* Extract an affine expression from the mult_expr E. */
628 extract_affine_mul (scop_p s
, tree e
, __isl_take isl_space
*space
)
630 isl_pw_aff
*lhs
= extract_affine (s
, TREE_OPERAND (e
, 0),
631 isl_space_copy (space
));
632 isl_pw_aff
*rhs
= extract_affine (s
, TREE_OPERAND (e
, 1), space
);
634 if (!isl_pw_aff_is_cst (lhs
)
635 && !isl_pw_aff_is_cst (rhs
))
637 isl_pw_aff_free (lhs
);
638 isl_pw_aff_free (rhs
);
642 return isl_pw_aff_mul (lhs
, rhs
);
645 /* Return an ISL identifier from the name of the ssa_name E. */
648 isl_id_for_ssa_name (scop_p s
, tree e
)
650 const char *name
= get_name (e
);
654 id
= isl_id_alloc (s
->ctx
, name
, e
);
658 snprintf (name1
, sizeof (name1
), "P_%d", SSA_NAME_VERSION (e
));
659 id
= isl_id_alloc (s
->ctx
, name1
, e
);
665 /* Return an ISL identifier for the data reference DR. */
668 isl_id_for_dr (scop_p s
, data_reference_p dr ATTRIBUTE_UNUSED
)
670 /* Data references all get the same isl_id. They need to be comparable
671 and are distinguished through the first dimension, which contains the
673 return isl_id_alloc (s
->ctx
, "", 0);
676 /* Extract an affine expression from the ssa_name E. */
679 extract_affine_name (scop_p s
, tree e
, __isl_take isl_space
*space
)
686 id
= isl_id_for_ssa_name (s
, e
);
687 dimension
= isl_space_find_dim_by_id (space
, isl_dim_param
, id
);
689 dom
= isl_set_universe (isl_space_copy (space
));
690 aff
= isl_aff_zero_on_domain (isl_local_space_from_space (space
));
691 aff
= isl_aff_add_coefficient_si (aff
, isl_dim_param
, dimension
, 1);
692 return isl_pw_aff_alloc (dom
, aff
);
695 /* Extract an affine expression from the gmp constant G. */
698 extract_affine_gmp (mpz_t g
, __isl_take isl_space
*space
)
700 isl_local_space
*ls
= isl_local_space_from_space (isl_space_copy (space
));
701 isl_aff
*aff
= isl_aff_zero_on_domain (ls
);
702 isl_set
*dom
= isl_set_universe (space
);
706 isl_int_set_gmp (v
, g
);
707 aff
= isl_aff_add_constant (aff
, v
);
710 return isl_pw_aff_alloc (dom
, aff
);
713 /* Extract an affine expression from the integer_cst E. */
716 extract_affine_int (tree e
, __isl_take isl_space
*space
)
722 tree_int_to_gmp (e
, g
);
723 res
= extract_affine_gmp (g
, space
);
729 /* Compute pwaff mod 2^width. */
732 wrap (isl_pw_aff
*pwaff
, unsigned width
)
737 isl_int_set_si (mod
, 1);
738 isl_int_mul_2exp (mod
, mod
, width
);
740 pwaff
= isl_pw_aff_mod (pwaff
, mod
);
747 /* When parameter NAME is in REGION, returns its index in SESE_PARAMS.
748 Otherwise returns -1. */
751 parameter_index_in_region_1 (tree name
, sese region
)
756 gcc_assert (TREE_CODE (name
) == SSA_NAME
);
758 FOR_EACH_VEC_ELT (SESE_PARAMS (region
), i
, p
)
765 /* When the parameter NAME is in REGION, returns its index in
766 SESE_PARAMS. Otherwise this function inserts NAME in SESE_PARAMS
767 and returns the index of NAME. */
770 parameter_index_in_region (tree name
, sese region
)
774 gcc_assert (TREE_CODE (name
) == SSA_NAME
);
776 i
= parameter_index_in_region_1 (name
, region
);
780 gcc_assert (SESE_ADD_PARAMS (region
));
782 i
= SESE_PARAMS (region
).length ();
783 SESE_PARAMS (region
).safe_push (name
);
787 /* Extract an affine expression from the tree E in the scop S. */
790 extract_affine (scop_p s
, tree e
, __isl_take isl_space
*space
)
792 isl_pw_aff
*lhs
, *rhs
, *res
;
795 if (e
== chrec_dont_know
) {
796 isl_space_free (space
);
800 switch (TREE_CODE (e
))
802 case POLYNOMIAL_CHREC
:
803 res
= extract_affine_chrec (s
, e
, space
);
807 res
= extract_affine_mul (s
, e
, space
);
811 case POINTER_PLUS_EXPR
:
812 lhs
= extract_affine (s
, TREE_OPERAND (e
, 0), isl_space_copy (space
));
813 rhs
= extract_affine (s
, TREE_OPERAND (e
, 1), space
);
814 res
= isl_pw_aff_add (lhs
, rhs
);
818 lhs
= extract_affine (s
, TREE_OPERAND (e
, 0), isl_space_copy (space
));
819 rhs
= extract_affine (s
, TREE_OPERAND (e
, 1), space
);
820 res
= isl_pw_aff_sub (lhs
, rhs
);
825 lhs
= extract_affine (s
, TREE_OPERAND (e
, 0), isl_space_copy (space
));
826 rhs
= extract_affine (s
, integer_minus_one_node
, space
);
827 res
= isl_pw_aff_mul (lhs
, rhs
);
831 gcc_assert (-1 != parameter_index_in_region_1 (e
, SCOP_REGION (s
)));
832 res
= extract_affine_name (s
, e
, space
);
836 res
= extract_affine_int (e
, space
);
837 /* No need to wrap a single integer. */
841 case NON_LVALUE_EXPR
:
842 res
= extract_affine (s
, TREE_OPERAND (e
, 0), space
);
850 type
= TREE_TYPE (e
);
851 if (TYPE_UNSIGNED (type
))
852 res
= wrap (res
, TYPE_PRECISION (type
));
857 /* In the context of sese S, scan the expression E and translate it to
858 a linear expression C. When parsing a symbolic multiplication, K
859 represents the constant multiplier of an expression containing
863 scan_tree_for_params (sese s
, tree e
)
865 if (e
== chrec_dont_know
)
868 switch (TREE_CODE (e
))
870 case POLYNOMIAL_CHREC
:
871 scan_tree_for_params (s
, CHREC_LEFT (e
));
875 if (chrec_contains_symbols (TREE_OPERAND (e
, 0)))
876 scan_tree_for_params (s
, TREE_OPERAND (e
, 0));
878 scan_tree_for_params (s
, TREE_OPERAND (e
, 1));
882 case POINTER_PLUS_EXPR
:
884 scan_tree_for_params (s
, TREE_OPERAND (e
, 0));
885 scan_tree_for_params (s
, TREE_OPERAND (e
, 1));
891 case NON_LVALUE_EXPR
:
892 scan_tree_for_params (s
, TREE_OPERAND (e
, 0));
896 parameter_index_in_region (e
, s
);
909 /* Find parameters with respect to REGION in BB. We are looking in memory
910 access functions, conditions and loop bounds. */
913 find_params_in_bb (sese region
, gimple_bb_p gbb
)
919 loop_p loop
= GBB_BB (gbb
)->loop_father
;
921 /* Find parameters in the access functions of data references. */
922 FOR_EACH_VEC_ELT (GBB_DATA_REFS (gbb
), i
, dr
)
923 for (j
= 0; j
< DR_NUM_DIMENSIONS (dr
); j
++)
924 scan_tree_for_params (region
, DR_ACCESS_FN (dr
, j
));
926 /* Find parameters in conditional statements. */
927 FOR_EACH_VEC_ELT (GBB_CONDITIONS (gbb
), i
, stmt
)
929 tree lhs
= scalar_evolution_in_region (region
, loop
,
930 gimple_cond_lhs (stmt
));
931 tree rhs
= scalar_evolution_in_region (region
, loop
,
932 gimple_cond_rhs (stmt
));
934 scan_tree_for_params (region
, lhs
);
935 scan_tree_for_params (region
, rhs
);
939 /* Record the parameters used in the SCOP. A variable is a parameter
940 in a scop if it does not vary during the execution of that scop. */
943 find_scop_parameters (scop_p scop
)
947 sese region
= SCOP_REGION (scop
);
951 /* Find the parameters used in the loop bounds. */
952 FOR_EACH_VEC_ELT (SESE_LOOP_NEST (region
), i
, loop
)
954 tree nb_iters
= number_of_latch_executions (loop
);
956 if (!chrec_contains_symbols (nb_iters
))
959 nb_iters
= scalar_evolution_in_region (region
, loop
, nb_iters
);
960 scan_tree_for_params (region
, nb_iters
);
963 /* Find the parameters used in data accesses. */
964 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
965 find_params_in_bb (region
, PBB_BLACK_BOX (pbb
));
967 nbp
= sese_nb_params (region
);
968 scop_set_nb_params (scop
, nbp
);
969 SESE_ADD_PARAMS (region
) = false;
973 isl_space
*space
= isl_space_set_alloc (scop
->ctx
, nbp
, 0);
975 FOR_EACH_VEC_ELT (SESE_PARAMS (region
), i
, e
)
976 space
= isl_space_set_dim_id (space
, isl_dim_param
, i
,
977 isl_id_for_ssa_name (scop
, e
));
979 scop
->context
= isl_set_universe (space
);
983 /* Builds the constraint polyhedra for LOOP in SCOP. OUTER_PH gives
984 the constraints for the surrounding loops. */
987 build_loop_iteration_domains (scop_p scop
, struct loop
*loop
,
989 isl_set
*outer
, isl_set
**doms
)
991 tree nb_iters
= number_of_latch_executions (loop
);
992 sese region
= SCOP_REGION (scop
);
994 isl_set
*inner
= isl_set_copy (outer
);
997 int pos
= isl_set_dim (outer
, isl_dim_set
);
1004 inner
= isl_set_add_dims (inner
, isl_dim_set
, 1);
1005 space
= isl_set_get_space (inner
);
1008 c
= isl_inequality_alloc
1009 (isl_local_space_from_space (isl_space_copy (space
)));
1010 c
= isl_constraint_set_coefficient_si (c
, isl_dim_set
, pos
, 1);
1011 inner
= isl_set_add_constraint (inner
, c
);
1013 /* loop_i <= cst_nb_iters */
1014 if (TREE_CODE (nb_iters
) == INTEGER_CST
)
1016 c
= isl_inequality_alloc
1017 (isl_local_space_from_space (isl_space_copy (space
)));
1018 c
= isl_constraint_set_coefficient_si (c
, isl_dim_set
, pos
, -1);
1019 tree_int_to_gmp (nb_iters
, g
);
1020 isl_int_set_gmp (v
, g
);
1021 c
= isl_constraint_set_constant (c
, v
);
1022 inner
= isl_set_add_constraint (inner
, c
);
1025 /* loop_i <= expr_nb_iters */
1026 else if (!chrec_contains_undetermined (nb_iters
))
1031 isl_local_space
*ls
;
1035 nb_iters
= scalar_evolution_in_region (region
, loop
, nb_iters
);
1037 aff
= extract_affine (scop
, nb_iters
, isl_set_get_space (inner
));
1038 valid
= isl_pw_aff_nonneg_set (isl_pw_aff_copy (aff
));
1039 valid
= isl_set_project_out (valid
, isl_dim_set
, 0,
1040 isl_set_dim (valid
, isl_dim_set
));
1041 scop
->context
= isl_set_intersect (scop
->context
, valid
);
1043 ls
= isl_local_space_from_space (isl_space_copy (space
));
1044 al
= isl_aff_set_coefficient_si (isl_aff_zero_on_domain (ls
),
1045 isl_dim_in
, pos
, 1);
1046 le
= isl_pw_aff_le_set (isl_pw_aff_from_aff (al
),
1047 isl_pw_aff_copy (aff
));
1048 inner
= isl_set_intersect (inner
, le
);
1050 if (max_stmt_executions (loop
, &nit
))
1052 /* Insert in the context the constraints from the
1053 estimation of the number of iterations NIT and the
1054 symbolic number of iterations (involving parameter
1055 names) NB_ITERS. First, build the affine expression
1056 "NIT - NB_ITERS" and then say that it is positive,
1057 i.e., NIT approximates NB_ITERS: "NIT >= NB_ITERS". */
1064 mpz_set_double_int (g
, nit
, false);
1065 mpz_sub_ui (g
, g
, 1);
1066 approx
= extract_affine_gmp (g
, isl_set_get_space (inner
));
1067 x
= isl_pw_aff_ge_set (approx
, aff
);
1068 x
= isl_set_project_out (x
, isl_dim_set
, 0,
1069 isl_set_dim (x
, isl_dim_set
));
1070 scop
->context
= isl_set_intersect (scop
->context
, x
);
1072 c
= isl_inequality_alloc
1073 (isl_local_space_from_space (isl_space_copy (space
)));
1074 c
= isl_constraint_set_coefficient_si (c
, isl_dim_set
, pos
, -1);
1075 isl_int_set_gmp (v
, g
);
1077 c
= isl_constraint_set_constant (c
, v
);
1078 inner
= isl_set_add_constraint (inner
, c
);
1081 isl_pw_aff_free (aff
);
1086 if (loop
->inner
&& loop_in_sese_p (loop
->inner
, region
))
1087 build_loop_iteration_domains (scop
, loop
->inner
, nb
+ 1,
1088 isl_set_copy (inner
), doms
);
1092 && loop_in_sese_p (loop
->next
, region
))
1093 build_loop_iteration_domains (scop
, loop
->next
, nb
,
1094 isl_set_copy (outer
), doms
);
1096 doms
[loop
->num
] = inner
;
1098 isl_set_free (outer
);
1099 isl_space_free (space
);
1104 /* Returns a linear expression for tree T evaluated in PBB. */
1107 create_pw_aff_from_tree (poly_bb_p pbb
, tree t
)
1109 scop_p scop
= PBB_SCOP (pbb
);
1111 t
= scalar_evolution_in_region (SCOP_REGION (scop
), pbb_loop (pbb
), t
);
1112 gcc_assert (!automatically_generated_chrec_p (t
));
1114 return extract_affine (scop
, t
, isl_set_get_space (pbb
->domain
));
1117 /* Add conditional statement STMT to pbb. CODE is used as the comparison
1118 operator. This allows us to invert the condition or to handle
1122 add_condition_to_pbb (poly_bb_p pbb
, gimple stmt
, enum tree_code code
)
1124 isl_pw_aff
*lhs
= create_pw_aff_from_tree (pbb
, gimple_cond_lhs (stmt
));
1125 isl_pw_aff
*rhs
= create_pw_aff_from_tree (pbb
, gimple_cond_rhs (stmt
));
1131 cond
= isl_pw_aff_lt_set (lhs
, rhs
);
1135 cond
= isl_pw_aff_gt_set (lhs
, rhs
);
1139 cond
= isl_pw_aff_le_set (lhs
, rhs
);
1143 cond
= isl_pw_aff_ge_set (lhs
, rhs
);
1147 cond
= isl_pw_aff_eq_set (lhs
, rhs
);
1151 cond
= isl_pw_aff_ne_set (lhs
, rhs
);
1155 isl_pw_aff_free (lhs
);
1156 isl_pw_aff_free (rhs
);
1160 cond
= isl_set_coalesce (cond
);
1161 cond
= isl_set_set_tuple_id (cond
, isl_set_get_tuple_id (pbb
->domain
));
1162 pbb
->domain
= isl_set_intersect (pbb
->domain
, cond
);
1165 /* Add conditions to the domain of PBB. */
1168 add_conditions_to_domain (poly_bb_p pbb
)
1172 gimple_bb_p gbb
= PBB_BLACK_BOX (pbb
);
1174 if (GBB_CONDITIONS (gbb
).is_empty ())
1177 FOR_EACH_VEC_ELT (GBB_CONDITIONS (gbb
), i
, stmt
)
1178 switch (gimple_code (stmt
))
1182 enum tree_code code
= gimple_cond_code (stmt
);
1184 /* The conditions for ELSE-branches are inverted. */
1185 if (!GBB_CONDITION_CASES (gbb
)[i
])
1186 code
= invert_tree_comparison (code
, false);
1188 add_condition_to_pbb (pbb
, stmt
, code
);
1193 /* Switch statements are not supported right now - fall through. */
1201 /* Traverses all the GBBs of the SCOP and add their constraints to the
1202 iteration domains. */
1205 add_conditions_to_constraints (scop_p scop
)
1210 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
1211 add_conditions_to_domain (pbb
);
1214 /* Returns a COND_EXPR statement when BB has a single predecessor, the
1215 edge between BB and its predecessor is not a loop exit edge, and
1216 the last statement of the single predecessor is a COND_EXPR. */
1219 single_pred_cond_non_loop_exit (basic_block bb
)
1221 if (single_pred_p (bb
))
1223 edge e
= single_pred_edge (bb
);
1224 basic_block pred
= e
->src
;
1227 if (loop_depth (pred
->loop_father
) > loop_depth (bb
->loop_father
))
1230 stmt
= last_stmt (pred
);
1232 if (stmt
&& gimple_code (stmt
) == GIMPLE_COND
)
1239 class sese_dom_walker
: public dom_walker
1242 sese_dom_walker (cdi_direction
, sese
);
1244 virtual void before_dom_children (basic_block
);
1245 virtual void after_dom_children (basic_block
);
1248 auto_vec
<gimple
, 3> m_conditions
, m_cases
;
1252 sese_dom_walker::sese_dom_walker (cdi_direction direction
, sese region
)
1253 : dom_walker (direction
), m_region (region
)
1257 /* Call-back for dom_walk executed before visiting the dominated
1261 sese_dom_walker::before_dom_children (basic_block bb
)
1266 if (!bb_in_sese_p (bb
, m_region
))
1269 stmt
= single_pred_cond_non_loop_exit (bb
);
1273 edge e
= single_pred_edge (bb
);
1275 m_conditions
.safe_push (stmt
);
1277 if (e
->flags
& EDGE_TRUE_VALUE
)
1278 m_cases
.safe_push (stmt
);
1280 m_cases
.safe_push (NULL
);
1283 gbb
= gbb_from_bb (bb
);
1287 GBB_CONDITIONS (gbb
) = m_conditions
.copy ();
1288 GBB_CONDITION_CASES (gbb
) = m_cases
.copy ();
1292 /* Call-back for dom_walk executed after visiting the dominated
1296 sese_dom_walker::after_dom_children (basic_block bb
)
1298 if (!bb_in_sese_p (bb
, m_region
))
1301 if (single_pred_cond_non_loop_exit (bb
))
1303 m_conditions
.pop ();
1308 /* Add constraints on the possible values of parameter P from the type
1312 add_param_constraints (scop_p scop
, graphite_dim_t p
)
1314 tree parameter
= SESE_PARAMS (SCOP_REGION (scop
))[p
];
1315 tree type
= TREE_TYPE (parameter
);
1316 tree lb
= NULL_TREE
;
1317 tree ub
= NULL_TREE
;
1319 if (POINTER_TYPE_P (type
) || !TYPE_MIN_VALUE (type
))
1320 lb
= lower_bound_in_type (type
, type
);
1322 lb
= TYPE_MIN_VALUE (type
);
1324 if (POINTER_TYPE_P (type
) || !TYPE_MAX_VALUE (type
))
1325 ub
= upper_bound_in_type (type
, type
);
1327 ub
= TYPE_MAX_VALUE (type
);
1331 isl_space
*space
= isl_set_get_space (scop
->context
);
1336 c
= isl_inequality_alloc (isl_local_space_from_space (space
));
1339 tree_int_to_gmp (lb
, g
);
1340 isl_int_set_gmp (v
, g
);
1343 c
= isl_constraint_set_constant (c
, v
);
1345 c
= isl_constraint_set_coefficient_si (c
, isl_dim_param
, p
, 1);
1347 scop
->context
= isl_set_add_constraint (scop
->context
, c
);
1352 isl_space
*space
= isl_set_get_space (scop
->context
);
1357 c
= isl_inequality_alloc (isl_local_space_from_space (space
));
1361 tree_int_to_gmp (ub
, g
);
1362 isl_int_set_gmp (v
, g
);
1364 c
= isl_constraint_set_constant (c
, v
);
1366 c
= isl_constraint_set_coefficient_si (c
, isl_dim_param
, p
, -1);
1368 scop
->context
= isl_set_add_constraint (scop
->context
, c
);
1372 /* Build the context of the SCOP. The context usually contains extra
1373 constraints that are added to the iteration domains that constrain
1377 build_scop_context (scop_p scop
)
1379 graphite_dim_t p
, n
= scop_nb_params (scop
);
1381 for (p
= 0; p
< n
; p
++)
1382 add_param_constraints (scop
, p
);
1385 /* Build the iteration domains: the loops belonging to the current
1386 SCOP, and that vary for the execution of the current basic block.
1387 Returns false if there is no loop in SCOP. */
1390 build_scop_iteration_domain (scop_p scop
)
1393 sese region
= SCOP_REGION (scop
);
1396 int nb_loops
= number_of_loops (cfun
);
1397 isl_set
**doms
= XCNEWVEC (isl_set
*, nb_loops
);
1399 FOR_EACH_VEC_ELT (SESE_LOOP_NEST (region
), i
, loop
)
1400 if (!loop_in_sese_p (loop_outer (loop
), region
))
1401 build_loop_iteration_domains (scop
, loop
, 0,
1402 isl_set_copy (scop
->context
), doms
);
1404 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
1406 loop
= pbb_loop (pbb
);
1408 if (doms
[loop
->num
])
1409 pbb
->domain
= isl_set_copy (doms
[loop
->num
]);
1411 pbb
->domain
= isl_set_copy (scop
->context
);
1413 pbb
->domain
= isl_set_set_tuple_id (pbb
->domain
,
1414 isl_id_for_pbb (scop
, pbb
));
1417 for (i
= 0; i
< nb_loops
; i
++)
1419 isl_set_free (doms
[i
]);
1424 /* Add a constrain to the ACCESSES polyhedron for the alias set of
1425 data reference DR. ACCESSP_NB_DIMS is the dimension of the
1426 ACCESSES polyhedron, DOM_NB_DIMS is the dimension of the iteration
1430 pdr_add_alias_set (isl_map
*acc
, data_reference_p dr
)
1433 int alias_set_num
= 0;
1434 base_alias_pair
*bap
= (base_alias_pair
*)(dr
->aux
);
1436 if (bap
&& bap
->alias_set
)
1437 alias_set_num
= *(bap
->alias_set
);
1439 c
= isl_equality_alloc
1440 (isl_local_space_from_space (isl_map_get_space (acc
)));
1441 c
= isl_constraint_set_constant_si (c
, -alias_set_num
);
1442 c
= isl_constraint_set_coefficient_si (c
, isl_dim_out
, 0, 1);
1444 return isl_map_add_constraint (acc
, c
);
1447 /* Assign the affine expression INDEX to the output dimension POS of
1448 MAP and return the result. */
1451 set_index (isl_map
*map
, int pos
, isl_pw_aff
*index
)
1454 int len
= isl_map_dim (map
, isl_dim_out
);
1457 index_map
= isl_map_from_pw_aff (index
);
1458 index_map
= isl_map_insert_dims (index_map
, isl_dim_out
, 0, pos
);
1459 index_map
= isl_map_add_dims (index_map
, isl_dim_out
, len
- pos
- 1);
1461 id
= isl_map_get_tuple_id (map
, isl_dim_out
);
1462 index_map
= isl_map_set_tuple_id (index_map
, isl_dim_out
, id
);
1463 id
= isl_map_get_tuple_id (map
, isl_dim_in
);
1464 index_map
= isl_map_set_tuple_id (index_map
, isl_dim_in
, id
);
1466 return isl_map_intersect (map
, index_map
);
1469 /* Add to ACCESSES polyhedron equalities defining the access functions
1470 to the memory. ACCESSP_NB_DIMS is the dimension of the ACCESSES
1471 polyhedron, DOM_NB_DIMS is the dimension of the iteration domain.
1472 PBB is the poly_bb_p that contains the data reference DR. */
1475 pdr_add_memory_accesses (isl_map
*acc
, data_reference_p dr
, poly_bb_p pbb
)
1477 int i
, nb_subscripts
= DR_NUM_DIMENSIONS (dr
);
1478 scop_p scop
= PBB_SCOP (pbb
);
1480 for (i
= 0; i
< nb_subscripts
; i
++)
1483 tree afn
= DR_ACCESS_FN (dr
, nb_subscripts
- 1 - i
);
1485 aff
= extract_affine (scop
, afn
,
1486 isl_space_domain (isl_map_get_space (acc
)));
1487 acc
= set_index (acc
, i
+ 1, aff
);
1493 /* Add constrains representing the size of the accessed data to the
1494 ACCESSES polyhedron. ACCESSP_NB_DIMS is the dimension of the
1495 ACCESSES polyhedron, DOM_NB_DIMS is the dimension of the iteration
1499 pdr_add_data_dimensions (isl_set
*extent
, scop_p scop
, data_reference_p dr
)
1501 tree ref
= DR_REF (dr
);
1502 int i
, nb_subscripts
= DR_NUM_DIMENSIONS (dr
);
1504 for (i
= nb_subscripts
- 1; i
>= 0; i
--, ref
= TREE_OPERAND (ref
, 0))
1508 if (TREE_CODE (ref
) != ARRAY_REF
)
1511 low
= array_ref_low_bound (ref
);
1512 high
= array_ref_up_bound (ref
);
1514 /* XXX The PPL code dealt separately with
1515 subscript - low >= 0 and high - subscript >= 0 in case one of
1516 the two bounds isn't known. Do the same here? */
1518 if (tree_fits_shwi_p (low
)
1520 && tree_fits_shwi_p (high
)
1521 /* 1-element arrays at end of structures may extend over
1522 their declared size. */
1523 && !(array_at_struct_end_p (ref
)
1524 && operand_equal_p (low
, high
, 0)))
1528 isl_set
*univ
, *lbs
, *ubs
;
1532 isl_pw_aff
*lb
= extract_affine_int (low
, isl_set_get_space (extent
));
1533 isl_pw_aff
*ub
= extract_affine_int (high
, isl_set_get_space (extent
));
1536 valid
= isl_pw_aff_nonneg_set (isl_pw_aff_copy (ub
));
1537 valid
= isl_set_project_out (valid
, isl_dim_set
, 0,
1538 isl_set_dim (valid
, isl_dim_set
));
1539 scop
->context
= isl_set_intersect (scop
->context
, valid
);
1541 space
= isl_set_get_space (extent
);
1542 aff
= isl_aff_zero_on_domain (isl_local_space_from_space (space
));
1543 aff
= isl_aff_add_coefficient_si (aff
, isl_dim_in
, i
+ 1, 1);
1544 univ
= isl_set_universe (isl_space_domain (isl_aff_get_space (aff
)));
1545 index
= isl_pw_aff_alloc (univ
, aff
);
1547 id
= isl_set_get_tuple_id (extent
);
1548 lb
= isl_pw_aff_set_tuple_id (lb
, isl_dim_in
, isl_id_copy (id
));
1549 ub
= isl_pw_aff_set_tuple_id (ub
, isl_dim_in
, id
);
1551 /* low <= sub_i <= high */
1552 lbs
= isl_pw_aff_ge_set (isl_pw_aff_copy (index
), lb
);
1553 ubs
= isl_pw_aff_le_set (index
, ub
);
1554 extent
= isl_set_intersect (extent
, lbs
);
1555 extent
= isl_set_intersect (extent
, ubs
);
1562 /* Build data accesses for DR in PBB. */
1565 build_poly_dr (data_reference_p dr
, poly_bb_p pbb
)
1567 int dr_base_object_set
;
1570 scop_p scop
= PBB_SCOP (pbb
);
1573 isl_space
*dc
= isl_set_get_space (pbb
->domain
);
1574 int nb_out
= 1 + DR_NUM_DIMENSIONS (dr
);
1575 isl_space
*space
= isl_space_add_dims (isl_space_from_domain (dc
),
1576 isl_dim_out
, nb_out
);
1578 acc
= isl_map_universe (space
);
1579 acc
= isl_map_set_tuple_id (acc
, isl_dim_out
, isl_id_for_dr (scop
, dr
));
1582 acc
= pdr_add_alias_set (acc
, dr
);
1583 acc
= pdr_add_memory_accesses (acc
, dr
, pbb
);
1586 isl_id
*id
= isl_id_for_dr (scop
, dr
);
1587 int nb
= 1 + DR_NUM_DIMENSIONS (dr
);
1588 isl_space
*space
= isl_space_set_alloc (scop
->ctx
, 0, nb
);
1589 int alias_set_num
= 0;
1590 base_alias_pair
*bap
= (base_alias_pair
*)(dr
->aux
);
1592 if (bap
&& bap
->alias_set
)
1593 alias_set_num
= *(bap
->alias_set
);
1595 space
= isl_space_set_tuple_id (space
, isl_dim_set
, id
);
1596 extent
= isl_set_nat_universe (space
);
1597 extent
= isl_set_fix_si (extent
, isl_dim_set
, 0, alias_set_num
);
1598 extent
= pdr_add_data_dimensions (extent
, scop
, dr
);
1601 gcc_assert (dr
->aux
);
1602 dr_base_object_set
= ((base_alias_pair
*)(dr
->aux
))->base_obj_set
;
1604 new_poly_dr (pbb
, dr_base_object_set
,
1605 DR_IS_READ (dr
) ? PDR_READ
: PDR_WRITE
,
1606 dr
, DR_NUM_DIMENSIONS (dr
), acc
, extent
);
1609 /* Write to FILE the alias graph of data references in DIMACS format. */
1612 write_alias_graph_to_ascii_dimacs (FILE *file
, char *comment
,
1613 vec
<data_reference_p
> drs
)
1615 int num_vertex
= drs
.length ();
1617 data_reference_p dr1
, dr2
;
1620 if (num_vertex
== 0)
1623 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1624 for (j
= i
+ 1; drs
.iterate (j
, &dr2
); j
++)
1625 if (dr_may_alias_p (dr1
, dr2
, true))
1628 fprintf (file
, "$\n");
1631 fprintf (file
, "c %s\n", comment
);
1633 fprintf (file
, "p edge %d %d\n", num_vertex
, edge_num
);
1635 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1636 for (j
= i
+ 1; drs
.iterate (j
, &dr2
); j
++)
1637 if (dr_may_alias_p (dr1
, dr2
, true))
1638 fprintf (file
, "e %d %d\n", i
+ 1, j
+ 1);
1643 /* Write to FILE the alias graph of data references in DOT format. */
1646 write_alias_graph_to_ascii_dot (FILE *file
, char *comment
,
1647 vec
<data_reference_p
> drs
)
1649 int num_vertex
= drs
.length ();
1650 data_reference_p dr1
, dr2
;
1653 if (num_vertex
== 0)
1656 fprintf (file
, "$\n");
1659 fprintf (file
, "c %s\n", comment
);
1661 /* First print all the vertices. */
1662 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1663 fprintf (file
, "n%d;\n", i
);
1665 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1666 for (j
= i
+ 1; drs
.iterate (j
, &dr2
); j
++)
1667 if (dr_may_alias_p (dr1
, dr2
, true))
1668 fprintf (file
, "n%d n%d\n", i
, j
);
1673 /* Write to FILE the alias graph of data references in ECC format. */
1676 write_alias_graph_to_ascii_ecc (FILE *file
, char *comment
,
1677 vec
<data_reference_p
> drs
)
1679 int num_vertex
= drs
.length ();
1680 data_reference_p dr1
, dr2
;
1683 if (num_vertex
== 0)
1686 fprintf (file
, "$\n");
1689 fprintf (file
, "c %s\n", comment
);
1691 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1692 for (j
= i
+ 1; drs
.iterate (j
, &dr2
); j
++)
1693 if (dr_may_alias_p (dr1
, dr2
, true))
1694 fprintf (file
, "%d %d\n", i
, j
);
1699 /* Check if DR1 and DR2 are in the same object set. */
1702 dr_same_base_object_p (const struct data_reference
*dr1
,
1703 const struct data_reference
*dr2
)
1705 return operand_equal_p (DR_BASE_OBJECT (dr1
), DR_BASE_OBJECT (dr2
), 0);
1708 /* Uses DFS component number as representative of alias-sets. Also tests for
1709 optimality by verifying if every connected component is a clique. Returns
1710 true (1) if the above test is true, and false (0) otherwise. */
1713 build_alias_set_optimal_p (vec
<data_reference_p
> drs
)
1715 int num_vertices
= drs
.length ();
1716 struct graph
*g
= new_graph (num_vertices
);
1717 data_reference_p dr1
, dr2
;
1719 int num_connected_components
;
1720 int v_indx1
, v_indx2
, num_vertices_in_component
;
1723 struct graph_edge
*e
;
1724 int this_component_is_clique
;
1725 int all_components_are_cliques
= 1;
1727 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1728 for (j
= i
+1; drs
.iterate (j
, &dr2
); j
++)
1729 if (dr_may_alias_p (dr1
, dr2
, true))
1735 all_vertices
= XNEWVEC (int, num_vertices
);
1736 vertices
= XNEWVEC (int, num_vertices
);
1737 for (i
= 0; i
< num_vertices
; i
++)
1738 all_vertices
[i
] = i
;
1740 num_connected_components
= graphds_dfs (g
, all_vertices
, num_vertices
,
1742 for (i
= 0; i
< g
->n_vertices
; i
++)
1744 data_reference_p dr
= drs
[i
];
1745 base_alias_pair
*bap
;
1747 gcc_assert (dr
->aux
);
1748 bap
= (base_alias_pair
*)(dr
->aux
);
1750 bap
->alias_set
= XNEW (int);
1751 *(bap
->alias_set
) = g
->vertices
[i
].component
+ 1;
1754 /* Verify if the DFS numbering results in optimal solution. */
1755 for (i
= 0; i
< num_connected_components
; i
++)
1757 num_vertices_in_component
= 0;
1758 /* Get all vertices whose DFS component number is the same as i. */
1759 for (j
= 0; j
< num_vertices
; j
++)
1760 if (g
->vertices
[j
].component
== i
)
1761 vertices
[num_vertices_in_component
++] = j
;
1763 /* Now test if the vertices in 'vertices' form a clique, by testing
1764 for edges among each pair. */
1765 this_component_is_clique
= 1;
1766 for (v_indx1
= 0; v_indx1
< num_vertices_in_component
; v_indx1
++)
1768 for (v_indx2
= v_indx1
+1; v_indx2
< num_vertices_in_component
; v_indx2
++)
1770 /* Check if the two vertices are connected by iterating
1771 through all the edges which have one of these are source. */
1772 e
= g
->vertices
[vertices
[v_indx2
]].pred
;
1775 if (e
->src
== vertices
[v_indx1
])
1781 this_component_is_clique
= 0;
1785 if (!this_component_is_clique
)
1786 all_components_are_cliques
= 0;
1790 free (all_vertices
);
1793 return all_components_are_cliques
;
1796 /* Group each data reference in DRS with its base object set num. */
1799 build_base_obj_set_for_drs (vec
<data_reference_p
> drs
)
1801 int num_vertex
= drs
.length ();
1802 struct graph
*g
= new_graph (num_vertex
);
1803 data_reference_p dr1
, dr2
;
1807 FOR_EACH_VEC_ELT (drs
, i
, dr1
)
1808 for (j
= i
+ 1; drs
.iterate (j
, &dr2
); j
++)
1809 if (dr_same_base_object_p (dr1
, dr2
))
1815 queue
= XNEWVEC (int, num_vertex
);
1816 for (i
= 0; i
< num_vertex
; i
++)
1819 graphds_dfs (g
, queue
, num_vertex
, NULL
, true, NULL
);
1821 for (i
= 0; i
< g
->n_vertices
; i
++)
1823 data_reference_p dr
= drs
[i
];
1824 base_alias_pair
*bap
;
1826 gcc_assert (dr
->aux
);
1827 bap
= (base_alias_pair
*)(dr
->aux
);
1829 bap
->base_obj_set
= g
->vertices
[i
].component
+ 1;
1836 /* Build the data references for PBB. */
1839 build_pbb_drs (poly_bb_p pbb
)
1842 data_reference_p dr
;
1843 vec
<data_reference_p
> gbb_drs
= GBB_DATA_REFS (PBB_BLACK_BOX (pbb
));
1845 FOR_EACH_VEC_ELT (gbb_drs
, j
, dr
)
1846 build_poly_dr (dr
, pbb
);
1849 /* Dump to file the alias graphs for the data references in DRS. */
1852 dump_alias_graphs (vec
<data_reference_p
> drs
)
1855 FILE *file_dimacs
, *file_ecc
, *file_dot
;
1857 file_dimacs
= fopen ("/tmp/dr_alias_graph_dimacs", "ab");
1860 snprintf (comment
, sizeof (comment
), "%s %s", main_input_filename
,
1861 current_function_name ());
1862 write_alias_graph_to_ascii_dimacs (file_dimacs
, comment
, drs
);
1863 fclose (file_dimacs
);
1866 file_ecc
= fopen ("/tmp/dr_alias_graph_ecc", "ab");
1869 snprintf (comment
, sizeof (comment
), "%s %s", main_input_filename
,
1870 current_function_name ());
1871 write_alias_graph_to_ascii_ecc (file_ecc
, comment
, drs
);
1875 file_dot
= fopen ("/tmp/dr_alias_graph_dot", "ab");
1878 snprintf (comment
, sizeof (comment
), "%s %s", main_input_filename
,
1879 current_function_name ());
1880 write_alias_graph_to_ascii_dot (file_dot
, comment
, drs
);
1885 /* Build data references in SCOP. */
1888 build_scop_drs (scop_p scop
)
1892 data_reference_p dr
;
1893 auto_vec
<data_reference_p
, 3> drs
;
1895 /* Remove all the PBBs that do not have data references: these basic
1896 blocks are not handled in the polyhedral representation. */
1897 for (i
= 0; SCOP_BBS (scop
).iterate (i
, &pbb
); i
++)
1898 if (GBB_DATA_REFS (PBB_BLACK_BOX (pbb
)).is_empty ())
1900 free_gimple_bb (PBB_BLACK_BOX (pbb
));
1902 SCOP_BBS (scop
).ordered_remove (i
);
1906 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
1907 for (j
= 0; GBB_DATA_REFS (PBB_BLACK_BOX (pbb
)).iterate (j
, &dr
); j
++)
1910 FOR_EACH_VEC_ELT (drs
, i
, dr
)
1911 dr
->aux
= XNEW (base_alias_pair
);
1913 if (!build_alias_set_optimal_p (drs
))
1915 /* TODO: Add support when building alias set is not optimal. */
1919 build_base_obj_set_for_drs (drs
);
1921 /* When debugging, enable the following code. This cannot be used
1922 in production compilers. */
1924 dump_alias_graphs (drs
);
1928 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
1929 build_pbb_drs (pbb
);
1932 /* Return a gsi at the position of the phi node STMT. */
1934 static gimple_stmt_iterator
1935 gsi_for_phi_node (gimple stmt
)
1937 gimple_stmt_iterator psi
;
1938 basic_block bb
= gimple_bb (stmt
);
1940 for (psi
= gsi_start_phis (bb
); !gsi_end_p (psi
); gsi_next (&psi
))
1941 if (stmt
== gsi_stmt (psi
))
1948 /* Analyze all the data references of STMTS and add them to the
1949 GBB_DATA_REFS vector of BB. */
1952 analyze_drs_in_stmts (scop_p scop
, basic_block bb
, vec
<gimple
> stmts
)
1958 sese region
= SCOP_REGION (scop
);
1960 if (!bb_in_sese_p (bb
, region
))
1963 nest
= outermost_loop_in_sese_1 (region
, bb
);
1964 gbb
= gbb_from_bb (bb
);
1966 FOR_EACH_VEC_ELT (stmts
, i
, stmt
)
1970 if (is_gimple_debug (stmt
))
1973 loop
= loop_containing_stmt (stmt
);
1974 if (!loop_in_sese_p (loop
, region
))
1977 graphite_find_data_references_in_stmt (nest
, loop
, stmt
,
1978 &GBB_DATA_REFS (gbb
));
1982 /* Insert STMT at the end of the STMTS sequence and then insert the
1983 statements from STMTS at INSERT_GSI and call analyze_drs_in_stmts
1987 insert_stmts (scop_p scop
, gimple stmt
, gimple_seq stmts
,
1988 gimple_stmt_iterator insert_gsi
)
1990 gimple_stmt_iterator gsi
;
1991 auto_vec
<gimple
, 3> x
;
1993 gimple_seq_add_stmt (&stmts
, stmt
);
1994 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
1995 x
.safe_push (gsi_stmt (gsi
));
1997 gsi_insert_seq_before (&insert_gsi
, stmts
, GSI_SAME_STMT
);
1998 analyze_drs_in_stmts (scop
, gsi_bb (insert_gsi
), x
);
2001 /* Insert the assignment "RES := EXPR" just after AFTER_STMT. */
2004 insert_out_of_ssa_copy (scop_p scop
, tree res
, tree expr
, gimple after_stmt
)
2007 gimple_stmt_iterator gsi
;
2008 tree var
= force_gimple_operand (expr
, &stmts
, true, NULL_TREE
);
2009 gimple stmt
= gimple_build_assign (unshare_expr (res
), var
);
2010 auto_vec
<gimple
, 3> x
;
2012 gimple_seq_add_stmt (&stmts
, stmt
);
2013 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
2014 x
.safe_push (gsi_stmt (gsi
));
2016 if (gimple_code (after_stmt
) == GIMPLE_PHI
)
2018 gsi
= gsi_after_labels (gimple_bb (after_stmt
));
2019 gsi_insert_seq_before (&gsi
, stmts
, GSI_NEW_STMT
);
2023 gsi
= gsi_for_stmt (after_stmt
);
2024 gsi_insert_seq_after (&gsi
, stmts
, GSI_NEW_STMT
);
2027 analyze_drs_in_stmts (scop
, gimple_bb (after_stmt
), x
);
2030 /* Creates a poly_bb_p for basic_block BB from the existing PBB. */
2033 new_pbb_from_pbb (scop_p scop
, poly_bb_p pbb
, basic_block bb
)
2035 vec
<data_reference_p
> drs
;
2037 gimple_bb_p gbb
= PBB_BLACK_BOX (pbb
);
2038 gimple_bb_p gbb1
= new_gimple_bb (bb
, drs
);
2039 poly_bb_p pbb1
= new_poly_bb (scop
, gbb1
);
2040 int index
, n
= SCOP_BBS (scop
).length ();
2042 /* The INDEX of PBB in SCOP_BBS. */
2043 for (index
= 0; index
< n
; index
++)
2044 if (SCOP_BBS (scop
)[index
] == pbb
)
2047 pbb1
->domain
= isl_set_copy (pbb
->domain
);
2049 GBB_PBB (gbb1
) = pbb1
;
2050 GBB_CONDITIONS (gbb1
) = GBB_CONDITIONS (gbb
).copy ();
2051 GBB_CONDITION_CASES (gbb1
) = GBB_CONDITION_CASES (gbb
).copy ();
2052 SCOP_BBS (scop
).safe_insert (index
+ 1, pbb1
);
2055 /* Insert on edge E the assignment "RES := EXPR". */
2058 insert_out_of_ssa_copy_on_edge (scop_p scop
, edge e
, tree res
, tree expr
)
2060 gimple_stmt_iterator gsi
;
2061 gimple_seq stmts
= NULL
;
2062 tree var
= force_gimple_operand (expr
, &stmts
, true, NULL_TREE
);
2063 gimple stmt
= gimple_build_assign (unshare_expr (res
), var
);
2065 auto_vec
<gimple
, 3> x
;
2067 gimple_seq_add_stmt (&stmts
, stmt
);
2068 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
2069 x
.safe_push (gsi_stmt (gsi
));
2071 gsi_insert_seq_on_edge (e
, stmts
);
2072 gsi_commit_edge_inserts ();
2073 bb
= gimple_bb (stmt
);
2075 if (!bb_in_sese_p (bb
, SCOP_REGION (scop
)))
2078 if (!gbb_from_bb (bb
))
2079 new_pbb_from_pbb (scop
, pbb_from_bb (e
->src
), bb
);
2081 analyze_drs_in_stmts (scop
, bb
, x
);
2084 /* Creates a zero dimension array of the same type as VAR. */
2087 create_zero_dim_array (tree var
, const char *base_name
)
2089 tree index_type
= build_index_type (integer_zero_node
);
2090 tree elt_type
= TREE_TYPE (var
);
2091 tree array_type
= build_array_type (elt_type
, index_type
);
2092 tree base
= create_tmp_var (array_type
, base_name
);
2094 return build4 (ARRAY_REF
, elt_type
, base
, integer_zero_node
, NULL_TREE
,
2098 /* Returns true when PHI is a loop close phi node. */
2101 scalar_close_phi_node_p (gimple phi
)
2103 if (gimple_code (phi
) != GIMPLE_PHI
2104 || virtual_operand_p (gimple_phi_result (phi
)))
2107 /* Note that loop close phi nodes should have a single argument
2108 because we translated the representation into a canonical form
2109 before Graphite: see canonicalize_loop_closed_ssa_form. */
2110 return (gimple_phi_num_args (phi
) == 1);
2113 /* For a definition DEF in REGION, propagates the expression EXPR in
2114 all the uses of DEF outside REGION. */
2117 propagate_expr_outside_region (tree def
, tree expr
, sese region
)
2119 imm_use_iterator imm_iter
;
2122 bool replaced_once
= false;
2124 gcc_assert (TREE_CODE (def
) == SSA_NAME
);
2126 expr
= force_gimple_operand (unshare_expr (expr
), &stmts
, true,
2129 FOR_EACH_IMM_USE_STMT (use_stmt
, imm_iter
, def
)
2130 if (!is_gimple_debug (use_stmt
)
2131 && !bb_in_sese_p (gimple_bb (use_stmt
), region
))
2134 use_operand_p use_p
;
2136 FOR_EACH_PHI_OR_STMT_USE (use_p
, use_stmt
, iter
, SSA_OP_ALL_USES
)
2137 if (operand_equal_p (def
, USE_FROM_PTR (use_p
), 0)
2138 && (replaced_once
= true))
2139 replace_exp (use_p
, expr
);
2141 update_stmt (use_stmt
);
2146 gsi_insert_seq_on_edge (SESE_ENTRY (region
), stmts
);
2147 gsi_commit_edge_inserts ();
2151 /* Rewrite out of SSA the reduction phi node at PSI by creating a zero
2152 dimension array for it. */
2155 rewrite_close_phi_out_of_ssa (scop_p scop
, gimple_stmt_iterator
*psi
)
2157 sese region
= SCOP_REGION (scop
);
2158 gimple phi
= gsi_stmt (*psi
);
2159 tree res
= gimple_phi_result (phi
);
2160 basic_block bb
= gimple_bb (phi
);
2161 gimple_stmt_iterator gsi
= gsi_after_labels (bb
);
2162 tree arg
= gimple_phi_arg_def (phi
, 0);
2165 /* Note that loop close phi nodes should have a single argument
2166 because we translated the representation into a canonical form
2167 before Graphite: see canonicalize_loop_closed_ssa_form. */
2168 gcc_assert (gimple_phi_num_args (phi
) == 1);
2170 /* The phi node can be a non close phi node, when its argument is
2171 invariant, or a default definition. */
2172 if (is_gimple_min_invariant (arg
)
2173 || SSA_NAME_IS_DEFAULT_DEF (arg
))
2175 propagate_expr_outside_region (res
, arg
, region
);
2180 else if (gimple_bb (SSA_NAME_DEF_STMT (arg
))->loop_father
== bb
->loop_father
)
2182 propagate_expr_outside_region (res
, arg
, region
);
2183 stmt
= gimple_build_assign (res
, arg
);
2184 remove_phi_node (psi
, false);
2185 gsi_insert_before (&gsi
, stmt
, GSI_NEW_STMT
);
2189 /* If res is scev analyzable and is not a scalar value, it is safe
2190 to ignore the close phi node: it will be code generated in the
2191 out of Graphite pass. */
2192 else if (scev_analyzable_p (res
, region
))
2194 loop_p loop
= loop_containing_stmt (SSA_NAME_DEF_STMT (res
));
2197 if (!loop_in_sese_p (loop
, region
))
2199 loop
= loop_containing_stmt (SSA_NAME_DEF_STMT (arg
));
2200 scev
= scalar_evolution_in_region (region
, loop
, arg
);
2201 scev
= compute_overall_effect_of_inner_loop (loop
, scev
);
2204 scev
= scalar_evolution_in_region (region
, loop
, res
);
2206 if (tree_does_not_contain_chrecs (scev
))
2207 propagate_expr_outside_region (res
, scev
, region
);
2214 tree zero_dim_array
= create_zero_dim_array (res
, "Close_Phi");
2216 stmt
= gimple_build_assign (res
, unshare_expr (zero_dim_array
));
2218 if (TREE_CODE (arg
) == SSA_NAME
)
2219 insert_out_of_ssa_copy (scop
, zero_dim_array
, arg
,
2220 SSA_NAME_DEF_STMT (arg
));
2222 insert_out_of_ssa_copy_on_edge (scop
, single_pred_edge (bb
),
2223 zero_dim_array
, arg
);
2226 remove_phi_node (psi
, false);
2227 SSA_NAME_DEF_STMT (res
) = stmt
;
2229 insert_stmts (scop
, stmt
, NULL
, gsi_after_labels (bb
));
2232 /* Rewrite out of SSA the reduction phi node at PSI by creating a zero
2233 dimension array for it. */
2236 rewrite_phi_out_of_ssa (scop_p scop
, gimple_stmt_iterator
*psi
)
2239 gimple phi
= gsi_stmt (*psi
);
2240 basic_block bb
= gimple_bb (phi
);
2241 tree res
= gimple_phi_result (phi
);
2242 tree zero_dim_array
= create_zero_dim_array (res
, "phi_out_of_ssa");
2245 for (i
= 0; i
< gimple_phi_num_args (phi
); i
++)
2247 tree arg
= gimple_phi_arg_def (phi
, i
);
2248 edge e
= gimple_phi_arg_edge (phi
, i
);
2250 /* Avoid the insertion of code in the loop latch to please the
2251 pattern matching of the vectorizer. */
2252 if (TREE_CODE (arg
) == SSA_NAME
2253 && e
->src
== bb
->loop_father
->latch
)
2254 insert_out_of_ssa_copy (scop
, zero_dim_array
, arg
,
2255 SSA_NAME_DEF_STMT (arg
));
2257 insert_out_of_ssa_copy_on_edge (scop
, e
, zero_dim_array
, arg
);
2260 stmt
= gimple_build_assign (res
, unshare_expr (zero_dim_array
));
2261 remove_phi_node (psi
, false);
2262 insert_stmts (scop
, stmt
, NULL
, gsi_after_labels (bb
));
2265 /* Rewrite the degenerate phi node at position PSI from the degenerate
2266 form "x = phi (y, y, ..., y)" to "x = y". */
2269 rewrite_degenerate_phi (gimple_stmt_iterator
*psi
)
2273 gimple_stmt_iterator gsi
;
2274 gimple phi
= gsi_stmt (*psi
);
2275 tree res
= gimple_phi_result (phi
);
2278 bb
= gimple_bb (phi
);
2279 rhs
= degenerate_phi_result (phi
);
2282 stmt
= gimple_build_assign (res
, rhs
);
2283 remove_phi_node (psi
, false);
2285 gsi
= gsi_after_labels (bb
);
2286 gsi_insert_before (&gsi
, stmt
, GSI_NEW_STMT
);
2289 /* Rewrite out of SSA all the reduction phi nodes of SCOP. */
2292 rewrite_reductions_out_of_ssa (scop_p scop
)
2295 gimple_stmt_iterator psi
;
2296 sese region
= SCOP_REGION (scop
);
2298 FOR_EACH_BB_FN (bb
, cfun
)
2299 if (bb_in_sese_p (bb
, region
))
2300 for (psi
= gsi_start_phis (bb
); !gsi_end_p (psi
);)
2302 gimple phi
= gsi_stmt (psi
);
2304 if (virtual_operand_p (gimple_phi_result (phi
)))
2310 if (gimple_phi_num_args (phi
) > 1
2311 && degenerate_phi_result (phi
))
2312 rewrite_degenerate_phi (&psi
);
2314 else if (scalar_close_phi_node_p (phi
))
2315 rewrite_close_phi_out_of_ssa (scop
, &psi
);
2317 else if (reduction_phi_p (region
, &psi
))
2318 rewrite_phi_out_of_ssa (scop
, &psi
);
2321 update_ssa (TODO_update_ssa
);
2322 #ifdef ENABLE_CHECKING
2323 verify_loop_closed_ssa (true);
2327 /* Rewrite the scalar dependence of DEF used in USE_STMT with a memory
2328 read from ZERO_DIM_ARRAY. */
2331 rewrite_cross_bb_scalar_dependence (scop_p scop
, tree zero_dim_array
,
2332 tree def
, gimple use_stmt
)
2337 use_operand_p use_p
;
2339 gcc_assert (gimple_code (use_stmt
) != GIMPLE_PHI
);
2341 name
= copy_ssa_name (def
, NULL
);
2342 name_stmt
= gimple_build_assign (name
, zero_dim_array
);
2344 gimple_assign_set_lhs (name_stmt
, name
);
2345 insert_stmts (scop
, name_stmt
, NULL
, gsi_for_stmt (use_stmt
));
2347 FOR_EACH_SSA_USE_OPERAND (use_p
, use_stmt
, iter
, SSA_OP_ALL_USES
)
2348 if (operand_equal_p (def
, USE_FROM_PTR (use_p
), 0))
2349 replace_exp (use_p
, name
);
2351 update_stmt (use_stmt
);
2354 /* For every definition DEF in the SCOP that is used outside the scop,
2355 insert a closing-scop definition in the basic block just after this
2359 handle_scalar_deps_crossing_scop_limits (scop_p scop
, tree def
, gimple stmt
)
2361 tree var
= create_tmp_reg (TREE_TYPE (def
), NULL
);
2362 tree new_name
= make_ssa_name (var
, stmt
);
2363 bool needs_copy
= false;
2364 use_operand_p use_p
;
2365 imm_use_iterator imm_iter
;
2367 sese region
= SCOP_REGION (scop
);
2369 FOR_EACH_IMM_USE_STMT (use_stmt
, imm_iter
, def
)
2371 if (!bb_in_sese_p (gimple_bb (use_stmt
), region
))
2373 FOR_EACH_IMM_USE_ON_STMT (use_p
, imm_iter
)
2375 SET_USE (use_p
, new_name
);
2377 update_stmt (use_stmt
);
2382 /* Insert in the empty BB just after the scop a use of DEF such
2383 that the rewrite of cross_bb_scalar_dependences won't insert
2384 arrays everywhere else. */
2387 gimple assign
= gimple_build_assign (new_name
, def
);
2388 gimple_stmt_iterator psi
= gsi_after_labels (SESE_EXIT (region
)->dest
);
2390 update_stmt (assign
);
2391 gsi_insert_before (&psi
, assign
, GSI_SAME_STMT
);
2395 /* Rewrite the scalar dependences crossing the boundary of the BB
2396 containing STMT with an array. Return true when something has been
2400 rewrite_cross_bb_scalar_deps (scop_p scop
, gimple_stmt_iterator
*gsi
)
2402 sese region
= SCOP_REGION (scop
);
2403 gimple stmt
= gsi_stmt (*gsi
);
2404 imm_use_iterator imm_iter
;
2407 tree zero_dim_array
= NULL_TREE
;
2411 switch (gimple_code (stmt
))
2414 def
= gimple_assign_lhs (stmt
);
2418 def
= gimple_call_lhs (stmt
);
2426 || !is_gimple_reg (def
))
2429 if (scev_analyzable_p (def
, region
))
2431 loop_p loop
= loop_containing_stmt (SSA_NAME_DEF_STMT (def
));
2432 tree scev
= scalar_evolution_in_region (region
, loop
, def
);
2434 if (tree_contains_chrecs (scev
, NULL
))
2437 propagate_expr_outside_region (def
, scev
, region
);
2441 def_bb
= gimple_bb (stmt
);
2443 handle_scalar_deps_crossing_scop_limits (scop
, def
, stmt
);
2445 FOR_EACH_IMM_USE_STMT (use_stmt
, imm_iter
, def
)
2446 if (gimple_code (use_stmt
) == GIMPLE_PHI
2449 gimple_stmt_iterator psi
= gsi_for_stmt (use_stmt
);
2451 if (scalar_close_phi_node_p (gsi_stmt (psi
)))
2452 rewrite_close_phi_out_of_ssa (scop
, &psi
);
2454 rewrite_phi_out_of_ssa (scop
, &psi
);
2457 FOR_EACH_IMM_USE_STMT (use_stmt
, imm_iter
, def
)
2458 if (gimple_code (use_stmt
) != GIMPLE_PHI
2459 && def_bb
!= gimple_bb (use_stmt
)
2460 && !is_gimple_debug (use_stmt
)
2463 if (!zero_dim_array
)
2465 zero_dim_array
= create_zero_dim_array
2466 (def
, "Cross_BB_scalar_dependence");
2467 insert_out_of_ssa_copy (scop
, zero_dim_array
, def
,
2468 SSA_NAME_DEF_STMT (def
));
2472 rewrite_cross_bb_scalar_dependence (scop
, zero_dim_array
,
2479 /* Rewrite out of SSA all the reduction phi nodes of SCOP. */
2482 rewrite_cross_bb_scalar_deps_out_of_ssa (scop_p scop
)
2485 gimple_stmt_iterator psi
;
2486 sese region
= SCOP_REGION (scop
);
2487 bool changed
= false;
2489 /* Create an extra empty BB after the scop. */
2490 split_edge (SESE_EXIT (region
));
2492 FOR_EACH_BB_FN (bb
, cfun
)
2493 if (bb_in_sese_p (bb
, region
))
2494 for (psi
= gsi_start_bb (bb
); !gsi_end_p (psi
); gsi_next (&psi
))
2495 changed
|= rewrite_cross_bb_scalar_deps (scop
, &psi
);
2500 update_ssa (TODO_update_ssa
);
2501 #ifdef ENABLE_CHECKING
2502 verify_loop_closed_ssa (true);
2507 /* Returns the number of pbbs that are in loops contained in SCOP. */
2510 nb_pbbs_in_loops (scop_p scop
)
2516 FOR_EACH_VEC_ELT (SCOP_BBS (scop
), i
, pbb
)
2517 if (loop_in_sese_p (gbb_loop (PBB_BLACK_BOX (pbb
)), SCOP_REGION (scop
)))
2523 /* Return the number of data references in BB that write in
2527 nb_data_writes_in_bb (basic_block bb
)
2530 gimple_stmt_iterator gsi
;
2532 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
2533 if (gimple_vdef (gsi_stmt (gsi
)))
2539 /* Splits at STMT the basic block BB represented as PBB in the
2543 split_pbb (scop_p scop
, poly_bb_p pbb
, basic_block bb
, gimple stmt
)
2545 edge e1
= split_block (bb
, stmt
);
2546 new_pbb_from_pbb (scop
, pbb
, e1
->dest
);
2550 /* Splits STMT out of its current BB. This is done for reduction
2551 statements for which we want to ignore data dependences. */
2554 split_reduction_stmt (scop_p scop
, gimple stmt
)
2556 basic_block bb
= gimple_bb (stmt
);
2557 poly_bb_p pbb
= pbb_from_bb (bb
);
2558 gimple_bb_p gbb
= gbb_from_bb (bb
);
2561 data_reference_p dr
;
2563 /* Do not split basic blocks with no writes to memory: the reduction
2564 will be the only write to memory. */
2565 if (nb_data_writes_in_bb (bb
) == 0
2566 /* Or if we have already marked BB as a reduction. */
2567 || PBB_IS_REDUCTION (pbb_from_bb (bb
)))
2570 e1
= split_pbb (scop
, pbb
, bb
, stmt
);
2572 /* Split once more only when the reduction stmt is not the only one
2573 left in the original BB. */
2574 if (!gsi_one_before_end_p (gsi_start_nondebug_bb (bb
)))
2576 gimple_stmt_iterator gsi
= gsi_last_bb (bb
);
2578 e1
= split_pbb (scop
, pbb
, bb
, gsi_stmt (gsi
));
2581 /* A part of the data references will end in a different basic block
2582 after the split: move the DRs from the original GBB to the newly
2584 FOR_EACH_VEC_ELT (GBB_DATA_REFS (gbb
), i
, dr
)
2586 basic_block bb1
= gimple_bb (DR_STMT (dr
));
2590 gimple_bb_p gbb1
= gbb_from_bb (bb1
);
2591 GBB_DATA_REFS (gbb1
).safe_push (dr
);
2592 GBB_DATA_REFS (gbb
).ordered_remove (i
);
2600 /* Return true when stmt is a reduction operation. */
2603 is_reduction_operation_p (gimple stmt
)
2605 enum tree_code code
;
2607 gcc_assert (is_gimple_assign (stmt
));
2608 code
= gimple_assign_rhs_code (stmt
);
2610 return flag_associative_math
2611 && commutative_tree_code (code
)
2612 && associative_tree_code (code
);
2615 /* Returns true when PHI contains an argument ARG. */
2618 phi_contains_arg (gimple phi
, tree arg
)
2622 for (i
= 0; i
< gimple_phi_num_args (phi
); i
++)
2623 if (operand_equal_p (arg
, gimple_phi_arg_def (phi
, i
), 0))
2629 /* Return a loop phi node that corresponds to a reduction containing LHS. */
2632 follow_ssa_with_commutative_ops (tree arg
, tree lhs
)
2636 if (TREE_CODE (arg
) != SSA_NAME
)
2639 stmt
= SSA_NAME_DEF_STMT (arg
);
2641 if (gimple_code (stmt
) == GIMPLE_NOP
2642 || gimple_code (stmt
) == GIMPLE_CALL
)
2645 if (gimple_code (stmt
) == GIMPLE_PHI
)
2647 if (phi_contains_arg (stmt
, lhs
))
2652 if (!is_gimple_assign (stmt
))
2655 if (gimple_num_ops (stmt
) == 2)
2656 return follow_ssa_with_commutative_ops (gimple_assign_rhs1 (stmt
), lhs
);
2658 if (is_reduction_operation_p (stmt
))
2660 gimple res
= follow_ssa_with_commutative_ops (gimple_assign_rhs1 (stmt
), lhs
);
2663 follow_ssa_with_commutative_ops (gimple_assign_rhs2 (stmt
), lhs
);
2669 /* Detect commutative and associative scalar reductions starting at
2670 the STMT. Return the phi node of the reduction cycle, or NULL. */
2673 detect_commutative_reduction_arg (tree lhs
, gimple stmt
, tree arg
,
2677 gimple phi
= follow_ssa_with_commutative_ops (arg
, lhs
);
2682 in
->safe_push (stmt
);
2683 out
->safe_push (stmt
);
2687 /* Detect commutative and associative scalar reductions starting at
2688 STMT. Return the phi node of the reduction cycle, or NULL. */
2691 detect_commutative_reduction_assign (gimple stmt
, vec
<gimple
> *in
,
2694 tree lhs
= gimple_assign_lhs (stmt
);
2696 if (gimple_num_ops (stmt
) == 2)
2697 return detect_commutative_reduction_arg (lhs
, stmt
,
2698 gimple_assign_rhs1 (stmt
),
2701 if (is_reduction_operation_p (stmt
))
2703 gimple res
= detect_commutative_reduction_arg (lhs
, stmt
,
2704 gimple_assign_rhs1 (stmt
),
2707 : detect_commutative_reduction_arg (lhs
, stmt
,
2708 gimple_assign_rhs2 (stmt
),
2715 /* Return a loop phi node that corresponds to a reduction containing LHS. */
2718 follow_inital_value_to_phi (tree arg
, tree lhs
)
2722 if (!arg
|| TREE_CODE (arg
) != SSA_NAME
)
2725 stmt
= SSA_NAME_DEF_STMT (arg
);
2727 if (gimple_code (stmt
) == GIMPLE_PHI
2728 && phi_contains_arg (stmt
, lhs
))
2735 /* Return the argument of the loop PHI that is the initial value coming
2736 from outside the loop. */
2739 edge_initial_value_for_loop_phi (gimple phi
)
2743 for (i
= 0; i
< gimple_phi_num_args (phi
); i
++)
2745 edge e
= gimple_phi_arg_edge (phi
, i
);
2747 if (loop_depth (e
->src
->loop_father
)
2748 < loop_depth (e
->dest
->loop_father
))
2755 /* Return the argument of the loop PHI that is the initial value coming
2756 from outside the loop. */
2759 initial_value_for_loop_phi (gimple phi
)
2763 for (i
= 0; i
< gimple_phi_num_args (phi
); i
++)
2765 edge e
= gimple_phi_arg_edge (phi
, i
);
2767 if (loop_depth (e
->src
->loop_father
)
2768 < loop_depth (e
->dest
->loop_father
))
2769 return gimple_phi_arg_def (phi
, i
);
2775 /* Returns true when DEF is used outside the reduction cycle of
2779 used_outside_reduction (tree def
, gimple loop_phi
)
2781 use_operand_p use_p
;
2782 imm_use_iterator imm_iter
;
2783 loop_p loop
= loop_containing_stmt (loop_phi
);
2785 /* In LOOP, DEF should be used only in LOOP_PHI. */
2786 FOR_EACH_IMM_USE_FAST (use_p
, imm_iter
, def
)
2788 gimple stmt
= USE_STMT (use_p
);
2790 if (stmt
!= loop_phi
2791 && !is_gimple_debug (stmt
)
2792 && flow_bb_inside_loop_p (loop
, gimple_bb (stmt
)))
2799 /* Detect commutative and associative scalar reductions belonging to
2800 the SCOP starting at the loop closed phi node STMT. Return the phi
2801 node of the reduction cycle, or NULL. */
2804 detect_commutative_reduction (scop_p scop
, gimple stmt
, vec
<gimple
> *in
,
2807 if (scalar_close_phi_node_p (stmt
))
2809 gimple def
, loop_phi
, phi
, close_phi
= stmt
;
2810 tree init
, lhs
, arg
= gimple_phi_arg_def (close_phi
, 0);
2812 if (TREE_CODE (arg
) != SSA_NAME
)
2815 /* Note that loop close phi nodes should have a single argument
2816 because we translated the representation into a canonical form
2817 before Graphite: see canonicalize_loop_closed_ssa_form. */
2818 gcc_assert (gimple_phi_num_args (close_phi
) == 1);
2820 def
= SSA_NAME_DEF_STMT (arg
);
2821 if (!stmt_in_sese_p (def
, SCOP_REGION (scop
))
2822 || !(loop_phi
= detect_commutative_reduction (scop
, def
, in
, out
)))
2825 lhs
= gimple_phi_result (close_phi
);
2826 init
= initial_value_for_loop_phi (loop_phi
);
2827 phi
= follow_inital_value_to_phi (init
, lhs
);
2829 if (phi
&& (used_outside_reduction (lhs
, phi
)
2830 || !has_single_use (gimple_phi_result (phi
))))
2833 in
->safe_push (loop_phi
);
2834 out
->safe_push (close_phi
);
2838 if (gimple_code (stmt
) == GIMPLE_ASSIGN
)
2839 return detect_commutative_reduction_assign (stmt
, in
, out
);
2844 /* Translate the scalar reduction statement STMT to an array RED
2845 knowing that its recursive phi node is LOOP_PHI. */
2848 translate_scalar_reduction_to_array_for_stmt (scop_p scop
, tree red
,
2849 gimple stmt
, gimple loop_phi
)
2851 tree res
= gimple_phi_result (loop_phi
);
2852 gimple assign
= gimple_build_assign (res
, unshare_expr (red
));
2853 gimple_stmt_iterator gsi
;
2855 insert_stmts (scop
, assign
, NULL
, gsi_after_labels (gimple_bb (loop_phi
)));
2857 assign
= gimple_build_assign (unshare_expr (red
), gimple_assign_lhs (stmt
));
2858 gsi
= gsi_for_stmt (stmt
);
2860 insert_stmts (scop
, assign
, NULL
, gsi
);
2863 /* Removes the PHI node and resets all the debug stmts that are using
2867 remove_phi (gimple phi
)
2869 imm_use_iterator imm_iter
;
2871 use_operand_p use_p
;
2872 gimple_stmt_iterator gsi
;
2873 auto_vec
<gimple
, 3> update
;
2877 def
= PHI_RESULT (phi
);
2878 FOR_EACH_IMM_USE_FAST (use_p
, imm_iter
, def
)
2880 stmt
= USE_STMT (use_p
);
2882 if (is_gimple_debug (stmt
))
2884 gimple_debug_bind_reset_value (stmt
);
2885 update
.safe_push (stmt
);
2889 FOR_EACH_VEC_ELT (update
, i
, stmt
)
2892 gsi
= gsi_for_phi_node (phi
);
2893 remove_phi_node (&gsi
, false);
2896 /* Helper function for for_each_index. For each INDEX of the data
2897 reference REF, returns true when its indices are valid in the loop
2898 nest LOOP passed in as DATA. */
2901 dr_indices_valid_in_loop (tree ref ATTRIBUTE_UNUSED
, tree
*index
, void *data
)
2904 basic_block header
, def_bb
;
2907 if (TREE_CODE (*index
) != SSA_NAME
)
2910 loop
= *((loop_p
*) data
);
2911 header
= loop
->header
;
2912 stmt
= SSA_NAME_DEF_STMT (*index
);
2917 def_bb
= gimple_bb (stmt
);
2922 return dominated_by_p (CDI_DOMINATORS
, header
, def_bb
);
2925 /* When the result of a CLOSE_PHI is written to a memory location,
2926 return a pointer to that memory reference, otherwise return
2930 close_phi_written_to_memory (gimple close_phi
)
2932 imm_use_iterator imm_iter
;
2933 use_operand_p use_p
;
2935 tree res
, def
= gimple_phi_result (close_phi
);
2937 FOR_EACH_IMM_USE_FAST (use_p
, imm_iter
, def
)
2938 if ((stmt
= USE_STMT (use_p
))
2939 && gimple_code (stmt
) == GIMPLE_ASSIGN
2940 && (res
= gimple_assign_lhs (stmt
)))
2942 switch (TREE_CODE (res
))
2952 tree arg
= gimple_phi_arg_def (close_phi
, 0);
2953 loop_p nest
= loop_containing_stmt (SSA_NAME_DEF_STMT (arg
));
2955 /* FIXME: this restriction is for id-{24,25}.f and
2956 could be handled by duplicating the computation of
2957 array indices before the loop of the close_phi. */
2958 if (for_each_index (&res
, dr_indices_valid_in_loop
, &nest
))
2970 /* Rewrite out of SSA the reduction described by the loop phi nodes
2971 IN, and the close phi nodes OUT. IN and OUT are structured by loop
2974 IN: stmt, loop_n, ..., loop_0
2975 OUT: stmt, close_n, ..., close_0
2977 the first element is the reduction statement, and the next elements
2978 are the loop and close phi nodes of each of the outer loops. */
2981 translate_scalar_reduction_to_array (scop_p scop
,
2986 unsigned int i
= out
.length () - 1;
2987 tree red
= close_phi_written_to_memory (out
[i
]);
2989 FOR_EACH_VEC_ELT (in
, i
, loop_phi
)
2991 gimple close_phi
= out
[i
];
2995 gimple stmt
= loop_phi
;
2996 basic_block bb
= split_reduction_stmt (scop
, stmt
);
2997 poly_bb_p pbb
= pbb_from_bb (bb
);
2998 PBB_IS_REDUCTION (pbb
) = true;
2999 gcc_assert (close_phi
== loop_phi
);
3002 red
= create_zero_dim_array
3003 (gimple_assign_lhs (stmt
), "Commutative_Associative_Reduction");
3005 translate_scalar_reduction_to_array_for_stmt (scop
, red
, stmt
, in
[1]);
3009 if (i
== in
.length () - 1)
3011 insert_out_of_ssa_copy (scop
, gimple_phi_result (close_phi
),
3012 unshare_expr (red
), close_phi
);
3013 insert_out_of_ssa_copy_on_edge
3014 (scop
, edge_initial_value_for_loop_phi (loop_phi
),
3015 unshare_expr (red
), initial_value_for_loop_phi (loop_phi
));
3018 remove_phi (loop_phi
);
3019 remove_phi (close_phi
);
3023 /* Rewrites out of SSA a commutative reduction at CLOSE_PHI. Returns
3024 true when something has been changed. */
3027 rewrite_commutative_reductions_out_of_ssa_close_phi (scop_p scop
,
3031 auto_vec
<gimple
, 10> in
;
3032 auto_vec
<gimple
, 10> out
;
3034 detect_commutative_reduction (scop
, close_phi
, &in
, &out
);
3035 res
= in
.length () > 1;
3037 translate_scalar_reduction_to_array (scop
, in
, out
);
3042 /* Rewrites all the commutative reductions from LOOP out of SSA.
3043 Returns true when something has been changed. */
3046 rewrite_commutative_reductions_out_of_ssa_loop (scop_p scop
,
3049 gimple_stmt_iterator gsi
;
3050 edge exit
= single_exit (loop
);
3052 bool changed
= false;
3057 for (gsi
= gsi_start_phis (exit
->dest
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3058 if ((res
= gimple_phi_result (gsi_stmt (gsi
)))
3059 && !virtual_operand_p (res
)
3060 && !scev_analyzable_p (res
, SCOP_REGION (scop
)))
3061 changed
|= rewrite_commutative_reductions_out_of_ssa_close_phi
3062 (scop
, gsi_stmt (gsi
));
3067 /* Rewrites all the commutative reductions from SCOP out of SSA. */
3070 rewrite_commutative_reductions_out_of_ssa (scop_p scop
)
3073 bool changed
= false;
3074 sese region
= SCOP_REGION (scop
);
3076 FOR_EACH_LOOP (loop
, 0)
3077 if (loop_in_sese_p (loop
, region
))
3078 changed
|= rewrite_commutative_reductions_out_of_ssa_loop (scop
, loop
);
3083 gsi_commit_edge_inserts ();
3084 update_ssa (TODO_update_ssa
);
3085 #ifdef ENABLE_CHECKING
3086 verify_loop_closed_ssa (true);
3091 /* Can all ivs be represented by a signed integer?
3092 As CLooG might generate negative values in its expressions, signed loop ivs
3093 are required in the backend. */
3096 scop_ivs_can_be_represented (scop_p scop
)
3099 gimple_stmt_iterator psi
;
3102 FOR_EACH_LOOP (loop
, 0)
3104 if (!loop_in_sese_p (loop
, SCOP_REGION (scop
)))
3107 for (psi
= gsi_start_phis (loop
->header
);
3108 !gsi_end_p (psi
); gsi_next (&psi
))
3110 gimple phi
= gsi_stmt (psi
);
3111 tree res
= PHI_RESULT (phi
);
3112 tree type
= TREE_TYPE (res
);
3114 if (TYPE_UNSIGNED (type
)
3115 && TYPE_PRECISION (type
) >= TYPE_PRECISION (long_long_integer_type_node
))
3128 /* Builds the polyhedral representation for a SESE region. */
3131 build_poly_scop (scop_p scop
)
3133 sese region
= SCOP_REGION (scop
);
3134 graphite_dim_t max_dim
;
3136 build_scop_bbs (scop
);
3138 /* FIXME: This restriction is needed to avoid a problem in CLooG.
3139 Once CLooG is fixed, remove this guard. Anyways, it makes no
3140 sense to optimize a scop containing only PBBs that do not belong
3142 if (nb_pbbs_in_loops (scop
) == 0)
3145 if (!scop_ivs_can_be_represented (scop
))
3148 if (flag_associative_math
)
3149 rewrite_commutative_reductions_out_of_ssa (scop
);
3151 build_sese_loop_nests (region
);
3152 /* Record all conditions in REGION. */
3153 sese_dom_walker (CDI_DOMINATORS
, region
).walk (cfun
->cfg
->x_entry_block_ptr
);
3154 find_scop_parameters (scop
);
3156 max_dim
= PARAM_VALUE (PARAM_GRAPHITE_MAX_NB_SCOP_PARAMS
);
3157 if (scop_nb_params (scop
) > max_dim
)
3160 build_scop_iteration_domain (scop
);
3161 build_scop_context (scop
);
3162 add_conditions_to_constraints (scop
);
3164 /* Rewrite out of SSA only after having translated the
3165 representation to the polyhedral representation to avoid scev
3166 analysis failures. That means that these functions will insert
3167 new data references that they create in the right place. */
3168 rewrite_reductions_out_of_ssa (scop
);
3169 rewrite_cross_bb_scalar_deps_out_of_ssa (scop
);
3171 build_scop_drs (scop
);
3173 build_scop_scattering (scop
);
3175 /* This SCoP has been translated to the polyhedral
3177 POLY_SCOP_P (scop
) = true;