2008-06-04 Xinliang David Li <davidxl@google.com>
[official-gcc.git] / gcc / tree-ssa-alias.c
blob05c123c0e99c4ce80cc22abd1ac59eef804ed619
1 /* Alias analysis for trees.
2 Copyright (C) 2004, 2005, 2006, 2007 Free Software Foundation, Inc.
3 Contributed by Diego Novillo <dnovillo@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "tree.h"
26 #include "rtl.h"
27 #include "tm_p.h"
28 #include "hard-reg-set.h"
29 #include "basic-block.h"
30 #include "timevar.h"
31 #include "expr.h"
32 #include "ggc.h"
33 #include "langhooks.h"
34 #include "flags.h"
35 #include "function.h"
36 #include "diagnostic.h"
37 #include "tree-dump.h"
38 #include "tree-gimple.h"
39 #include "tree-flow.h"
40 #include "tree-inline.h"
41 #include "tree-pass.h"
42 #include "tree-ssa-structalias.h"
43 #include "convert.h"
44 #include "params.h"
45 #include "ipa-type-escape.h"
46 #include "vec.h"
47 #include "bitmap.h"
48 #include "vecprim.h"
49 #include "pointer-set.h"
50 #include "alloc-pool.h"
52 /* Broad overview of how aliasing works:
54 First we compute points-to sets, which is done in
55 tree-ssa-structalias.c
57 During points-to set constraint finding, a bunch of little bits of
58 information is collected.
59 This is not done because it is necessary for points-to, but because
60 points-to has to walk every statement anyway. The function performing
61 this collecting is update_alias_info.
63 Bits update_alias_info collects include:
64 1. Directly escaping variables and variables whose value escapes
65 (using is_escape_site). This is the set of variables and values that
66 escape prior to transitive closure of the clobbers.
67 2. The set of variables dereferenced on the LHS (into
68 dereferenced_ptr_stores)
69 3. The set of variables dereferenced on the RHS (into
70 dereferenced_ptr_loads)
71 4. The set of all pointers we saw.
72 5. The number of loads and stores for each variable
73 6. The number of statements touching memory
74 7. The set of address taken variables.
77 #1 is computed by a combination of is_escape_site, and counting the
78 number of uses/deref operators. This function properly accounts for
79 situations like &ptr->field, which is *not* a dereference.
81 After points-to sets are computed, the sets themselves still
82 contain points-to specific variables, such as a variable that says
83 the pointer points to anything, a variable that says the pointer
84 points to readonly memory, etc.
86 These are eliminated in a later phase, as we will see.
88 The rest of the phases are located in tree-ssa-alias.c
90 The next phase after points-to set computation is called
91 "setup_pointers_and_addressables"
93 This pass does 3 main things:
95 1. All variables that can have TREE_ADDRESSABLE removed safely (IE
96 non-globals whose address is not taken), have TREE_ADDRESSABLE
97 removed.
98 2. All variables that may be aliased (which is the set of addressable
99 variables and globals) at all, are marked for renaming, and have
100 symbol memory tags created for them.
101 3. All variables which are stored into have their SMT's added to
102 written vars.
105 After this function is run, all variables that will ever have an
106 SMT, have one, though its aliases are not filled in.
108 The next phase is to compute flow-insensitive aliasing, which in
109 our case, is a misnomer. It is really computing aliasing that
110 requires no transitive closure to be correct. In particular, it
111 uses stack vs non-stack, TBAA, etc, to determine whether two
112 symbols could *ever* alias. This phase works by going through all
113 the pointers we collected during update_alias_info, and for every
114 addressable variable in the program, seeing if they alias. If so,
115 the addressable variable is added to the symbol memory tag for the
116 pointer.
118 As part of this, we handle symbol memory tags that conflict but
119 have no aliases in common, by forcing them to have a symbol in
120 common (through unioning alias sets or adding one as an alias of
121 the other). The case of
122 conflicts with no aliases in common occurs mainly due to aliasing
123 we cannot see. In particular, it generally means we have a load
124 through a pointer whose value came from outside the function.
125 Without an addressable symbol to point to, they would get the wrong
126 answer.
128 After flow insensitive aliasing is computed, we compute name tags
129 (in compute_flow_sensitive_aliasing). We walk each pointer we
130 collected and see if it has a usable points-to set. If so, we
131 generate a name tag using that pointer, and make an alias bitmap for
132 it. Name tags are shared between all things with the same alias
133 bitmap. The alias bitmap will be translated from what points-to
134 computed. In particular, the "anything" variable in points-to will be
135 transformed into a pruned set of SMT's and their aliases that
136 compute_flow_insensitive_aliasing computed.
137 Note that since 4.3, every pointer that points-to computed a solution for
138 will get a name tag (whereas before 4.3, only those whose set did
139 *not* include the anything variable would). At the point where name
140 tags are all assigned, symbol memory tags are dead, and could be
141 deleted, *except* on global variables. Global variables still use
142 symbol memory tags as of right now.
144 After name tags are computed, the set of clobbered variables is
145 transitively closed. In particular, we compute the set of clobbered
146 variables based on the initial set of clobbers, plus the aliases of
147 pointers which either escape, or have their value escape.
149 After this, maybe_create_global_var is run, which handles a corner
150 case where we have no call clobbered variables, but have pure and
151 non-pure functions.
153 Staring at this function, I now remember it is a hack for the fact
154 that we do not mark all globals in the program as call clobbered for a
155 function unless they are actually used in that function. Instead, we
156 only mark the set that is actually clobbered. As a result, you can
157 end up with situations where you have no call clobbered vars set.
159 After maybe_create_global_var, we set pointers with the REF_ALL flag
160 to have alias sets that include all clobbered
161 memory tags and variables.
163 After this, memory partitioning is computed (by the function
164 compute_memory_partitions) and alias sets are reworked accordingly.
166 Lastly, we delete partitions with no symbols, and clean up after
167 ourselves. */
169 /* Structure to map a variable to its alias set. */
170 struct alias_map_d
172 /* Variable and its alias set. */
173 tree var;
174 alias_set_type set;
/* Counters used to display statistics on alias analysis.  The code
   that updates them is not part of this section of the file; the
   grouping below simply follows the field names.  */
struct alias_stats_d
{
  /* Overall alias queries and their outcomes.  */
  unsigned int alias_queries, alias_mayalias, alias_noalias;

  /* "Simple" queries.  */
  unsigned int simple_queries, simple_resolved;

  /* TBAA queries.  */
  unsigned int tbaa_queries, tbaa_resolved;

  /* "structnoaddress" queries.  */
  unsigned int structnoaddress_queries, structnoaddress_resolved;
};
193 /* Local variables. */
194 static struct alias_stats_d alias_stats;
195 static bitmap_obstack alias_bitmap_obstack;
197 /* Local functions. */
198 static void compute_flow_insensitive_aliasing (struct alias_info *);
199 static void dump_alias_stats (FILE *);
200 static bool may_alias_p (tree, alias_set_type, tree, alias_set_type, bool);
201 static tree create_memory_tag (tree type, bool is_type_tag);
202 static tree get_smt_for (tree, struct alias_info *);
203 static tree get_nmt_for (tree);
204 static void add_may_alias (tree, tree);
205 static struct alias_info *init_alias_info (void);
206 static void delete_alias_info (struct alias_info *);
207 static void compute_flow_sensitive_aliasing (struct alias_info *);
208 static void setup_pointers_and_addressables (struct alias_info *);
209 static void create_global_var (void);
210 static void maybe_create_global_var (void);
211 static void set_pt_anything (tree);
213 void debug_mp_info (VEC(mem_sym_stats_t,heap) *);
215 static alloc_pool mem_sym_stats_pool;
217 /* Return memory reference stats for symbol VAR. Create a new slot in
218 cfun->gimple_df->mem_sym_stats if needed. */
220 static struct mem_sym_stats_d *
221 get_mem_sym_stats_for (tree var)
223 void **slot;
224 struct mem_sym_stats_d *stats;
225 struct pointer_map_t *map = gimple_mem_ref_stats (cfun)->mem_sym_stats;
227 gcc_assert (map);
229 slot = pointer_map_insert (map, var);
230 if (*slot == NULL)
232 stats = pool_alloc (mem_sym_stats_pool);
233 memset (stats, 0, sizeof (*stats));
234 stats->var = var;
235 *slot = (void *) stats;
237 else
238 stats = (struct mem_sym_stats_d *) *slot;
240 return stats;
244 /* Return memory reference statistics for variable VAR in function FN.
245 This is computed by alias analysis, but it is not kept
246 incrementally up-to-date. So, these stats are only accurate if
247 pass_may_alias has been run recently. If no alias information
248 exists, this function returns NULL. */
250 static mem_sym_stats_t
251 mem_sym_stats (struct function *fn, tree var)
253 void **slot;
254 struct pointer_map_t *stats_map = gimple_mem_ref_stats (fn)->mem_sym_stats;
256 if (stats_map == NULL)
257 return NULL;
259 slot = pointer_map_contains (stats_map, var);
260 if (slot == NULL)
261 return NULL;
263 return (mem_sym_stats_t) *slot;
267 /* Set MPT to be the memory partition associated with symbol SYM. */
269 static inline void
270 set_memory_partition (tree sym, tree mpt)
272 #if defined ENABLE_CHECKING
273 if (mpt)
274 gcc_assert (TREE_CODE (mpt) == MEMORY_PARTITION_TAG
275 && !is_gimple_reg (sym));
276 #endif
278 var_ann (sym)->mpt = mpt;
279 if (mpt)
281 if (MPT_SYMBOLS (mpt) == NULL)
282 MPT_SYMBOLS (mpt) = BITMAP_ALLOC (&alias_bitmap_obstack);
284 bitmap_set_bit (MPT_SYMBOLS (mpt), DECL_UID (sym));
286 /* MPT inherits the call-clobbering attributes from SYM. */
287 if (is_call_clobbered (sym))
289 MTAG_GLOBAL (mpt) = 1;
290 mark_call_clobbered (mpt, ESCAPE_IS_GLOBAL);
296 /* Mark variable VAR as being non-addressable. */
298 static void
299 mark_non_addressable (tree var)
301 tree mpt;
303 if (!TREE_ADDRESSABLE (var))
304 return;
306 mpt = memory_partition (var);
308 clear_call_clobbered (var);
309 TREE_ADDRESSABLE (var) = 0;
311 if (mpt)
313 /* Note that it's possible for a symbol to have an associated
314 MPT and the MPT have a NULL empty set. During
315 init_alias_info, all MPTs get their sets cleared out, but the
316 symbols still point to the old MPTs that used to hold them.
317 This is done so that compute_memory_partitions can now which
318 symbols are losing or changing partitions and mark them for
319 renaming. */
320 if (MPT_SYMBOLS (mpt))
321 bitmap_clear_bit (MPT_SYMBOLS (mpt), DECL_UID (var));
322 set_memory_partition (var, NULL_TREE);
327 /* qsort comparison function to sort type/name tags by DECL_UID. */
329 static int
330 sort_tags_by_id (const void *pa, const void *pb)
332 const_tree const a = *(const_tree const *)pa;
333 const_tree const b = *(const_tree const *)pb;
335 return DECL_UID (a) - DECL_UID (b);
338 /* Initialize WORKLIST to contain those memory tags that are marked call
339 clobbered. Initialized WORKLIST2 to contain the reasons these
340 memory tags escaped. */
342 static void
343 init_transitive_clobber_worklist (VEC (tree, heap) **worklist,
344 VEC (int, heap) **worklist2,
345 bitmap on_worklist)
347 referenced_var_iterator rvi;
348 tree curr;
350 FOR_EACH_REFERENCED_VAR (curr, rvi)
352 if (MTAG_P (curr) && is_call_clobbered (curr))
354 VEC_safe_push (tree, heap, *worklist, curr);
355 VEC_safe_push (int, heap, *worklist2,
356 var_ann (curr)->escape_mask);
357 bitmap_set_bit (on_worklist, DECL_UID (curr));
362 /* Add ALIAS to WORKLIST (and the reason for escaping REASON to WORKLIST2) if
363 ALIAS is not already marked call clobbered, and is a memory
364 tag. */
366 static void
367 add_to_worklist (tree alias, VEC (tree, heap) **worklist,
368 VEC (int, heap) **worklist2, int reason,
369 bitmap on_worklist)
371 if (MTAG_P (alias) && !is_call_clobbered (alias)
372 && !bitmap_bit_p (on_worklist, DECL_UID (alias)))
374 VEC_safe_push (tree, heap, *worklist, alias);
375 VEC_safe_push (int, heap, *worklist2, reason);
376 bitmap_set_bit (on_worklist, DECL_UID (alias));
380 /* Mark aliases of TAG as call clobbered, and place any tags on the
381 alias list that were not already call clobbered on WORKLIST. */
383 static void
384 mark_aliases_call_clobbered (tree tag, VEC (tree, heap) **worklist,
385 VEC (int, heap) **worklist2, bitmap on_worklist)
387 bitmap aliases;
388 bitmap_iterator bi;
389 unsigned int i;
390 tree entry;
391 var_ann_t ta = var_ann (tag);
393 if (!MTAG_P (tag))
394 return;
395 aliases = may_aliases (tag);
396 if (!aliases)
397 return;
399 EXECUTE_IF_SET_IN_BITMAP (aliases, 0, i, bi)
401 entry = referenced_var (i);
402 /* If you clobber one part of a structure, you
403 clobber the entire thing. While this does not make
404 the world a particularly nice place, it is necessary
405 in order to allow C/C++ tricks that involve
406 pointer arithmetic to work. */
407 if (!unmodifiable_var_p (entry))
409 add_to_worklist (entry, worklist, worklist2, ta->escape_mask,
410 on_worklist);
411 mark_call_clobbered (entry, ta->escape_mask);
416 /* Tags containing global vars need to be marked as global.
417 Tags containing call clobbered vars need to be marked as call
418 clobbered. */
420 static void
421 compute_tag_properties (void)
423 referenced_var_iterator rvi;
424 tree tag;
425 bool changed = true;
426 VEC (tree, heap) *taglist = NULL;
428 FOR_EACH_REFERENCED_VAR (tag, rvi)
430 if (!MTAG_P (tag))
431 continue;
432 VEC_safe_push (tree, heap, taglist, tag);
435 /* We sort the taglist by DECL_UID, for two reasons.
436 1. To get a sequential ordering to make the bitmap accesses
437 faster.
438 2. Because of the way we compute aliases, it's more likely that
439 an earlier tag is included in a later tag, and this will reduce
440 the number of iterations.
442 If we had a real tag graph, we would just topo-order it and be
443 done with it. */
444 qsort (VEC_address (tree, taglist),
445 VEC_length (tree, taglist),
446 sizeof (tree),
447 sort_tags_by_id);
449 /* Go through each tag not marked as global, and if it aliases
450 global vars, mark it global.
452 If the tag contains call clobbered vars, mark it call
453 clobbered.
455 This loop iterates because tags may appear in the may-aliases
456 list of other tags when we group. */
458 while (changed)
460 unsigned int k;
462 changed = false;
463 for (k = 0; VEC_iterate (tree, taglist, k, tag); k++)
465 bitmap ma;
466 bitmap_iterator bi;
467 unsigned int i;
468 tree entry;
469 bool tagcc = is_call_clobbered (tag);
470 bool tagglobal = MTAG_GLOBAL (tag);
472 if (tagcc && tagglobal)
473 continue;
475 ma = may_aliases (tag);
476 if (!ma)
477 continue;
479 EXECUTE_IF_SET_IN_BITMAP (ma, 0, i, bi)
481 entry = referenced_var (i);
482 /* Call clobbered entries cause the tag to be marked
483 call clobbered. */
484 if (!tagcc && is_call_clobbered (entry))
486 mark_call_clobbered (tag, var_ann (entry)->escape_mask);
487 tagcc = true;
488 changed = true;
491 /* Global vars cause the tag to be marked global. */
492 if (!tagglobal && is_global_var (entry))
494 MTAG_GLOBAL (tag) = true;
495 changed = true;
496 tagglobal = true;
499 /* Early exit once both global and cc are set, since the
500 loop can't do any more than that. */
501 if (tagcc && tagglobal)
502 break;
506 VEC_free (tree, heap, taglist);
509 /* Set up the initial variable clobbers and globalness.
510 When this function completes, only tags whose aliases need to be
511 clobbered will be set clobbered. Tags clobbered because they
512 contain call clobbered vars are handled in compute_tag_properties. */
514 static void
515 set_initial_properties (struct alias_info *ai)
517 unsigned int i;
518 referenced_var_iterator rvi;
519 tree var;
520 tree ptr;
521 bool any_pt_anything = false;
522 enum escape_type pt_anything_mask = 0;
524 FOR_EACH_REFERENCED_VAR (var, rvi)
526 if (is_global_var (var))
528 if (!unmodifiable_var_p (var))
529 mark_call_clobbered (var, ESCAPE_IS_GLOBAL);
531 else if (TREE_CODE (var) == PARM_DECL
532 && gimple_default_def (cfun, var)
533 && POINTER_TYPE_P (TREE_TYPE (var)))
535 tree def = gimple_default_def (cfun, var);
536 get_ptr_info (def)->value_escapes_p = 1;
537 get_ptr_info (def)->escape_mask |= ESCAPE_IS_PARM;
541 for (i = 0; VEC_iterate (tree, ai->processed_ptrs, i, ptr); i++)
543 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (ptr);
544 tree tag = symbol_mem_tag (SSA_NAME_VAR (ptr));
546 /* A pointer that only escapes via a function return does not
547 add to the call clobber or call used solution.
548 To exclude ESCAPE_TO_PURE_CONST we would need to track
549 call used variables separately or compute those properly
550 in the operand scanner. */
551 if (pi->value_escapes_p
552 && pi->escape_mask & ~ESCAPE_TO_RETURN)
554 /* If PTR escapes then its associated memory tags and
555 pointed-to variables are call-clobbered. */
556 if (pi->name_mem_tag)
557 mark_call_clobbered (pi->name_mem_tag, pi->escape_mask);
559 if (tag)
560 mark_call_clobbered (tag, pi->escape_mask);
562 /* Defer to points-to analysis if possible, otherwise
563 clobber all addressable variables. Parameters cannot
564 point to local memory though.
565 ??? Properly tracking which pointers point to non-local
566 memory only would make a big difference here. */
567 if (!clobber_what_p_points_to (ptr)
568 && !(pi->escape_mask & ESCAPE_IS_PARM))
570 any_pt_anything = true;
571 pt_anything_mask |= pi->escape_mask;
575 /* If the name tag is call clobbered, so is the symbol tag
576 associated with the base VAR_DECL. */
577 if (pi->name_mem_tag
578 && tag
579 && is_call_clobbered (pi->name_mem_tag))
580 mark_call_clobbered (tag, pi->escape_mask);
582 /* Name tags and symbol tags that we don't know where they point
583 to, might point to global memory, and thus, are clobbered.
585 FIXME: This is not quite right. They should only be
586 clobbered if value_escapes_p is true, regardless of whether
587 they point to global memory or not.
588 So removing this code and fixing all the bugs would be nice.
589 It is the cause of a bunch of clobbering. */
590 if ((pi->pt_global_mem || pi->pt_anything)
591 && pi->is_dereferenced && pi->name_mem_tag)
593 mark_call_clobbered (pi->name_mem_tag, ESCAPE_IS_GLOBAL);
594 MTAG_GLOBAL (pi->name_mem_tag) = true;
597 if ((pi->pt_global_mem || pi->pt_anything)
598 && pi->is_dereferenced
599 && tag)
601 mark_call_clobbered (tag, ESCAPE_IS_GLOBAL);
602 MTAG_GLOBAL (tag) = true;
606 /* If a pt_anything pointer escaped we need to mark all addressable
607 variables call clobbered. */
608 if (any_pt_anything)
610 bitmap_iterator bi;
611 unsigned int j;
613 EXECUTE_IF_SET_IN_BITMAP (gimple_addressable_vars (cfun), 0, j, bi)
615 tree var = referenced_var (j);
616 if (!unmodifiable_var_p (var))
617 mark_call_clobbered (var, pt_anything_mask);
622 /* Compute which variables need to be marked call clobbered because
623 their tag is call clobbered, and which tags need to be marked
624 global because they contain global variables. */
626 static void
627 compute_call_clobbered (struct alias_info *ai)
629 VEC (tree, heap) *worklist = NULL;
630 VEC (int,heap) *worklist2 = NULL;
631 bitmap on_worklist;
633 timevar_push (TV_CALL_CLOBBER);
634 on_worklist = BITMAP_ALLOC (NULL);
636 set_initial_properties (ai);
637 init_transitive_clobber_worklist (&worklist, &worklist2, on_worklist);
638 while (VEC_length (tree, worklist) != 0)
640 tree curr = VEC_pop (tree, worklist);
641 int reason = VEC_pop (int, worklist2);
643 bitmap_clear_bit (on_worklist, DECL_UID (curr));
644 mark_call_clobbered (curr, reason);
645 mark_aliases_call_clobbered (curr, &worklist, &worklist2, on_worklist);
647 VEC_free (tree, heap, worklist);
648 VEC_free (int, heap, worklist2);
649 BITMAP_FREE (on_worklist);
650 compute_tag_properties ();
651 timevar_pop (TV_CALL_CLOBBER);
655 /* Dump memory partition information to FILE. */
657 static void
658 dump_memory_partitions (FILE *file)
660 unsigned i, npart;
661 unsigned long nsyms;
662 tree mpt;
664 fprintf (file, "\nMemory partitions\n\n");
665 for (i = 0, npart = 0, nsyms = 0;
666 VEC_iterate (tree, gimple_ssa_operands (cfun)->mpt_table, i, mpt);
667 i++)
669 if (mpt)
671 bitmap syms = MPT_SYMBOLS (mpt);
672 unsigned long n = (syms) ? bitmap_count_bits (syms) : 0;
674 fprintf (file, "#%u: ", i);
675 print_generic_expr (file, mpt, 0);
676 fprintf (file, ": %lu elements: ", n);
677 dump_decl_set (file, syms);
678 npart++;
679 nsyms += n;
683 fprintf (file, "\n%u memory partitions holding %lu symbols\n", npart, nsyms);
/* Debugging helper: dump the memory partition information of the
   current function to stderr.  */

void
debug_memory_partitions (void)
{
  FILE *out = stderr;

  dump_memory_partitions (out);
}
696 /* Return true if memory partitioning is required given the memory
697 reference estimates in STATS. */
699 static inline bool
700 need_to_partition_p (struct mem_ref_stats_d *stats)
702 long num_vops = stats->num_vuses + stats->num_vdefs;
703 long avg_vops = CEIL (num_vops, stats->num_mem_stmts);
704 return (num_vops > (long) MAX_ALIASED_VOPS
705 && avg_vops > (long) AVG_ALIASED_VOPS);
709 /* Count the actual number of virtual operators in CFUN. Note that
710 this is only meaningful after virtual operands have been populated,
711 so it should be invoked at the end of compute_may_aliases.
713 The number of virtual operators are stored in *NUM_VDEFS_P and
714 *NUM_VUSES_P, the number of partitioned symbols in
715 *NUM_PARTITIONED_P and the number of unpartitioned symbols in
716 *NUM_UNPARTITIONED_P.
718 If any of these pointers is NULL the corresponding count is not
719 computed. */
721 static void
722 count_mem_refs (long *num_vuses_p, long *num_vdefs_p,
723 long *num_partitioned_p, long *num_unpartitioned_p)
725 block_stmt_iterator bsi;
726 basic_block bb;
727 long num_vdefs, num_vuses, num_partitioned, num_unpartitioned;
728 referenced_var_iterator rvi;
729 tree sym;
731 num_vuses = num_vdefs = num_partitioned = num_unpartitioned = 0;
733 if (num_vuses_p || num_vdefs_p)
734 FOR_EACH_BB (bb)
735 for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
737 tree stmt = bsi_stmt (bsi);
738 if (stmt_references_memory_p (stmt))
740 num_vuses += NUM_SSA_OPERANDS (stmt, SSA_OP_VUSE);
741 num_vdefs += NUM_SSA_OPERANDS (stmt, SSA_OP_VDEF);
745 if (num_partitioned_p || num_unpartitioned_p)
746 FOR_EACH_REFERENCED_VAR (sym, rvi)
748 if (is_gimple_reg (sym))
749 continue;
751 if (memory_partition (sym))
752 num_partitioned++;
753 else
754 num_unpartitioned++;
757 if (num_vdefs_p)
758 *num_vdefs_p = num_vdefs;
760 if (num_vuses_p)
761 *num_vuses_p = num_vuses;
763 if (num_partitioned_p)
764 *num_partitioned_p = num_partitioned;
766 if (num_unpartitioned_p)
767 *num_unpartitioned_p = num_unpartitioned;
771 /* The list is sorted by increasing partitioning score (PSCORE).
772 This score is computed such that symbols with high scores are
773 those that are least likely to be partitioned. Given a symbol
774 MP->VAR, PSCORE(S) is the result of the following weighted sum
776 PSCORE(S) = FW * 64 + FR * 32
777 + DW * 16 + DR * 8
778 + IW * 4 + IR * 2
779 + NO_ALIAS
781 where
783 FW Execution frequency of writes to S
784 FR Execution frequency of reads from S
785 DW Number of direct writes to S
786 DR Number of direct reads from S
787 IW Number of indirect writes to S
788 IR Number of indirect reads from S
789 NO_ALIAS State of the NO_ALIAS* flags
791 The basic idea here is that symbols that are frequently
792 written-to in hot paths of the code are the last to be considered
793 for partitioning. */
795 static inline long
796 mem_sym_score (mem_sym_stats_t mp)
798 return mp->frequency_writes * 64 + mp->frequency_reads * 32
799 + mp->num_direct_writes * 16 + mp->num_direct_reads * 8
800 + mp->num_indirect_writes * 4 + mp->num_indirect_reads * 2
801 + var_ann (mp->var)->noalias_state;
805 /* Dump memory reference stats for function CFUN to FILE. */
807 void
808 dump_mem_ref_stats (FILE *file)
810 long actual_num_vuses, actual_num_vdefs;
811 long num_partitioned, num_unpartitioned;
812 struct mem_ref_stats_d *stats;
814 stats = gimple_mem_ref_stats (cfun);
816 count_mem_refs (&actual_num_vuses, &actual_num_vdefs, &num_partitioned,
817 &num_unpartitioned);
819 fprintf (file, "\nMemory reference statistics for %s\n\n",
820 lang_hooks.decl_printable_name (current_function_decl, 2));
822 fprintf (file, "Number of memory statements: %ld\n",
823 stats->num_mem_stmts);
824 fprintf (file, "Number of call sites: %ld\n",
825 stats->num_call_sites);
826 fprintf (file, "Number of pure/const call sites: %ld\n",
827 stats->num_pure_const_call_sites);
828 fprintf (file, "Number of asm sites: %ld\n",
829 stats->num_asm_sites);
830 fprintf (file, "Estimated number of loads: %ld (%ld/stmt)\n",
831 stats->num_vuses,
832 (stats->num_mem_stmts)
833 ? CEIL (stats->num_vuses, stats->num_mem_stmts)
834 : 0);
835 fprintf (file, "Actual number of loads: %ld (%ld/stmt)\n",
836 actual_num_vuses,
837 (stats->num_mem_stmts)
838 ? CEIL (actual_num_vuses, stats->num_mem_stmts)
839 : 0);
841 if (actual_num_vuses > stats->num_vuses + (stats->num_vuses / 25))
842 fprintf (file, "\t(warning: estimation is lower by more than 25%%)\n");
844 fprintf (file, "Estimated number of stores: %ld (%ld/stmt)\n",
845 stats->num_vdefs,
846 (stats->num_mem_stmts)
847 ? CEIL (stats->num_vdefs, stats->num_mem_stmts)
848 : 0);
849 fprintf (file, "Actual number of stores: %ld (%ld/stmt)\n",
850 actual_num_vdefs,
851 (stats->num_mem_stmts)
852 ? CEIL (actual_num_vdefs, stats->num_mem_stmts)
853 : 0);
855 if (actual_num_vdefs > stats->num_vdefs + (stats->num_vdefs / 25))
856 fprintf (file, "\t(warning: estimation is lower by more than 25%%)\n");
858 fprintf (file, "Partitioning thresholds: MAX = %d AVG = %d "
859 "(%sNEED TO PARTITION)\n", MAX_ALIASED_VOPS, AVG_ALIASED_VOPS,
860 stats->num_mem_stmts && need_to_partition_p (stats) ? "" : "NO ");
861 fprintf (file, "Number of partitioned symbols: %ld\n", num_partitioned);
862 fprintf (file, "Number of unpartitioned symbols: %ld\n", num_unpartitioned);
/* Debugging helper: dump the memory reference stats of the current
   function to stderr.  */

void
debug_mem_ref_stats (void)
{
  FILE *out = stderr;

  dump_mem_ref_stats (out);
}
875 /* Dump memory reference stats for variable VAR to FILE. */
877 static void
878 dump_mem_sym_stats (FILE *file, tree var)
880 mem_sym_stats_t stats = mem_sym_stats (cfun, var);
882 if (stats == NULL)
883 return;
885 fprintf (file, "read frequency: %6ld, write frequency: %6ld, "
886 "direct reads: %3ld, direct writes: %3ld, "
887 "indirect reads: %4ld, indirect writes: %4ld, symbol: ",
888 stats->frequency_reads, stats->frequency_writes,
889 stats->num_direct_reads, stats->num_direct_writes,
890 stats->num_indirect_reads, stats->num_indirect_writes);
891 print_generic_expr (file, stats->var, 0);
892 fprintf (file, ", tags: ");
893 dump_decl_set (file, stats->parent_tags);
897 /* Dump memory reference stats for variable VAR to stderr. */
899 void
900 debug_mem_sym_stats (tree var)
902 dump_mem_sym_stats (stderr, var);
905 /* Dump memory reference stats for variable VAR to FILE. For use
906 of tree-dfa.c:dump_variable. */
908 void
909 dump_mem_sym_stats_for_var (FILE *file, tree var)
911 mem_sym_stats_t stats = mem_sym_stats (cfun, var);
913 if (stats == NULL)
914 return;
916 fprintf (file, ", score: %ld", mem_sym_score (stats));
917 fprintf (file, ", direct reads: %ld", stats->num_direct_reads);
918 fprintf (file, ", direct writes: %ld", stats->num_direct_writes);
919 fprintf (file, ", indirect reads: %ld", stats->num_indirect_reads);
920 fprintf (file, ", indirect writes: %ld", stats->num_indirect_writes);
923 /* Dump memory reference stats for all memory symbols to FILE. */
925 static void
926 dump_all_mem_sym_stats (FILE *file)
928 referenced_var_iterator rvi;
929 tree sym;
931 FOR_EACH_REFERENCED_VAR (sym, rvi)
933 if (is_gimple_reg (sym))
934 continue;
936 dump_mem_sym_stats (file, sym);
/* Debugging helper: dump the memory reference stats of all memory
   symbols to stderr.  */

void
debug_all_mem_sym_stats (void)
{
  FILE *out = stderr;

  dump_all_mem_sym_stats (out);
}
950 /* Dump the MP_INFO array to FILE. */
952 static void
953 dump_mp_info (FILE *file, VEC(mem_sym_stats_t,heap) *mp_info)
955 unsigned i;
956 mem_sym_stats_t mp_p;
958 for (i = 0; VEC_iterate (mem_sym_stats_t, mp_info, i, mp_p); i++)
959 if (!mp_p->partitioned_p)
960 dump_mem_sym_stats (file, mp_p->var);
964 /* Dump the MP_INFO array to stderr. */
966 void
967 debug_mp_info (VEC(mem_sym_stats_t,heap) *mp_info)
969 dump_mp_info (stderr, mp_info);
973 /* Update memory reference stats for symbol VAR in statement STMT.
974 NUM_DIRECT_READS and NUM_DIRECT_WRITES specify the number of times
975 that VAR is read/written in STMT (indirect reads/writes are not
976 recorded by this function, see compute_memory_partitions). */
978 void
979 update_mem_sym_stats_from_stmt (tree var, tree stmt, long num_direct_reads,
980 long num_direct_writes)
982 mem_sym_stats_t stats;
984 gcc_assert (num_direct_reads >= 0 && num_direct_writes >= 0);
986 stats = get_mem_sym_stats_for (var);
988 stats->num_direct_reads += num_direct_reads;
989 stats->frequency_reads += ((long) bb_for_stmt (stmt)->frequency
990 * num_direct_reads);
992 stats->num_direct_writes += num_direct_writes;
993 stats->frequency_writes += ((long) bb_for_stmt (stmt)->frequency
994 * num_direct_writes);
998 /* Given two MP_INFO entries MP1 and MP2, return -1 if MP1->VAR should
999 be partitioned before MP2->VAR, 0 if they are the same or 1 if
1000 MP1->VAR should be partitioned after MP2->VAR. */
1002 static inline int
1003 compare_mp_info_entries (mem_sym_stats_t mp1, mem_sym_stats_t mp2)
1005 long pscore1 = mem_sym_score (mp1);
1006 long pscore2 = mem_sym_score (mp2);
1008 if (pscore1 < pscore2)
1009 return -1;
1010 else if (pscore1 > pscore2)
1011 return 1;
1012 else
1013 return DECL_UID (mp1->var) - DECL_UID (mp2->var);
1017 /* Comparison routine for qsort. The list is sorted by increasing
1018 partitioning score (PSCORE). This score is computed such that
1019 symbols with high scores are those that are least likely to be
1020 partitioned. */
1022 static int
1023 mp_info_cmp (const void *p, const void *q)
1025 mem_sym_stats_t e1 = *((const mem_sym_stats_t *) p);
1026 mem_sym_stats_t e2 = *((const mem_sym_stats_t *) q);
1027 return compare_mp_info_entries (e1, e2);
1031 /* Sort the array of reference counts used to compute memory partitions.
1032 Elements are sorted in ascending order of execution frequency and
1033 descending order of virtual operators needed. */
1035 static inline void
1036 sort_mp_info (VEC(mem_sym_stats_t,heap) *list)
1038 unsigned num = VEC_length (mem_sym_stats_t, list);
1040 if (num < 2)
1041 return;
1043 if (num == 2)
1045 if (compare_mp_info_entries (VEC_index (mem_sym_stats_t, list, 0),
1046 VEC_index (mem_sym_stats_t, list, 1)) > 0)
1048 /* Swap elements if they are in the wrong order. */
1049 mem_sym_stats_t tmp = VEC_index (mem_sym_stats_t, list, 0);
1050 VEC_replace (mem_sym_stats_t, list, 0,
1051 VEC_index (mem_sym_stats_t, list, 1));
1052 VEC_replace (mem_sym_stats_t, list, 1, tmp);
1055 return;
1058 /* There are 3 or more elements, call qsort. */
1059 qsort (VEC_address (mem_sym_stats_t, list),
1060 VEC_length (mem_sym_stats_t, list),
1061 sizeof (mem_sym_stats_t),
1062 mp_info_cmp);
1066 /* Return the memory partition tag (MPT) associated with memory
1067 symbol SYM. */
1069 static tree
1070 get_mpt_for (tree sym)
1072 tree mpt;
1074 /* Don't create a new tag unnecessarily. */
1075 mpt = memory_partition (sym);
1076 if (mpt == NULL_TREE)
1078 mpt = create_tag_raw (MEMORY_PARTITION_TAG, TREE_TYPE (sym), "MPT");
1079 TREE_ADDRESSABLE (mpt) = 0;
1080 add_referenced_var (mpt);
1081 VEC_safe_push (tree, heap, gimple_ssa_operands (cfun)->mpt_table, mpt);
1082 gcc_assert (MPT_SYMBOLS (mpt) == NULL);
1083 set_memory_partition (sym, mpt);
1086 return mpt;
1090 /* Add MP_P->VAR to a memory partition and return the partition. */
1092 static tree
1093 find_partition_for (mem_sym_stats_t mp_p)
1095 unsigned i;
1096 VEC(tree,heap) *mpt_table;
1097 tree mpt;
1099 mpt_table = gimple_ssa_operands (cfun)->mpt_table;
1100 mpt = NULL_TREE;
1102 /* Find an existing partition for MP_P->VAR. */
1103 for (i = 0; VEC_iterate (tree, mpt_table, i, mpt); i++)
1105 mem_sym_stats_t mpt_stats;
1107 /* If MPT does not have any symbols yet, use it. */
1108 if (MPT_SYMBOLS (mpt) == NULL)
1109 break;
1111 /* Otherwise, see if MPT has common parent tags with MP_P->VAR,
1112 but avoid grouping clobbered variables with non-clobbered
1113 variables (otherwise, this tends to creates a single memory
1114 partition because other call-clobbered variables may have
1115 common parent tags with non-clobbered ones). */
1116 mpt_stats = get_mem_sym_stats_for (mpt);
1117 if (mp_p->parent_tags
1118 && mpt_stats->parent_tags
1119 && is_call_clobbered (mpt) == is_call_clobbered (mp_p->var)
1120 && bitmap_intersect_p (mpt_stats->parent_tags, mp_p->parent_tags))
1121 break;
1123 /* If no common parent tags are found, see if both MPT and
1124 MP_P->VAR are call-clobbered. */
1125 if (is_call_clobbered (mpt) && is_call_clobbered (mp_p->var))
1126 break;
1129 if (mpt == NULL_TREE)
1130 mpt = get_mpt_for (mp_p->var);
1131 else
1132 set_memory_partition (mp_p->var, mpt);
1134 mp_p->partitioned_p = true;
1136 mark_sym_for_renaming (mp_p->var);
1137 mark_sym_for_renaming (mpt);
1139 return mpt;
1143 /* Rewrite the alias set for TAG to use the newly created partitions.
1144 If TAG is NULL, rewrite the set of call-clobbered variables.
1145 NEW_ALIASES is a scratch bitmap to build the new set of aliases for
1146 TAG. */
1148 static void
1149 rewrite_alias_set_for (tree tag, bitmap new_aliases)
1151 bitmap_iterator bi;
1152 unsigned i;
1153 tree mpt, sym;
1155 EXECUTE_IF_SET_IN_BITMAP (MTAG_ALIASES (tag), 0, i, bi)
1157 sym = referenced_var (i);
1158 mpt = memory_partition (sym);
1159 if (mpt)
1160 bitmap_set_bit (new_aliases, DECL_UID (mpt));
1161 else
1162 bitmap_set_bit (new_aliases, DECL_UID (sym));
1165 /* Rebuild the may-alias array for TAG. */
1166 bitmap_copy (MTAG_ALIASES (tag), new_aliases);
1170 /* Determine how many virtual operands can be saved by partitioning
1171 MP_P->VAR into MPT. When a symbol S is thrown inside a partition
1172 P, every virtual operand that used to reference S will now
1173 reference P. Whether it reduces the number of virtual operands
1174 depends on:
1176 1- Direct references to S are never saved. Instead of the virtual
1177 operand to S, we will now have a virtual operand to P.
1179 2- Indirect references to S are reduced only for those memory tags
1180 holding S that already had other symbols partitioned into P.
1181 For instance, if a memory tag T has the alias set { a b S c },
1182 the first time we partition S into P, the alias set will become
1183 { a b P c }, so no virtual operands will be saved. However, if
1184 we now partition symbol 'c' into P, then the alias set for T
1185 will become { a b P }, so we will be saving one virtual operand
1186 for every indirect reference to 'c'.
1188 3- If S is call-clobbered, we save as many virtual operands as
1189 call/asm sites exist in the code, but only if other
1190 call-clobbered symbols have been grouped into P. The first
1191 call-clobbered symbol that we group does not produce any
1192 savings.
1194 MEM_REF_STATS points to CFUN's memory reference information. */
1196 static void
1197 estimate_vop_reduction (struct mem_ref_stats_d *mem_ref_stats,
1198 mem_sym_stats_t mp_p, tree mpt)
1200 unsigned i;
1201 bitmap_iterator bi;
1202 mem_sym_stats_t mpt_stats;
1204 /* We should only get symbols with indirect references here. */
1205 gcc_assert (mp_p->num_indirect_reads > 0 || mp_p->num_indirect_writes > 0);
1207 /* Note that the only statistics we keep for MPT is the set of
1208 parent tags to know which memory tags have had alias members
1209 partitioned, and the indicator has_call_clobbered_vars.
1210 Reference counts are not important for MPT. */
1211 mpt_stats = get_mem_sym_stats_for (mpt);
1213 /* Traverse all the parent tags for MP_P->VAR. For every tag T, if
1214 partition P is already grouping aliases of T, then reduce the
1215 number of virtual operands by the number of direct references
1216 to T. */
1217 if (mp_p->parent_tags)
1219 if (mpt_stats->parent_tags == NULL)
1220 mpt_stats->parent_tags = BITMAP_ALLOC (&alias_bitmap_obstack);
1222 EXECUTE_IF_SET_IN_BITMAP (mp_p->parent_tags, 0, i, bi)
1224 if (bitmap_bit_p (mpt_stats->parent_tags, i))
1226 /* Partition MPT is already partitioning symbols in the
1227 alias set for TAG. This means that we are now saving
1228 1 virtual operand for every direct reference to TAG. */
1229 tree tag = referenced_var (i);
1230 mem_sym_stats_t tag_stats = mem_sym_stats (cfun, tag);
1231 mem_ref_stats->num_vuses -= tag_stats->num_direct_reads;
1232 mem_ref_stats->num_vdefs -= tag_stats->num_direct_writes;
1234 else
1236 /* This is the first symbol in tag I's alias set that is
1237 being grouped under MPT. We will not save any
1238 virtual operands this time, but record that MPT is
1239 grouping a symbol from TAG's alias set so that the
1240 next time we get the savings. */
1241 bitmap_set_bit (mpt_stats->parent_tags, i);
1246 /* If MP_P->VAR is call-clobbered, and MPT is already grouping
1247 call-clobbered symbols, then we will save as many virtual
1248 operands as asm/call sites there are. */
1249 if (is_call_clobbered (mp_p->var))
1251 if (mpt_stats->has_call_clobbered_vars)
1252 mem_ref_stats->num_vdefs -= mem_ref_stats->num_call_sites
1253 + mem_ref_stats->num_asm_sites;
1254 else
1255 mpt_stats->has_call_clobbered_vars = true;
1260 /* Helper for compute_memory_partitions. Transfer reference counts
1261 from pointers to their pointed-to sets. Counters for pointers were
1262 computed by update_alias_info. MEM_REF_STATS points to CFUN's
1263 memory reference information. */
1265 static void
1266 update_reference_counts (struct mem_ref_stats_d *mem_ref_stats)
1268 unsigned i;
1269 bitmap_iterator bi;
1270 mem_sym_stats_t sym_stats;
1272 for (i = 1; i < num_ssa_names; i++)
1274 tree ptr;
1275 struct ptr_info_def *pi;
1277 ptr = ssa_name (i);
1278 if (ptr
1279 && POINTER_TYPE_P (TREE_TYPE (ptr))
1280 && (pi = SSA_NAME_PTR_INFO (ptr)) != NULL
1281 && pi->is_dereferenced)
1283 unsigned j;
1284 bitmap_iterator bj;
1285 tree tag;
1286 mem_sym_stats_t ptr_stats, tag_stats;
1288 /* If PTR has flow-sensitive points-to information, use
1289 PTR's name tag, otherwise use the symbol tag associated
1290 with PTR's symbol. */
1291 if (pi->name_mem_tag)
1292 tag = pi->name_mem_tag;
1293 else
1294 tag = symbol_mem_tag (SSA_NAME_VAR (ptr));
1296 ptr_stats = get_mem_sym_stats_for (ptr);
1297 tag_stats = get_mem_sym_stats_for (tag);
1299 /* TAG has as many direct references as dereferences we
1300 found for its parent pointer. */
1301 tag_stats->num_direct_reads += ptr_stats->num_direct_reads;
1302 tag_stats->num_direct_writes += ptr_stats->num_direct_writes;
1304 /* All the dereferences of pointer PTR are considered direct
1305 references to PTR's memory tag (TAG). In turn,
1306 references to TAG will become virtual operands for every
1307 symbol in TAG's alias set. So, for every symbol ALIAS in
1308 TAG's alias set, add as many indirect references to ALIAS
1309 as direct references there are for TAG. */
1310 if (MTAG_ALIASES (tag))
1311 EXECUTE_IF_SET_IN_BITMAP (MTAG_ALIASES (tag), 0, j, bj)
1313 tree alias = referenced_var (j);
1314 sym_stats = get_mem_sym_stats_for (alias);
1316 /* All the direct references to TAG are indirect references
1317 to ALIAS. */
1318 sym_stats->num_indirect_reads += ptr_stats->num_direct_reads;
1319 sym_stats->num_indirect_writes += ptr_stats->num_direct_writes;
1320 sym_stats->frequency_reads += ptr_stats->frequency_reads;
1321 sym_stats->frequency_writes += ptr_stats->frequency_writes;
1323 /* Indicate that TAG is one of ALIAS's parent tags. */
1324 if (sym_stats->parent_tags == NULL)
1325 sym_stats->parent_tags = BITMAP_ALLOC (&alias_bitmap_obstack);
1326 bitmap_set_bit (sym_stats->parent_tags, DECL_UID (tag));
1331 /* Call-clobbered symbols are indirectly written at every
1332 call/asm site. */
1333 EXECUTE_IF_SET_IN_BITMAP (gimple_call_clobbered_vars (cfun), 0, i, bi)
1335 tree sym = referenced_var (i);
1336 sym_stats = get_mem_sym_stats_for (sym);
1337 sym_stats->num_indirect_writes += mem_ref_stats->num_call_sites
1338 + mem_ref_stats->num_asm_sites;
1341 /* Addressable symbols are indirectly written at some ASM sites.
1342 Since only ASM sites that clobber memory actually affect
1343 addressable symbols, this is an over-estimation. */
1344 EXECUTE_IF_SET_IN_BITMAP (gimple_addressable_vars (cfun), 0, i, bi)
1346 tree sym = referenced_var (i);
1347 sym_stats = get_mem_sym_stats_for (sym);
1348 sym_stats->num_indirect_writes += mem_ref_stats->num_asm_sites;
1353 /* Helper for compute_memory_partitions. Add all memory symbols to
1354 *MP_INFO_P and compute the initial estimate for the total number of
1355 virtual operands needed. MEM_REF_STATS points to CFUN's memory
1356 reference information. On exit, *TAGS_P will contain the list of
1357 memory tags whose alias set need to be rewritten after
1358 partitioning. */
1360 static void
1361 build_mp_info (struct mem_ref_stats_d *mem_ref_stats,
1362 VEC(mem_sym_stats_t,heap) **mp_info_p,
1363 VEC(tree,heap) **tags_p)
1365 tree var;
1366 referenced_var_iterator rvi;
1368 FOR_EACH_REFERENCED_VAR (var, rvi)
1370 mem_sym_stats_t sym_stats;
1371 tree old_mpt;
1373 /* We are only interested in memory symbols other than MPTs. */
1374 if (is_gimple_reg (var) || TREE_CODE (var) == MEMORY_PARTITION_TAG)
1375 continue;
1377 /* Collect memory tags into the TAGS array so that we can
1378 rewrite their alias sets after partitioning. */
1379 if (MTAG_P (var) && MTAG_ALIASES (var))
1380 VEC_safe_push (tree, heap, *tags_p, var);
1382 /* Since we are going to re-compute partitions, any symbols that
1383 used to belong to a partition must be detached from it and
1384 marked for renaming. */
1385 if ((old_mpt = memory_partition (var)) != NULL)
1387 mark_sym_for_renaming (old_mpt);
1388 set_memory_partition (var, NULL_TREE);
1389 mark_sym_for_renaming (var);
1392 sym_stats = get_mem_sym_stats_for (var);
1394 /* Add VAR's reference info to MP_INFO. Note that the only
1395 symbols that make sense to partition are those that have
1396 indirect references. If a symbol S is always directly
1397 referenced, partitioning it will not reduce the number of
1398 virtual operators. The only symbols that are profitable to
1399 partition are those that belong to alias sets and/or are
1400 call-clobbered. */
1401 if (sym_stats->num_indirect_reads > 0
1402 || sym_stats->num_indirect_writes > 0)
1403 VEC_safe_push (mem_sym_stats_t, heap, *mp_info_p, sym_stats);
1405 /* Update the number of estimated VOPS. Note that direct
1406 references to memory tags are always counted as indirect
1407 references to their alias set members, so if a memory tag has
1408 aliases, do not count its direct references to avoid double
1409 accounting. */
1410 if (!MTAG_P (var) || !MTAG_ALIASES (var))
1412 mem_ref_stats->num_vuses += sym_stats->num_direct_reads;
1413 mem_ref_stats->num_vdefs += sym_stats->num_direct_writes;
1416 mem_ref_stats->num_vuses += sym_stats->num_indirect_reads;
1417 mem_ref_stats->num_vdefs += sym_stats->num_indirect_writes;
1422 /* Compute memory partitions. A memory partition (MPT) is an
1423 arbitrary grouping of memory symbols, such that references to one
1424 member of the group is considered a reference to all the members of
1425 the group.
1427 As opposed to alias sets in memory tags, the grouping into
1428 partitions is completely arbitrary and only done to reduce the
1429 number of virtual operands. The only rule that needs to be
1430 observed when creating memory partitions is that given two memory
1431 partitions MPT.i and MPT.j, they must not contain symbols in
1432 common.
1434 Memory partitions are used when putting the program into Memory-SSA
1435 form. In particular, in Memory-SSA PHI nodes are not computed for
1436 individual memory symbols. They are computed for memory
1437 partitions. This reduces the amount of PHI nodes in the SSA graph
1438 at the expense of precision (i.e., it makes unrelated stores affect
1439 each other).
1441 However, it is possible to increase precision by changing this
1442 partitioning scheme. For instance, if the partitioning scheme is
1443 such that get_mpt_for is the identity function (that is,
1444 get_mpt_for (s) = s), this will result in ultimate precision at the
1445 expense of huge SSA webs.
1447 At the other extreme, a partitioning scheme that groups all the
1448 symbols in the same set results in minimal SSA webs and almost
1449 total loss of precision.
1451 The partitioning heuristic uses three parameters to decide the
1452 order in which symbols are processed. The list of symbols is
1453 sorted so that symbols that are more likely to be partitioned are
1454 near the top of the list:
1456 - Execution frequency. If a memory reference is in a frequently
1457 executed code path, grouping it into a partition may block useful
1458 transformations and cause sub-optimal code generation. So, the
1459 partition heuristic tries to avoid grouping symbols with high
1460 execution frequency scores. Execution frequency is taken
1461 directly from the basic blocks where every reference is made (see
1462 update_mem_sym_stats_from_stmt), which in turn uses the
1463 profile guided machinery, so if the program is compiled with PGO
1464 enabled, more accurate partitioning decisions will be made.
1466 - Number of references. Symbols with few references in the code,
1467 are partitioned before symbols with many references.
1469 - NO_ALIAS attributes. Symbols with any of the NO_ALIAS*
1470 attributes are partitioned after symbols marked MAY_ALIAS.
1472 Once the list is sorted, the partitioning proceeds as follows:
1474 1- For every symbol S in MP_INFO, create a new memory partition MP,
1475 if necessary. To avoid memory partitions that contain symbols
1476 from non-conflicting alias sets, memory partitions are
1477 associated to the memory tag that holds S in its alias set. So,
1478 when looking for a memory partition for S, the memory partition
1479 associated with one of the memory tags holding S is chosen. If
1480 none exists, a new one is created.
1482 2- Add S to memory partition MP.
1484 3- Reduce by 1 the number of VOPS for every memory tag holding S.
1486 4- If the total number of VOPS is less than MAX_ALIASED_VOPS or the
1487 average number of VOPS per statement is less than
1488 AVG_ALIASED_VOPS, stop. Otherwise, go to the next symbol in the
1489 list. */
1491 static void
1492 compute_memory_partitions (void)
1494 tree tag;
1495 unsigned i;
1496 mem_sym_stats_t mp_p;
1497 VEC(mem_sym_stats_t,heap) *mp_info;
1498 bitmap new_aliases;
1499 VEC(tree,heap) *tags;
1500 struct mem_ref_stats_d *mem_ref_stats;
1501 int prev_max_aliased_vops;
1503 mem_ref_stats = gimple_mem_ref_stats (cfun);
1504 gcc_assert (mem_ref_stats->num_vuses == 0 && mem_ref_stats->num_vdefs == 0);
1506 if (mem_ref_stats->num_mem_stmts == 0)
1507 return;
1509 timevar_push (TV_MEMORY_PARTITIONING);
1511 mp_info = NULL;
1512 tags = NULL;
1513 prev_max_aliased_vops = MAX_ALIASED_VOPS;
1515 /* Since we clearly cannot lower the number of virtual operators
1516 below the total number of memory statements in the function, we
1517 may need to adjust MAX_ALIASED_VOPS beforehand. */
1518 if (MAX_ALIASED_VOPS < mem_ref_stats->num_mem_stmts)
1519 MAX_ALIASED_VOPS = mem_ref_stats->num_mem_stmts;
1521 /* Update reference stats for all the pointed-to variables and
1522 memory tags. */
1523 update_reference_counts (mem_ref_stats);
1525 /* Add all the memory symbols to MP_INFO. */
1526 build_mp_info (mem_ref_stats, &mp_info, &tags);
1528 /* No partitions required if we are below the threshold. */
1529 if (!need_to_partition_p (mem_ref_stats))
1531 if (dump_file)
1532 fprintf (dump_file, "\nMemory partitioning NOT NEEDED for %s\n",
1533 get_name (current_function_decl));
1534 goto done;
1537 /* Sort the MP_INFO array so that symbols that should be partitioned
1538 first are near the top of the list. */
1539 sort_mp_info (mp_info);
1541 if (dump_file)
1543 fprintf (dump_file, "\nMemory partitioning NEEDED for %s\n\n",
1544 get_name (current_function_decl));
1545 fprintf (dump_file, "Memory symbol references before partitioning:\n");
1546 dump_mp_info (dump_file, mp_info);
1549 /* Create partitions for variables in MP_INFO until we have enough
1550 to lower the total number of VOPS below MAX_ALIASED_VOPS or if
1551 the average number of VOPS per statement is below
1552 AVG_ALIASED_VOPS. */
1553 for (i = 0; VEC_iterate (mem_sym_stats_t, mp_info, i, mp_p); i++)
1555 tree mpt;
1557 /* If we are below the threshold, stop. */
1558 if (!need_to_partition_p (mem_ref_stats))
1559 break;
1561 mpt = find_partition_for (mp_p);
1562 estimate_vop_reduction (mem_ref_stats, mp_p, mpt);
1565 /* After partitions have been created, rewrite alias sets to use
1566 them instead of the original symbols. This way, if the alias set
1567 was computed as { a b c d e f }, and the subset { b e f } was
1568 grouped into partition MPT.3, then the new alias set for the tag
1569 will be { a c d MPT.3 }.
1571 Note that this is not strictly necessary. The operand scanner
1572 will always check if a symbol belongs to a partition when adding
1573 virtual operands. However, by reducing the size of the alias
1574 sets to be scanned, the work needed inside the operand scanner is
1575 significantly reduced. */
1576 new_aliases = BITMAP_ALLOC (&alias_bitmap_obstack);
1578 for (i = 0; VEC_iterate (tree, tags, i, tag); i++)
1580 rewrite_alias_set_for (tag, new_aliases);
1581 bitmap_clear (new_aliases);
1584 BITMAP_FREE (new_aliases);
1586 if (dump_file)
1588 fprintf (dump_file, "\nMemory symbol references after partitioning:\n");
1589 dump_mp_info (dump_file, mp_info);
1592 done:
1593 /* Free allocated memory. */
1594 VEC_free (mem_sym_stats_t, heap, mp_info);
1595 VEC_free (tree, heap, tags);
1597 MAX_ALIASED_VOPS = prev_max_aliased_vops;
1599 timevar_pop (TV_MEMORY_PARTITIONING);
1603 /* Compute may-alias information for every variable referenced in function
1604 FNDECL.
1606 Alias analysis proceeds in 3 main phases:
1608 1- Points-to and escape analysis.
1610 This phase walks the use-def chains in the SSA web looking for three
1611 things:
1613 * Assignments of the form P_i = &VAR
1614 * Assignments of the form P_i = malloc()
1615 * Pointers and ADDR_EXPR that escape the current function.
1617 The concept of 'escaping' is the same one used in the Java world. When
1618 a pointer or an ADDR_EXPR escapes, it means that it has been exposed
1619 outside of the current function. So, assignment to global variables,
1620 function arguments and returning a pointer are all escape sites, as are
1621 conversions between pointers and integers.
1623 This is where we are currently limited. Since not everything is renamed
1624 into SSA, we lose track of escape properties when a pointer is stashed
1625 inside a field in a structure, for instance. In those cases, we are
1626 assuming that the pointer does escape.
1628 We use escape analysis to determine whether a variable is
1629 call-clobbered. Simply put, if an ADDR_EXPR escapes, then the variable
1630 is call-clobbered. If a pointer P_i escapes, then all the variables
1631 pointed-to by P_i (and its memory tag) also escape.
1633 2- Compute flow-sensitive aliases
1635 We have two classes of memory tags. Memory tags associated with the
1636 pointed-to data type of the pointers in the program. These tags are
1637 called "symbol memory tag" (SMT). The other class are those associated
1638 with SSA_NAMEs, called "name memory tag" (NMT). The basic idea is that
1639 when adding operands for an INDIRECT_REF *P_i, we will first check
1640 whether P_i has a name tag, if it does we use it, because that will have
1641 more precise aliasing information. Otherwise, we use the standard symbol
1642 tag.
1644 In this phase, we go through all the pointers we found in points-to
1645 analysis and create alias sets for the name memory tags associated with
1646 each pointer P_i. If P_i escapes, we mark call-clobbered the variables
1647 it points to and its tag.
1650 3- Compute flow-insensitive aliases
1652 This pass will compare the alias set of every symbol memory tag and
1653 every addressable variable found in the program. Given a symbol
1654 memory tag SMT and an addressable variable V, if the alias sets of
1655 SMT and V conflict (as computed by may_alias_p), then V is marked
1656 as an alias tag and added to the alias set of SMT.
1658 For instance, consider the following function:
1660 foo (int i)
1662 int *p, a, b;
1664 if (i > 10)
1665 p = &a;
1666 else
1667 p = &b;
1669 *p = 3;
1670 a = b + 2;
1671 return *p;
1674 After aliasing analysis has finished, the symbol memory tag for pointer
1675 'p' will have two aliases, namely variables 'a' and 'b'. Every time
1676 pointer 'p' is dereferenced, we want to mark the operation as a
1677 potential reference to 'a' and 'b'.
1679 foo (int i)
1681 int *p, a, b;
1683 if (i_2 > 10)
1684 p_4 = &a;
1685 else
1686 p_6 = &b;
1687 # p_1 = PHI <p_4(1), p_6(2)>;
1689 # a_7 = VDEF <a_3>;
1690 # b_8 = VDEF <b_5>;
1691 *p_1 = 3;
1693 # a_9 = VDEF <a_7>
1694 # VUSE <b_8>
1695 a_9 = b_8 + 2;
1697 # VUSE <a_9>;
1698 # VUSE <b_8>;
1699 return *p_1;
1702 In certain cases, the list of may aliases for a pointer may grow too
1703 large. This may cause an explosion in the number of virtual operands
1704 inserted in the code, resulting in increased memory consumption and
1705 compilation time.
1707 When the number of virtual operands needed to represent aliased
1708 loads and stores grows too large (configurable with option --param
1709 max-aliased-vops and --param avg-aliased-vops), alias sets are
1710 grouped to avoid severe compile-time slow downs and memory
1711 consumption. See compute_memory_partitions. */
1713 unsigned int
1714 compute_may_aliases (void)
1716 struct alias_info *ai;
1718 timevar_push (TV_TREE_MAY_ALIAS);
1720 memset (&alias_stats, 0, sizeof (alias_stats));
1722 /* Initialize aliasing information. */
1723 ai = init_alias_info ();
1725 /* For each pointer P_i, determine the sets of variables that P_i may
1726 point-to. For every addressable variable V, determine whether the
1727 address of V escapes the current function, making V call-clobbered
1728 (i.e., whether &V is stored in a global variable or if its passed as a
1729 function call argument). */
1730 compute_points_to_sets (ai);
1732 /* Collect all pointers and addressable variables, compute alias sets,
1733 create memory tags for pointers and promote variables whose address is
1734 not needed anymore. */
1735 setup_pointers_and_addressables (ai);
1737 /* Compute type-based flow-insensitive aliasing for all the type
1738 memory tags. */
1739 compute_flow_insensitive_aliasing (ai);
1741 /* Compute flow-sensitive, points-to based aliasing for all the name
1742 memory tags. */
1743 compute_flow_sensitive_aliasing (ai);
1745 /* Compute call clobbering information. */
1746 compute_call_clobbered (ai);
1748 /* If the program makes no reference to global variables, but it
1749 contains a mixture of pure and non-pure functions, then we need
1750 to create use-def and def-def links between these functions to
1751 avoid invalid transformations on them. */
1752 maybe_create_global_var ();
1754 /* Compute memory partitions for every memory variable. */
1755 compute_memory_partitions ();
1757 /* Remove partitions with no symbols. Partitions may end up with an
1758 empty MPT_SYMBOLS set if a previous round of alias analysis
1759 needed to partition more symbols. Since we don't need those
1760 partitions anymore, remove them to free up the space. */
1762 tree mpt;
1763 unsigned i;
1764 VEC(tree,heap) *mpt_table;
1766 mpt_table = gimple_ssa_operands (cfun)->mpt_table;
1767 i = 0;
1768 while (i < VEC_length (tree, mpt_table))
1770 mpt = VEC_index (tree, mpt_table, i);
1771 if (MPT_SYMBOLS (mpt) == NULL)
1772 VEC_unordered_remove (tree, mpt_table, i);
1773 else
1774 i++;
1778 /* Populate all virtual operands and newly promoted register operands. */
1780 block_stmt_iterator bsi;
1781 basic_block bb;
1782 FOR_EACH_BB (bb)
1783 for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
1784 update_stmt_if_modified (bsi_stmt (bsi));
1787 /* Debugging dumps. */
1788 if (dump_file)
1790 dump_mem_ref_stats (dump_file);
1791 dump_alias_info (dump_file);
1792 dump_points_to_info (dump_file);
1794 if (dump_flags & TDF_STATS)
1795 dump_alias_stats (dump_file);
1797 if (dump_flags & TDF_DETAILS)
1798 dump_referenced_vars (dump_file);
1801 /* Report strict aliasing violations. */
1802 strict_aliasing_warning_backend ();
1804 /* Deallocate memory used by aliasing data structures. */
1805 delete_alias_info (ai);
1807 if (need_ssa_update_p ())
1808 update_ssa (TODO_update_ssa);
1810 timevar_pop (TV_TREE_MAY_ALIAS);
1812 return 0;
1815 /* Data structure used to count the number of dereferences to PTR
1816 inside an expression. */
1817 struct count_ptr_d
1819 tree ptr;
1820 unsigned count;
1824 /* Helper for count_uses_and_derefs. Called by walk_tree to look for
1825 (ALIGN/MISALIGNED_)INDIRECT_REF nodes for the pointer passed in DATA. */
1827 static tree
1828 count_ptr_derefs (tree *tp, int *walk_subtrees, void *data)
1830 struct count_ptr_d *count_p = (struct count_ptr_d *) data;
1832 /* Do not walk inside ADDR_EXPR nodes. In the expression &ptr->fld,
1833 pointer 'ptr' is *not* dereferenced, it is simply used to compute
1834 the address of 'fld' as 'ptr + offsetof(fld)'. */
1835 if (TREE_CODE (*tp) == ADDR_EXPR)
1837 *walk_subtrees = 0;
1838 return NULL_TREE;
1841 if (INDIRECT_REF_P (*tp) && TREE_OPERAND (*tp, 0) == count_p->ptr)
1842 count_p->count++;
1844 return NULL_TREE;
1848 /* Count the number of direct and indirect uses for pointer PTR in
1849 statement STMT. The number of direct uses is stored in
1850 *NUM_USES_P. Indirect references are counted separately depending
1851 on whether they are store or load operations. The counts are
1852 stored in *NUM_STORES_P and *NUM_LOADS_P. */
1854 void
1855 count_uses_and_derefs (tree ptr, tree stmt, unsigned *num_uses_p,
1856 unsigned *num_loads_p, unsigned *num_stores_p)
1858 ssa_op_iter i;
1859 tree use;
1861 *num_uses_p = 0;
1862 *num_loads_p = 0;
1863 *num_stores_p = 0;
1865 /* Find out the total number of uses of PTR in STMT. */
1866 FOR_EACH_SSA_TREE_OPERAND (use, stmt, i, SSA_OP_USE)
1867 if (use == ptr)
1868 (*num_uses_p)++;
1870 /* Now count the number of indirect references to PTR. This is
1871 truly awful, but we don't have much choice. There are no parent
1872 pointers inside INDIRECT_REFs, so an expression like
1873 '*x_1 = foo (x_1, *x_1)' needs to be traversed piece by piece to
1874 find all the indirect and direct uses of x_1 inside. The only
1875 shortcut we can take is the fact that GIMPLE only allows
1876 INDIRECT_REFs inside the expressions below. */
1877 if (TREE_CODE (stmt) == GIMPLE_MODIFY_STMT
1878 || (TREE_CODE (stmt) == RETURN_EXPR
1879 && TREE_CODE (TREE_OPERAND (stmt, 0)) == GIMPLE_MODIFY_STMT)
1880 || TREE_CODE (stmt) == ASM_EXPR
1881 || TREE_CODE (stmt) == CALL_EXPR)
1883 tree lhs, rhs;
1885 if (TREE_CODE (stmt) == GIMPLE_MODIFY_STMT)
1887 lhs = GIMPLE_STMT_OPERAND (stmt, 0);
1888 rhs = GIMPLE_STMT_OPERAND (stmt, 1);
1890 else if (TREE_CODE (stmt) == RETURN_EXPR)
1892 tree e = TREE_OPERAND (stmt, 0);
1893 lhs = GIMPLE_STMT_OPERAND (e, 0);
1894 rhs = GIMPLE_STMT_OPERAND (e, 1);
1896 else if (TREE_CODE (stmt) == ASM_EXPR)
1898 lhs = ASM_OUTPUTS (stmt);
1899 rhs = ASM_INPUTS (stmt);
1901 else
1903 lhs = NULL_TREE;
1904 rhs = stmt;
1907 if (lhs
1908 && (TREE_CODE (lhs) == TREE_LIST
1909 || EXPR_P (lhs)
1910 || GIMPLE_STMT_P (lhs)))
1912 struct count_ptr_d count;
1913 count.ptr = ptr;
1914 count.count = 0;
1915 walk_tree (&lhs, count_ptr_derefs, &count, NULL);
1916 *num_stores_p = count.count;
1919 if (rhs
1920 && (TREE_CODE (rhs) == TREE_LIST
1921 || EXPR_P (rhs)
1922 || GIMPLE_STMT_P (rhs)))
1924 struct count_ptr_d count;
1925 count.ptr = ptr;
1926 count.count = 0;
1927 walk_tree (&rhs, count_ptr_derefs, &count, NULL);
1928 *num_loads_p = count.count;
1932 gcc_assert (*num_uses_p >= *num_loads_p + *num_stores_p);
1935 /* Remove memory references stats for function FN. */
1937 void
1938 delete_mem_ref_stats (struct function *fn)
1940 if (gimple_mem_ref_stats (fn)->mem_sym_stats)
1942 free_alloc_pool (mem_sym_stats_pool);
1943 pointer_map_destroy (gimple_mem_ref_stats (fn)->mem_sym_stats);
1945 gimple_mem_ref_stats (fn)->mem_sym_stats = NULL;
1949 /* Initialize memory reference stats. */
1951 static void
1952 init_mem_ref_stats (void)
1954 struct mem_ref_stats_d *mem_ref_stats = gimple_mem_ref_stats (cfun);
1956 mem_sym_stats_pool = create_alloc_pool ("Mem sym stats",
1957 sizeof (struct mem_sym_stats_d),
1958 100);
1959 memset (mem_ref_stats, 0, sizeof (struct mem_ref_stats_d));
1960 mem_ref_stats->mem_sym_stats = pointer_map_create ();
1964 /* Helper for init_alias_info. Reset existing aliasing information. */
1966 static void
1967 reset_alias_info (void)
1969 referenced_var_iterator rvi;
1970 tree var;
1971 unsigned i;
1972 bitmap active_nmts, all_nmts;
1974 /* Clear the set of addressable variables. We do not need to clear
1975 the TREE_ADDRESSABLE bit on every symbol because we are going to
1976 re-compute addressability here. */
1977 bitmap_clear (gimple_addressable_vars (cfun));
1979 active_nmts = BITMAP_ALLOC (&alias_bitmap_obstack);
1980 all_nmts = BITMAP_ALLOC (&alias_bitmap_obstack);
1982 /* Clear flow-insensitive alias information from each symbol. */
1983 FOR_EACH_REFERENCED_VAR (var, rvi)
1985 if (is_gimple_reg (var))
1986 continue;
1988 if (MTAG_P (var))
1989 MTAG_ALIASES (var) = NULL;
1991 /* Memory partition information will be computed from scratch. */
1992 if (TREE_CODE (var) == MEMORY_PARTITION_TAG)
1993 MPT_SYMBOLS (var) = NULL;
1995 /* Collect all the name tags to determine if we have any
1996 orphaned that need to be removed from the IL. A name tag
1997 will be orphaned if it is not associated with any active SSA
1998 name. */
1999 if (TREE_CODE (var) == NAME_MEMORY_TAG)
2000 bitmap_set_bit (all_nmts, DECL_UID (var));
2002 /* Since we are about to re-discover call-clobbered
2003 variables, clear the call-clobbered flag. */
2004 clear_call_clobbered (var);
2007 /* There should be no call-clobbered variable left. */
2008 gcc_assert (bitmap_empty_p (gimple_call_clobbered_vars (cfun)));
2010 /* Clear flow-sensitive points-to information from each SSA name. */
2011 for (i = 1; i < num_ssa_names; i++)
2013 tree name = ssa_name (i);
2015 if (!name || !POINTER_TYPE_P (TREE_TYPE (name)))
2016 continue;
2018 if (SSA_NAME_PTR_INFO (name))
2020 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (name);
2022 /* Clear all the flags but keep the name tag to
2023 avoid creating new temporaries unnecessarily. If
2024 this pointer is found to point to a subset or
2025 superset of its former points-to set, then a new
2026 tag will need to be created in create_name_tags. */
2027 pi->pt_anything = 0;
2028 pi->pt_null = 0;
2029 pi->value_escapes_p = 0;
2030 pi->is_dereferenced = 0;
2031 if (pi->pt_vars)
2032 bitmap_clear (pi->pt_vars);
2034 /* Add NAME's name tag to the set of active tags. */
2035 if (pi->name_mem_tag)
2036 bitmap_set_bit (active_nmts, DECL_UID (pi->name_mem_tag));
2040 /* Name memory tags that are no longer associated with an SSA name
2041 are considered stale and should be removed from the IL. All the
2042 name tags that are in the set ALL_NMTS but not in ACTIVE_NMTS are
2043 considered stale and marked for renaming. */
2044 bitmap_and_compl_into (all_nmts, active_nmts);
2045 mark_set_for_renaming (all_nmts);
2047 BITMAP_FREE (all_nmts);
2048 BITMAP_FREE (active_nmts);
2052 /* Initialize the data structures used for alias analysis. */
2054 static struct alias_info *
2055 init_alias_info (void)
2057 struct alias_info *ai;
2058 referenced_var_iterator rvi;
2059 tree var;
2061 ai = XCNEW (struct alias_info);
2062 ai->ssa_names_visited = sbitmap_alloc (num_ssa_names);
2063 sbitmap_zero (ai->ssa_names_visited);
2064 ai->processed_ptrs = VEC_alloc (tree, heap, 50);
2065 ai->written_vars = pointer_set_create ();
2066 ai->dereferenced_ptrs_store = pointer_set_create ();
2067 ai->dereferenced_ptrs_load = pointer_set_create ();
2069 /* Clear out all memory reference stats. */
2070 init_mem_ref_stats ();
2072 /* If aliases have been computed before, clear existing information. */
2073 if (gimple_aliases_computed_p (cfun))
2074 reset_alias_info ();
2075 else
2077 /* If this is the first time we compute aliasing information,
2078 every non-register symbol will need to be put into SSA form
2079 (the initial SSA form only operates on GIMPLE registers). */
2080 FOR_EACH_REFERENCED_VAR (var, rvi)
2081 if (!is_gimple_reg (var))
2082 mark_sym_for_renaming (var);
2085 /* Next time, we will need to reset alias information. */
2086 cfun->gimple_df->aliases_computed_p = true;
2087 if (alias_bitmap_obstack.elements != NULL)
2088 bitmap_obstack_release (&alias_bitmap_obstack);
2089 bitmap_obstack_initialize (&alias_bitmap_obstack);
2091 return ai;
2095 /* Deallocate memory used by alias analysis. */
2097 static void
2098 delete_alias_info (struct alias_info *ai)
2100 size_t i;
2102 sbitmap_free (ai->ssa_names_visited);
2104 VEC_free (tree, heap, ai->processed_ptrs);
2106 for (i = 0; i < ai->num_addressable_vars; i++)
2107 free (ai->addressable_vars[i]);
2108 free (ai->addressable_vars);
2110 for (i = 0; i < ai->num_pointers; i++)
2111 free (ai->pointers[i]);
2112 free (ai->pointers);
2114 pointer_set_destroy (ai->written_vars);
2115 pointer_set_destroy (ai->dereferenced_ptrs_store);
2116 pointer_set_destroy (ai->dereferenced_ptrs_load);
2117 free (ai);
2119 delete_mem_ref_stats (cfun);
2120 delete_points_to_sets ();
2124 /* Used for hashing to identify pointer infos with identical
2125 pt_vars bitmaps. */
2127 static int
2128 eq_ptr_info (const void *p1, const void *p2)
2130 const struct ptr_info_def *n1 = (const struct ptr_info_def *) p1;
2131 const struct ptr_info_def *n2 = (const struct ptr_info_def *) p2;
2132 return bitmap_equal_p (n1->pt_vars, n2->pt_vars);
2135 static hashval_t
2136 ptr_info_hash (const void *p)
2138 const struct ptr_info_def *n = (const struct ptr_info_def *) p;
2139 return bitmap_hash (n->pt_vars);
2143 /* Create name tags for all the pointers that have been dereferenced.
2144 We only create a name tag for a pointer P if P is found to point to
2145 a set of variables (so that we can alias them to *P) or if it is
2146 the result of a call to malloc (which means that P cannot point to
2147 anything else nor alias any other variable).
2149 If two pointers P and Q point to the same set of variables, they
2150 are assigned the same name tag. */
2152 static void
2153 create_name_tags (void)
2155 size_t i;
2156 VEC (tree, heap) *with_ptvars = NULL;
2157 tree ptr;
2158 htab_t ptr_hash;
2160 /* Collect the list of pointers with a non-empty points to set. */
2161 for (i = 1; i < num_ssa_names; i++)
2163 tree ptr = ssa_name (i);
2164 struct ptr_info_def *pi;
2166 if (!ptr
2167 || !POINTER_TYPE_P (TREE_TYPE (ptr))
2168 || !SSA_NAME_PTR_INFO (ptr))
2169 continue;
2171 pi = SSA_NAME_PTR_INFO (ptr);
2173 if (pi->pt_anything || !pi->is_dereferenced)
2175 /* No name tags for pointers that have not been
2176 dereferenced or point to an arbitrary location. */
2177 pi->name_mem_tag = NULL_TREE;
2178 continue;
2181 /* Set pt_anything on the pointers without pt_vars filled in so
2182 that they are assigned a symbol tag. */
2183 if (pi->pt_vars && !bitmap_empty_p (pi->pt_vars))
2184 VEC_safe_push (tree, heap, with_ptvars, ptr);
2185 else
2186 set_pt_anything (ptr);
2189 /* If we didn't find any pointers with pt_vars set, we're done. */
2190 if (!with_ptvars)
2191 return;
2193 ptr_hash = htab_create (10, ptr_info_hash, eq_ptr_info, NULL);
2195 /* Now go through the pointers with pt_vars, and find a name tag
2196 with the same pt_vars as this pointer, or create one if one
2197 doesn't exist. */
2198 for (i = 0; VEC_iterate (tree, with_ptvars, i, ptr); i++)
2200 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (ptr);
2201 tree old_name_tag = pi->name_mem_tag;
2202 struct ptr_info_def **slot;
2204 /* If PTR points to a set of variables, check if we don't
2205 have another pointer Q with the same points-to set before
2206 creating a tag. If so, use Q's tag instead of creating a
2207 new one.
2209 This is important for not creating unnecessary symbols
2210 and also for copy propagation. If we ever need to
2211 propagate PTR into Q or vice-versa, we would run into
2212 problems if they both had different name tags because
2213 they would have different SSA version numbers (which
2214 would force us to take the name tags in and out of SSA). */
2215 slot = (struct ptr_info_def **) htab_find_slot (ptr_hash, pi, INSERT);
2216 if (*slot)
2217 pi->name_mem_tag = (*slot)->name_mem_tag;
2218 else
2220 *slot = pi;
2222 /* If we didn't find a pointer with the same points-to set
2223 as PTR, create a new name tag if needed. */
2224 if (pi->name_mem_tag == NULL_TREE)
2225 pi->name_mem_tag = get_nmt_for (ptr);
2228 /* If the new name tag computed for PTR is different than
2229 the old name tag that it used to have, then the old tag
2230 needs to be removed from the IL, so we mark it for
2231 renaming. */
2232 if (old_name_tag && old_name_tag != pi->name_mem_tag)
2233 mark_sym_for_renaming (old_name_tag);
2235 /* Inherit volatility from the pointed-to type. */
2236 TREE_THIS_VOLATILE (pi->name_mem_tag)
2237 |= TYPE_VOLATILE (TREE_TYPE (TREE_TYPE (ptr)));
2239 /* Mark the new name tag for renaming. */
2240 mark_sym_for_renaming (pi->name_mem_tag);
2243 htab_delete (ptr_hash);
2245 VEC_free (tree, heap, with_ptvars);
2249 /* Union the alias set SET into the may-aliases for TAG. */
2251 static void
2252 union_alias_set_into (tree tag, bitmap set)
2254 bitmap ma = MTAG_ALIASES (tag);
2256 if (bitmap_empty_p (set))
2257 return;
2259 if (!ma)
2260 ma = MTAG_ALIASES (tag) = BITMAP_ALLOC (&alias_bitmap_obstack);
2261 bitmap_ior_into (ma, set);
2265 /* For every pointer P_i in AI->PROCESSED_PTRS, create may-alias sets for
2266 the name memory tag (NMT) associated with P_i. If P_i escapes, then its
2267 name tag and the variables it points-to are call-clobbered. Finally, if
2268 P_i escapes and we could not determine where it points to, then all the
2269 variables in the same alias set as *P_i are marked call-clobbered. This
2270 is necessary because we must assume that P_i may take the address of any
2271 variable in the same alias set. */
2273 static void
2274 compute_flow_sensitive_aliasing (struct alias_info *ai)
2276 size_t i;
2277 tree ptr;
2279 timevar_push (TV_FLOW_SENSITIVE);
2280 set_used_smts ();
2282 for (i = 0; VEC_iterate (tree, ai->processed_ptrs, i, ptr); i++)
2284 if (!find_what_p_points_to (ptr))
2285 set_pt_anything (ptr);
2288 create_name_tags ();
2290 for (i = 0; VEC_iterate (tree, ai->processed_ptrs, i, ptr); i++)
2292 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (ptr);
2294 /* Set up aliasing information for PTR's name memory tag (if it has
2295 one). Note that only pointers that have been dereferenced will
2296 have a name memory tag. */
2297 if (pi->name_mem_tag && pi->pt_vars)
2299 if (!bitmap_empty_p (pi->pt_vars))
2300 union_alias_set_into (pi->name_mem_tag, pi->pt_vars);
2303 timevar_pop (TV_FLOW_SENSITIVE);
2307 /* Return TRUE if at least one symbol in TAG2's alias set is also
2308 present in TAG1's alias set. */
2310 static bool
2311 have_common_aliases_p (bitmap tag1aliases, bitmap tag2aliases)
2314 /* This is the old behavior of have_common_aliases_p, which is to
2315 return false if both sets are empty, or one set is and the other
2316 isn't. */
2317 if (tag1aliases == NULL || tag2aliases == NULL)
2318 return false;
2320 return bitmap_intersect_p (tag1aliases, tag2aliases);
2323 /* Compute type-based alias sets. Traverse all the pointers and
2324 addressable variables found in setup_pointers_and_addressables.
2326 For every pointer P in AI->POINTERS and addressable variable V in
2327 AI->ADDRESSABLE_VARS, add V to the may-alias sets of P's symbol
2328 memory tag (SMT) if their alias sets conflict. V is then marked as
2329 an aliased symbol so that the operand scanner knows that statements
2330 containing V have aliased operands. */
2332 static void
2333 compute_flow_insensitive_aliasing (struct alias_info *ai)
2335 size_t i;
2337 timevar_push (TV_FLOW_INSENSITIVE);
2338 /* For every pointer P, determine which addressable variables may alias
2339 with P's symbol memory tag. */
2340 for (i = 0; i < ai->num_pointers; i++)
2342 size_t j;
2343 struct alias_map_d *p_map = ai->pointers[i];
2344 tree tag = symbol_mem_tag (p_map->var);
2345 tree var;
2347 for (j = 0; j < ai->num_addressable_vars; j++)
2349 struct alias_map_d *v_map;
2350 var_ann_t v_ann;
2351 bool tag_stored_p, var_stored_p;
2353 v_map = ai->addressable_vars[j];
2354 var = v_map->var;
2355 v_ann = var_ann (var);
2357 /* Skip memory tags and variables that have never been
2358 written to. We also need to check if the variables are
2359 call-clobbered because they may be overwritten by
2360 function calls. */
2361 tag_stored_p = pointer_set_contains (ai->written_vars, tag)
2362 || is_call_clobbered (tag);
2363 var_stored_p = pointer_set_contains (ai->written_vars, var)
2364 || is_call_clobbered (var);
2365 if (!tag_stored_p && !var_stored_p)
2366 continue;
2368 if (may_alias_p (p_map->var, p_map->set, var, v_map->set, false))
2370 /* Add VAR to TAG's may-aliases set. */
2371 add_may_alias (tag, var);
2376 /* Since this analysis is based exclusively on symbols, it fails to
2377 handle cases where two pointers P and Q have different memory
2378 tags with conflicting alias set numbers but no aliased symbols in
2379 common.
2381 For example, suppose that we have two memory tags SMT.1 and SMT.2
2382 such that
2384 may-aliases (SMT.1) = { a }
2385 may-aliases (SMT.2) = { b }
2387 and the alias set number of SMT.1 conflicts with that of SMT.2.
2388 Since they don't have symbols in common, loads and stores from
2389 SMT.1 and SMT.2 will seem independent of each other, which will
2390 lead to the optimizers making invalid transformations (see
2391 testsuite/gcc.c-torture/execute/pr15262-[12].c).
2393 To avoid this problem, we do a final traversal of AI->POINTERS
2394 looking for pairs of pointers that have no aliased symbols in
2395 common and yet have conflicting alias set numbers. */
2396 for (i = 0; i < ai->num_pointers; i++)
2398 size_t j;
2399 struct alias_map_d *p_map1 = ai->pointers[i];
2400 tree tag1 = symbol_mem_tag (p_map1->var);
2401 bitmap may_aliases1 = MTAG_ALIASES (tag1);
2403 for (j = 0; j < ai->num_pointers; j++)
2405 struct alias_map_d *p_map2 = ai->pointers[j];
2406 tree tag2 = symbol_mem_tag (p_map2->var);
2407 bitmap may_aliases2 = may_aliases (tag2);
2409 /* By convention tags don't alias themselves. */
2410 if (tag1 == tag2)
2411 continue;
2413 /* If the pointers may not point to each other, do nothing. */
2414 if (!may_alias_p (p_map1->var, p_map1->set, tag2, p_map2->set, true))
2415 continue;
2417 /* The two pointers may alias each other. If they already have
2418 symbols in common, do nothing. */
2419 if (have_common_aliases_p (may_aliases1, may_aliases2))
2420 continue;
2422 add_may_alias (tag1, tag2);
2425 timevar_pop (TV_FLOW_INSENSITIVE);
2429 /* Create a new alias set entry for VAR in AI->ADDRESSABLE_VARS. */
2431 static void
2432 create_alias_map_for (tree var, struct alias_info *ai)
2434 struct alias_map_d *alias_map;
2435 alias_map = XCNEW (struct alias_map_d);
2436 alias_map->var = var;
2437 alias_map->set = get_alias_set (var);
2438 ai->addressable_vars[ai->num_addressable_vars++] = alias_map;
2442 /* Create memory tags for all the dereferenced pointers and build the
2443 ADDRESSABLE_VARS and POINTERS arrays used for building the may-alias
2444 sets. Based on the address escape and points-to information collected
2445 earlier, this pass will also clear the TREE_ADDRESSABLE flag from those
2446 variables whose address is not needed anymore. */
2448 static void
2449 setup_pointers_and_addressables (struct alias_info *ai)
2451 size_t num_addressable_vars, num_pointers;
2452 referenced_var_iterator rvi;
2453 tree var;
2454 VEC (tree, heap) *varvec = NULL;
2455 safe_referenced_var_iterator srvi;
2457 /* Size up the arrays ADDRESSABLE_VARS and POINTERS. */
2458 num_addressable_vars = num_pointers = 0;
2460 FOR_EACH_REFERENCED_VAR (var, rvi)
2462 if (may_be_aliased (var))
2463 num_addressable_vars++;
2465 if (POINTER_TYPE_P (TREE_TYPE (var)))
2467 /* Since we don't keep track of volatile variables, assume that
2468 these pointers are used in indirect store operations. */
2469 if (TREE_THIS_VOLATILE (var))
2470 pointer_set_insert (ai->dereferenced_ptrs_store, var);
2472 num_pointers++;
2476 /* Create ADDRESSABLE_VARS and POINTERS. Note that these arrays are
2477 always going to be slightly bigger than we actually need them
2478 because some TREE_ADDRESSABLE variables will be marked
2479 non-addressable below and only pointers with unique symbol tags are
2480 going to be added to POINTERS. */
2481 ai->addressable_vars = XCNEWVEC (struct alias_map_d *, num_addressable_vars);
2482 ai->pointers = XCNEWVEC (struct alias_map_d *, num_pointers);
2483 ai->num_addressable_vars = 0;
2484 ai->num_pointers = 0;
2486 FOR_EACH_REFERENCED_VAR_SAFE (var, varvec, srvi)
2488 /* Name memory tags already have flow-sensitive aliasing
2489 information, so they need not be processed by
2490 compute_flow_insensitive_aliasing. Similarly, symbol memory
2491 tags are already accounted for when we process their
2492 associated pointer.
2494 Structure fields, on the other hand, have to have some of this
2495 information processed for them, but it's pointless to mark them
2496 non-addressable (since they are fake variables anyway). */
2497 if (MTAG_P (var))
2498 continue;
2500 /* Remove the ADDRESSABLE flag from every addressable variable whose
2501 address is not needed anymore. This is caused by the propagation
2502 of ADDR_EXPR constants into INDIRECT_REF expressions and the
2503 removal of dead pointer assignments done by the early scalar
2504 cleanup passes. */
2505 if (TREE_ADDRESSABLE (var))
2507 if (!bitmap_bit_p (gimple_addressable_vars (cfun), DECL_UID (var))
2508 && TREE_CODE (var) != RESULT_DECL
2509 && !is_global_var (var))
2511 bool okay_to_mark = true;
2513 /* Since VAR is now a regular GIMPLE register, we will need
2514 to rename VAR into SSA afterwards. */
2515 mark_sym_for_renaming (var);
2517 /* The address of VAR is not needed, remove the
2518 addressable bit, so that it can be optimized as a
2519 regular variable. */
2520 if (okay_to_mark)
2522 /* The memory partition holding VAR will no longer
2523 contain VAR, and statements referencing it will need
2524 to be updated. */
2525 if (memory_partition (var))
2526 mark_sym_for_renaming (memory_partition (var));
2528 mark_non_addressable (var);
2533 /* Global variables and addressable locals may be aliased. Create an
2534 entry in ADDRESSABLE_VARS for VAR. */
2535 if (may_be_aliased (var))
2537 create_alias_map_for (var, ai);
2538 mark_sym_for_renaming (var);
2541 /* Add pointer variables that have been dereferenced to the POINTERS
2542 array and create a symbol memory tag for them. */
2543 if (POINTER_TYPE_P (TREE_TYPE (var)))
2545 if ((pointer_set_contains (ai->dereferenced_ptrs_store, var)
2546 || pointer_set_contains (ai->dereferenced_ptrs_load, var)))
2548 tree tag, old_tag;
2549 var_ann_t t_ann;
2551 /* If pointer VAR still doesn't have a memory tag
2552 associated with it, create it now or re-use an
2553 existing one. */
2554 tag = get_smt_for (var, ai);
2555 t_ann = var_ann (tag);
2557 /* The symbol tag will need to be renamed into SSA
2558 afterwards. Note that we cannot do this inside
2559 get_smt_for because aliasing may run multiple times
2560 and we only create symbol tags the first time. */
2561 mark_sym_for_renaming (tag);
2563 /* Similarly, if pointer VAR used to have another type
2564 tag, we will need to process it in the renamer to
2565 remove the stale virtual operands. */
2566 old_tag = symbol_mem_tag (var);
2567 if (old_tag)
2568 mark_sym_for_renaming (old_tag);
2570 /* Associate the tag with pointer VAR. */
2571 set_symbol_mem_tag (var, tag);
2573 /* If pointer VAR has been used in a store operation,
2574 then its memory tag must be marked as written-to. */
2575 if (pointer_set_contains (ai->dereferenced_ptrs_store, var))
2576 pointer_set_insert (ai->written_vars, tag);
2578 else
2580 /* The pointer has not been dereferenced. If it had a
2581 symbol memory tag, remove it and mark the old tag for
2582 renaming to remove it out of the IL. */
2583 tree tag = symbol_mem_tag (var);
2584 if (tag)
2586 mark_sym_for_renaming (tag);
2587 set_symbol_mem_tag (var, NULL_TREE);
2593 VEC_free (tree, heap, varvec);
2597 /* Determine whether to use .GLOBAL_VAR to model call clobbering
2598 semantics. If the function makes no references to global
2599 variables and contains at least one call to a non-pure function,
2600 then we need to mark the side-effects of the call using .GLOBAL_VAR
2601 to represent all possible global memory referenced by the callee. */
2603 static void
2604 maybe_create_global_var (void)
2606 /* No need to create it, if we have one already. */
2607 if (gimple_global_var (cfun) == NULL_TREE)
2609 struct mem_ref_stats_d *stats = gimple_mem_ref_stats (cfun);
2611 /* Create .GLOBAL_VAR if there are no call-clobbered
2612 variables and the program contains a mixture of pure/const
2613 and regular function calls. This is to avoid the problem
2614 described in PR 20115:
2616 int X;
2617 int func_pure (void) { return X; }
2618 int func_non_pure (int a) { X += a; }
2619 int foo ()
2621 int a = func_pure ();
2622 func_non_pure (a);
2623 a = func_pure ();
2624 return a;
2627 Since foo() has no call-clobbered variables, there is
2628 no relationship between the calls to func_pure and
2629 func_non_pure. Since func_pure has no side-effects, value
2630 numbering optimizations elide the second call to func_pure.
2631 So, if we have some pure/const and some regular calls in the
2632 program we create .GLOBAL_VAR to avoid missing these
2633 relations. */
2634 if (bitmap_empty_p (gimple_call_clobbered_vars (cfun))
2635 && stats->num_call_sites > 0
2636 && stats->num_pure_const_call_sites > 0
2637 && stats->num_call_sites > stats->num_pure_const_call_sites)
2638 create_global_var ();
2643 /* Return TRUE if pointer PTR may point to variable VAR.
2645 MEM_ALIAS_SET is the alias set for the memory location pointed-to by PTR
2646 This is needed because when checking for type conflicts we are
2647 interested in the alias set of the memory location pointed-to by
2648 PTR. The alias set of PTR itself is irrelevant.
2650 VAR_ALIAS_SET is the alias set for VAR. */
2652 static bool
2653 may_alias_p (tree ptr, alias_set_type mem_alias_set,
2654 tree var, alias_set_type var_alias_set,
2655 bool alias_set_only)
2657 tree mem;
2659 alias_stats.alias_queries++;
2660 alias_stats.simple_queries++;
2662 /* By convention, a variable cannot alias itself. */
2663 mem = symbol_mem_tag (ptr);
2664 if (mem == var)
2666 alias_stats.alias_noalias++;
2667 alias_stats.simple_resolved++;
2668 return false;
2671 /* If -fargument-noalias-global is > 2, pointer arguments may
2672 not point to anything else. */
2673 if (flag_argument_noalias > 2 && TREE_CODE (ptr) == PARM_DECL)
2675 alias_stats.alias_noalias++;
2676 alias_stats.simple_resolved++;
2677 return false;
2680 /* If -fargument-noalias-global is > 1, pointer arguments may
2681 not point to global variables. */
2682 if (flag_argument_noalias > 1 && is_global_var (var)
2683 && TREE_CODE (ptr) == PARM_DECL)
2685 alias_stats.alias_noalias++;
2686 alias_stats.simple_resolved++;
2687 return false;
2690 /* If either MEM or VAR is a read-only global and the other one
2691 isn't, then PTR cannot point to VAR. */
2692 if ((unmodifiable_var_p (mem) && !unmodifiable_var_p (var))
2693 || (unmodifiable_var_p (var) && !unmodifiable_var_p (mem)))
2695 alias_stats.alias_noalias++;
2696 alias_stats.simple_resolved++;
2697 return false;
2700 /* If the pointed to memory has alias set zero, or the pointer
2701 is ref-all, or the pointer decl is marked that no TBAA is to
2702 be applied, the MEM can alias VAR. */
2703 if (mem_alias_set == 0
2704 || DECL_POINTER_ALIAS_SET (ptr) == 0
2705 || TYPE_REF_CAN_ALIAS_ALL (TREE_TYPE (ptr))
2706 || DECL_NO_TBAA_P (ptr))
2708 alias_stats.alias_mayalias++;
2709 alias_stats.simple_resolved++;
2710 return true;
2713 gcc_assert (TREE_CODE (mem) == SYMBOL_MEMORY_TAG);
2715 alias_stats.tbaa_queries++;
2717 /* If the alias sets don't conflict then MEM cannot alias VAR. */
2718 if (mem_alias_set != var_alias_set
2719 && !alias_set_subset_of (mem_alias_set, var_alias_set))
2721 alias_stats.alias_noalias++;
2722 alias_stats.tbaa_resolved++;
2723 return false;
2726 /* If VAR is a record or union type, PTR cannot point into VAR
2727 unless there is some explicit address operation in the
2728 program that can reference a field of the type pointed-to by
2729 PTR. This also assumes that the types of both VAR and PTR
2730 are contained within the compilation unit, and that there is
2731 no fancy addressing arithmetic associated with any of the
2732 types involved. */
2733 if (mem_alias_set != 0 && var_alias_set != 0)
2735 tree ptr_type = TREE_TYPE (ptr);
2736 tree var_type = TREE_TYPE (var);
2738 /* The star count is -1 if the type at the end of the
2739 pointer_to chain is not a record or union type. */
2740 if (!alias_set_only
2741 && ipa_type_escape_star_count_of_interesting_type (var_type) >= 0)
2743 int ptr_star_count = 0;
2745 /* ipa_type_escape_star_count_of_interesting_type is a
2746 little too restrictive for the pointer type, need to
2747 allow pointers to primitive types as long as those
2748 types cannot be pointers to everything. */
2749 while (POINTER_TYPE_P (ptr_type))
2751 /* Strip the *s off. */
2752 ptr_type = TREE_TYPE (ptr_type);
2753 ptr_star_count++;
2756 /* There does not appear to be a better test to see if
2757 the pointer type was one of the pointer to everything
2758 types. */
2759 if (ptr_star_count > 0)
2761 alias_stats.structnoaddress_queries++;
2762 if (ipa_type_escape_field_does_not_clobber_p (var_type,
2763 TREE_TYPE (ptr)))
2765 alias_stats.structnoaddress_resolved++;
2766 alias_stats.alias_noalias++;
2767 return false;
2770 else if (ptr_star_count == 0)
2772 /* If PTR_TYPE was not really a pointer to type, it cannot
2773 alias. */
2774 alias_stats.structnoaddress_queries++;
2775 alias_stats.structnoaddress_resolved++;
2776 alias_stats.alias_noalias++;
2777 return false;
2782 alias_stats.alias_mayalias++;
2783 return true;
2787 /* Add ALIAS to the set of variables that may alias VAR. */
2789 static void
2790 add_may_alias (tree var, tree alias)
2792 /* Don't allow self-referential aliases. */
2793 gcc_assert (var != alias);
2795 /* ALIAS must be addressable if it's being added to an alias set. */
2796 #if 1
2797 TREE_ADDRESSABLE (alias) = 1;
2798 #else
2799 gcc_assert (may_be_aliased (alias));
2800 #endif
2802 /* VAR must be a symbol or a name tag. */
2803 gcc_assert (TREE_CODE (var) == SYMBOL_MEMORY_TAG
2804 || TREE_CODE (var) == NAME_MEMORY_TAG);
2806 if (MTAG_ALIASES (var) == NULL)
2807 MTAG_ALIASES (var) = BITMAP_ALLOC (&alias_bitmap_obstack);
2809 bitmap_set_bit (MTAG_ALIASES (var), DECL_UID (alias));
2813 /* Mark pointer PTR as pointing to an arbitrary memory location. */
2815 static void
2816 set_pt_anything (tree ptr)
2818 struct ptr_info_def *pi = get_ptr_info (ptr);
2820 pi->pt_anything = 1;
2821 /* Anything includes global memory. */
2822 pi->pt_global_mem = 1;
2823 pi->pt_vars = NULL;
2825 /* The pointer used to have a name tag, but we now found it pointing
2826 to an arbitrary location. The name tag needs to be renamed and
2827 disassociated from PTR. */
2828 if (pi->name_mem_tag)
2830 mark_sym_for_renaming (pi->name_mem_tag);
2831 pi->name_mem_tag = NULL_TREE;
2836 /* Return true if STMT is an "escape" site from the current function. Escape
2837 sites those statements which might expose the address of a variable
2838 outside the current function. STMT is an escape site iff:
2840 1- STMT is a function call, or
2841 2- STMT is an __asm__ expression, or
2842 3- STMT is an assignment to a non-local variable, or
2843 4- STMT is a return statement.
2845 Return the type of escape site found, if we found one, or NO_ESCAPE
2846 if none. */
2848 enum escape_type
2849 is_escape_site (tree stmt)
2851 tree call = get_call_expr_in (stmt);
2852 if (call != NULL_TREE)
2854 if (!TREE_SIDE_EFFECTS (call))
2855 return ESCAPE_TO_PURE_CONST;
2857 return ESCAPE_TO_CALL;
2859 else if (TREE_CODE (stmt) == ASM_EXPR)
2860 return ESCAPE_TO_ASM;
2861 else if (TREE_CODE (stmt) == GIMPLE_MODIFY_STMT)
2863 tree lhs = GIMPLE_STMT_OPERAND (stmt, 0);
2865 /* Get to the base of _REF nodes. */
2866 if (TREE_CODE (lhs) != SSA_NAME)
2867 lhs = get_base_address (lhs);
2869 /* If we couldn't recognize the LHS of the assignment, assume that it
2870 is a non-local store. */
2871 if (lhs == NULL_TREE)
2872 return ESCAPE_UNKNOWN;
2874 if (CONVERT_EXPR_P (GIMPLE_STMT_OPERAND (stmt, 1))
2875 || TREE_CODE (GIMPLE_STMT_OPERAND (stmt, 1)) == VIEW_CONVERT_EXPR)
2877 tree from
2878 = TREE_TYPE (TREE_OPERAND (GIMPLE_STMT_OPERAND (stmt, 1), 0));
2879 tree to = TREE_TYPE (GIMPLE_STMT_OPERAND (stmt, 1));
2881 /* If the RHS is a conversion between a pointer and an integer, the
2882 pointer escapes since we can't track the integer. */
2883 if (POINTER_TYPE_P (from) && !POINTER_TYPE_P (to))
2884 return ESCAPE_BAD_CAST;
2887 /* If the LHS is an SSA name, it can't possibly represent a non-local
2888 memory store. */
2889 if (TREE_CODE (lhs) == SSA_NAME)
2890 return NO_ESCAPE;
2892 /* FIXME: LHS is not an SSA_NAME. Even if it's an assignment to a
2893 local variables we cannot be sure if it will escape, because we
2894 don't have information about objects not in SSA form. Need to
2895 implement something along the lines of
2897 J.-D. Choi, M. Gupta, M. J. Serrano, V. C. Sreedhar, and S. P.
2898 Midkiff, ``Escape analysis for java,'' in Proceedings of the
2899 Conference on Object-Oriented Programming Systems, Languages, and
2900 Applications (OOPSLA), pp. 1-19, 1999. */
2901 return ESCAPE_STORED_IN_GLOBAL;
2903 else if (TREE_CODE (stmt) == RETURN_EXPR)
2904 return ESCAPE_TO_RETURN;
2906 return NO_ESCAPE;
2909 /* Create a new memory tag of type TYPE.
2910 Does NOT push it into the current binding. */
2912 tree
2913 create_tag_raw (enum tree_code code, tree type, const char *prefix)
2915 tree tmp_var;
2917 tmp_var = build_decl (code, create_tmp_var_name (prefix), type);
2919 /* Memory tags are always writable and non-static. */
2920 TREE_READONLY (tmp_var) = 0;
2921 TREE_STATIC (tmp_var) = 0;
2923 /* It doesn't start out global. */
2924 MTAG_GLOBAL (tmp_var) = 0;
2925 TREE_USED (tmp_var) = 1;
2927 return tmp_var;
2930 /* Create a new memory tag of type TYPE. If IS_TYPE_TAG is true, the tag
2931 is considered to represent all the pointers whose pointed-to types are
2932 in the same alias set class. Otherwise, the tag represents a single
2933 SSA_NAME pointer variable. */
2935 static tree
2936 create_memory_tag (tree type, bool is_type_tag)
2938 tree tag = create_tag_raw (is_type_tag ? SYMBOL_MEMORY_TAG : NAME_MEMORY_TAG,
2939 type, (is_type_tag) ? "SMT" : "NMT");
2941 /* By default, memory tags are local variables. Alias analysis will
2942 determine whether they should be considered globals. */
2943 DECL_CONTEXT (tag) = current_function_decl;
2945 /* Memory tags are by definition addressable. */
2946 TREE_ADDRESSABLE (tag) = 1;
2948 set_symbol_mem_tag (tag, NULL_TREE);
2950 /* Add the tag to the symbol table. */
2951 add_referenced_var (tag);
2953 return tag;
2957 /* Create a name memory tag to represent a specific SSA_NAME pointer P_i.
2958 This is used if P_i has been found to point to a specific set of
2959 variables or to a non-aliased memory location like the address returned
2960 by malloc functions. */
2962 static tree
2963 get_nmt_for (tree ptr)
2965 struct ptr_info_def *pi = get_ptr_info (ptr);
2966 tree tag = pi->name_mem_tag;
2968 if (tag == NULL_TREE)
2969 tag = create_memory_tag (TREE_TYPE (TREE_TYPE (ptr)), false);
2970 return tag;
2974 /* Return the symbol memory tag associated to pointer PTR. A memory
2975 tag is an artificial variable that represents the memory location
2976 pointed-to by PTR. It is used to model the effects of pointer
2977 de-references on addressable variables.
2979 AI points to the data gathered during alias analysis. This
2980 function populates the array AI->POINTERS. */
2982 static tree
2983 get_smt_for (tree ptr, struct alias_info *ai)
2985 size_t i;
2986 tree tag;
2987 tree tag_type = TREE_TYPE (TREE_TYPE (ptr));
2988 alias_set_type tag_set = get_alias_set (tag_type);
2990 /* To avoid creating unnecessary memory tags, only create one memory tag
2991 per alias set class. Note that it may be tempting to group
2992 memory tags based on conflicting alias sets instead of
2993 equivalence. That would be wrong because alias sets are not
2994 necessarily transitive (as demonstrated by the libstdc++ test
2995 23_containers/vector/cons/4.cc). Given three alias sets A, B, C
2996 such that conflicts (A, B) == true and conflicts (A, C) == true,
2997 it does not necessarily follow that conflicts (B, C) == true. */
2998 for (i = 0, tag = NULL_TREE; i < ai->num_pointers; i++)
3000 struct alias_map_d *curr = ai->pointers[i];
3001 tree curr_tag = symbol_mem_tag (curr->var);
3002 if (tag_set == curr->set)
3004 tag = curr_tag;
3005 break;
3009 /* If VAR cannot alias with any of the existing memory tags, create a new
3010 tag for PTR and add it to the POINTERS array. */
3011 if (tag == NULL_TREE)
3013 struct alias_map_d *alias_map;
3015 /* If PTR did not have a symbol tag already, create a new SMT.*
3016 artificial variable representing the memory location
3017 pointed-to by PTR. */
3018 tag = symbol_mem_tag (ptr);
3019 if (tag == NULL_TREE)
3020 tag = create_memory_tag (tag_type, true);
3022 /* Add PTR to the POINTERS array. Note that we are not interested in
3023 PTR's alias set. Instead, we cache the alias set for the memory that
3024 PTR points to. */
3025 alias_map = XCNEW (struct alias_map_d);
3026 alias_map->var = ptr;
3027 alias_map->set = tag_set;
3028 ai->pointers[ai->num_pointers++] = alias_map;
3031 /* If the pointed-to type is volatile, so is the tag. */
3032 TREE_THIS_VOLATILE (tag) |= TREE_THIS_VOLATILE (tag_type);
3034 /* Make sure that the symbol tag has the same alias set as the
3035 pointed-to type or at least accesses through the pointer will
3036 alias that set. The latter can happen after the vectorizer
3037 created pointers of vector type. */
3038 gcc_assert (tag_set == get_alias_set (tag)
3039 || alias_set_subset_of (tag_set, get_alias_set (tag)));
3041 return tag;
3045 /* Create GLOBAL_VAR, an artificial global variable to act as a
3046 representative of all the variables that may be clobbered by function
3047 calls. */
3049 static void
3050 create_global_var (void)
3052 tree global_var = build_decl (VAR_DECL, get_identifier (".GLOBAL_VAR"),
3053 void_type_node);
3054 DECL_ARTIFICIAL (global_var) = 1;
3055 TREE_READONLY (global_var) = 0;
3056 DECL_EXTERNAL (global_var) = 1;
3057 TREE_STATIC (global_var) = 1;
3058 TREE_USED (global_var) = 1;
3059 DECL_CONTEXT (global_var) = NULL_TREE;
3060 TREE_THIS_VOLATILE (global_var) = 0;
3061 TREE_ADDRESSABLE (global_var) = 0;
3063 create_var_ann (global_var);
3064 mark_call_clobbered (global_var, ESCAPE_UNKNOWN);
3065 add_referenced_var (global_var);
3066 mark_sym_for_renaming (global_var);
3067 cfun->gimple_df->global_var = global_var;
3071 /* Dump alias statistics on FILE. */
3073 static void
3074 dump_alias_stats (FILE *file)
3076 const char *funcname
3077 = lang_hooks.decl_printable_name (current_function_decl, 2);
3078 fprintf (file, "\nAlias statistics for %s\n\n", funcname);
3079 fprintf (file, "Total alias queries:\t%u\n", alias_stats.alias_queries);
3080 fprintf (file, "Total alias mayalias results:\t%u\n",
3081 alias_stats.alias_mayalias);
3082 fprintf (file, "Total alias noalias results:\t%u\n",
3083 alias_stats.alias_noalias);
3084 fprintf (file, "Total simple queries:\t%u\n",
3085 alias_stats.simple_queries);
3086 fprintf (file, "Total simple resolved:\t%u\n",
3087 alias_stats.simple_resolved);
3088 fprintf (file, "Total TBAA queries:\t%u\n",
3089 alias_stats.tbaa_queries);
3090 fprintf (file, "Total TBAA resolved:\t%u\n",
3091 alias_stats.tbaa_resolved);
3092 fprintf (file, "Total non-addressable structure type queries:\t%u\n",
3093 alias_stats.structnoaddress_queries);
3094 fprintf (file, "Total non-addressable structure type resolved:\t%u\n",
3095 alias_stats.structnoaddress_resolved);
3099 /* Dump alias information on FILE. */
3101 void
3102 dump_alias_info (FILE *file)
3104 size_t i;
3105 const char *funcname
3106 = lang_hooks.decl_printable_name (current_function_decl, 2);
3107 referenced_var_iterator rvi;
3108 tree var;
3110 fprintf (file, "\nAlias information for %s\n\n", funcname);
3112 dump_memory_partitions (file);
3114 fprintf (file, "\nFlow-insensitive alias information for %s\n\n", funcname);
3116 fprintf (file, "Aliased symbols\n\n");
3118 FOR_EACH_REFERENCED_VAR (var, rvi)
3120 if (may_be_aliased (var))
3121 dump_variable (file, var);
3124 fprintf (file, "\nDereferenced pointers\n\n");
3126 FOR_EACH_REFERENCED_VAR (var, rvi)
3127 if (symbol_mem_tag (var))
3128 dump_variable (file, var);
3130 fprintf (file, "\nSymbol memory tags\n\n");
3132 FOR_EACH_REFERENCED_VAR (var, rvi)
3134 if (TREE_CODE (var) == SYMBOL_MEMORY_TAG)
3135 dump_variable (file, var);
3138 fprintf (file, "\n\nFlow-sensitive alias information for %s\n\n", funcname);
3140 fprintf (file, "SSA_NAME pointers\n\n");
3141 for (i = 1; i < num_ssa_names; i++)
3143 tree ptr = ssa_name (i);
3144 struct ptr_info_def *pi;
3146 if (ptr == NULL_TREE)
3147 continue;
3149 pi = SSA_NAME_PTR_INFO (ptr);
3150 if (!SSA_NAME_IN_FREE_LIST (ptr)
3151 && pi
3152 && pi->name_mem_tag)
3153 dump_points_to_info_for (file, ptr);
3156 fprintf (file, "\nName memory tags\n\n");
3158 FOR_EACH_REFERENCED_VAR (var, rvi)
3160 if (TREE_CODE (var) == NAME_MEMORY_TAG)
3161 dump_variable (file, var);
3164 fprintf (file, "\n");
/* Debugging helper: write the alias information of the current
   function to stderr by way of dump_alias_info.  */

void
debug_alias_info (void)
{
  FILE *out = stderr;

  dump_alias_info (out);
}
3177 /* Return the alias information associated with pointer T. It creates a
3178 new instance if none existed. */
3180 struct ptr_info_def *
3181 get_ptr_info (tree t)
3183 struct ptr_info_def *pi;
3185 gcc_assert (POINTER_TYPE_P (TREE_TYPE (t)));
3187 pi = SSA_NAME_PTR_INFO (t);
3188 if (pi == NULL)
3190 pi = GGC_CNEW (struct ptr_info_def);
3191 SSA_NAME_PTR_INFO (t) = pi;
3194 return pi;
3198 /* Dump points-to information for SSA_NAME PTR into FILE. */
3200 void
3201 dump_points_to_info_for (FILE *file, tree ptr)
3203 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (ptr);
3205 print_generic_expr (file, ptr, dump_flags);
3207 if (pi)
3209 if (pi->name_mem_tag)
3211 fprintf (file, ", name memory tag: ");
3212 print_generic_expr (file, pi->name_mem_tag, dump_flags);
3215 if (pi->is_dereferenced)
3216 fprintf (file, ", is dereferenced");
3218 if (pi->value_escapes_p)
3219 fprintf (file, ", its value escapes");
3221 if (pi->pt_anything)
3222 fprintf (file, ", points-to anything");
3224 if (pi->pt_null)
3225 fprintf (file, ", points-to NULL");
3227 if (pi->pt_vars)
3229 fprintf (file, ", points-to vars: ");
3230 dump_decl_set (file, pi->pt_vars);
3234 fprintf (file, "\n");
3238 /* Dump points-to information for VAR into stderr. */
3240 void
3241 debug_points_to_info_for (tree var)
3243 dump_points_to_info_for (stderr, var);
3247 /* Dump points-to information into FILE. NOTE: This function is slow, as
3248 it needs to traverse the whole CFG looking for pointer SSA_NAMEs. */
3250 void
3251 dump_points_to_info (FILE *file)
3253 basic_block bb;
3254 block_stmt_iterator si;
3255 ssa_op_iter iter;
3256 const char *fname =
3257 lang_hooks.decl_printable_name (current_function_decl, 2);
3258 referenced_var_iterator rvi;
3259 tree var;
3261 fprintf (file, "\n\nPointed-to sets for pointers in %s\n\n", fname);
3263 /* First dump points-to information for the default definitions of
3264 pointer variables. This is necessary because default definitions are
3265 not part of the code. */
3266 FOR_EACH_REFERENCED_VAR (var, rvi)
3268 if (POINTER_TYPE_P (TREE_TYPE (var)))
3270 tree def = gimple_default_def (cfun, var);
3271 if (def)
3272 dump_points_to_info_for (file, def);
3276 /* Dump points-to information for every pointer defined in the program. */
3277 FOR_EACH_BB (bb)
3279 tree phi;
3281 for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
3283 tree ptr = PHI_RESULT (phi);
3284 if (POINTER_TYPE_P (TREE_TYPE (ptr)))
3285 dump_points_to_info_for (file, ptr);
3288 for (si = bsi_start (bb); !bsi_end_p (si); bsi_next (&si))
3290 tree stmt = bsi_stmt (si);
3291 tree def;
3292 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_DEF)
3293 if (TREE_CODE (def) == SSA_NAME
3294 && POINTER_TYPE_P (TREE_TYPE (def)))
3295 dump_points_to_info_for (file, def);
3299 fprintf (file, "\n");
/* Debugging helper: write the points-to information of the current
   function to stderr by way of dump_points_to_info.  */

void
debug_points_to_info (void)
{
  FILE *out = stderr;

  dump_points_to_info (out);
}
3311 /* Dump to FILE the list of variables that may be aliasing VAR. */
3313 void
3314 dump_may_aliases_for (FILE *file, tree var)
3316 bitmap aliases;
3318 aliases = MTAG_ALIASES (var);
3319 if (aliases)
3321 bitmap_iterator bi;
3322 unsigned int i;
3323 tree al;
3325 fprintf (file, "{ ");
3326 EXECUTE_IF_SET_IN_BITMAP (aliases, 0, i, bi)
3328 al = referenced_var (i);
3329 print_generic_expr (file, al, dump_flags);
3330 fprintf (file, " ");
3332 fprintf (file, "}");
3337 /* Dump to stderr the list of variables that may be aliasing VAR. */
3339 void
3340 debug_may_aliases_for (tree var)
3342 dump_may_aliases_for (stderr, var);
3346 /* Return true if VAR may be aliased. */
3348 bool
3349 may_be_aliased (tree var)
3351 /* Obviously. */
3352 if (TREE_ADDRESSABLE (var))
3353 return true;
3355 /* Globally visible variables can have their addresses taken by other
3356 translation units. */
3357 if (MTAG_P (var)
3358 && MTAG_GLOBAL (var))
3359 return true;
3360 else if (!MTAG_P (var)
3361 && (DECL_EXTERNAL (var) || TREE_PUBLIC (var)))
3362 return true;
3364 /* Automatic variables can't have their addresses escape any other
3365 way. This must be after the check for global variables, as
3366 extern declarations do not have TREE_STATIC set. */
3367 if (!TREE_STATIC (var))
3368 return false;
3370 /* If we're in unit-at-a-time mode, then we must have seen all
3371 occurrences of address-of operators, and so we can trust
3372 TREE_ADDRESSABLE. Otherwise we can only be sure the variable
3373 isn't addressable if it's local to the current function. */
3374 if (flag_unit_at_a_time)
3375 return false;
3377 if (decl_function_context (var) == current_function_decl)
3378 return false;
3380 return true;
3383 /* The following is based on code in add_stmt_operand to ensure that the
3384 same defs/uses/vdefs/vuses will be found after replacing a reference
3385 to var (or ARRAY_REF to var) with an INDIRECT_REF to ptr whose value
3386 is the address of var. Return a memtag for the ptr, after adding the
3387 proper may_aliases to it (which are the aliases of var, if it has any,
3388 or var itself). */
3390 static tree
3391 add_may_alias_for_new_tag (tree tag, tree var)
3393 bitmap aliases = NULL;
3395 if (MTAG_P (var))
3396 aliases = may_aliases (var);
3398 /* Case 1: |aliases| == 1 */
3399 if (aliases
3400 && bitmap_single_bit_set_p (aliases))
3402 tree ali = referenced_var (bitmap_first_set_bit (aliases));
3403 if (TREE_CODE (ali) == SYMBOL_MEMORY_TAG)
3404 return ali;
3407 /* Case 2: |aliases| == 0 */
3408 if (aliases == NULL)
3409 add_may_alias (tag, var);
3410 else
3412 /* Case 3: |aliases| > 1 */
3413 union_alias_set_into (tag, aliases);
3415 return tag;
3418 /* Create a new symbol tag for PTR. Construct the may-alias list of
3419 this type tag so that it has the aliasing of VAR according to the
3420 location accessed by EXPR.
3422 Note, the set of aliases represented by the new symbol tag are not
3423 marked for renaming. */
3425 void
3426 new_type_alias (tree ptr, tree var, tree expr)
3428 tree tag_type = TREE_TYPE (TREE_TYPE (ptr));
3429 tree tag;
3430 tree ali = NULL_TREE;
3431 HOST_WIDE_INT offset, size, maxsize;
3432 tree ref;
3434 gcc_assert (symbol_mem_tag (ptr) == NULL_TREE);
3435 gcc_assert (!MTAG_P (var));
3437 ref = get_ref_base_and_extent (expr, &offset, &size, &maxsize);
3438 gcc_assert (ref);
3440 tag = create_memory_tag (tag_type, true);
3441 set_symbol_mem_tag (ptr, tag);
3443 ali = add_may_alias_for_new_tag (tag, var);
3445 set_symbol_mem_tag (ptr, ali);
3446 MTAG_GLOBAL (tag) = is_global_var (var);
3450 /* Reset the call_clobbered flags on our referenced vars. In
3451 theory, this only needs to be done for globals. */
3453 static unsigned int
3454 reset_cc_flags (void)
3456 tree var;
3457 referenced_var_iterator rvi;
3459 FOR_EACH_REFERENCED_VAR (var, rvi)
3460 var_ann (var)->call_clobbered = false;
3461 return 0;
3464 struct gimple_opt_pass pass_reset_cc_flags =
3467 GIMPLE_PASS,
3468 NULL, /* name */
3469 NULL, /* gate */
3470 reset_cc_flags, /* execute */
3471 NULL, /* sub */
3472 NULL, /* next */
3473 0, /* static_pass_number */
3474 0, /* tv_id */
3475 PROP_referenced_vars |PROP_cfg, /* properties_required */
3476 0, /* properties_provided */
3477 0, /* properties_destroyed */
3478 0, /* todo_flags_start */
3479 0 /* todo_flags_finish */
3484 /* A dummy pass to cause aliases to be computed via TODO_rebuild_alias. */
3486 struct gimple_opt_pass pass_build_alias =
3489 GIMPLE_PASS,
3490 "alias", /* name */
3491 NULL, /* gate */
3492 NULL, /* execute */
3493 NULL, /* sub */
3494 NULL, /* next */
3495 0, /* static_pass_number */
3496 0, /* tv_id */
3497 PROP_cfg | PROP_ssa, /* properties_required */
3498 PROP_alias, /* properties_provided */
3499 0, /* properties_destroyed */
3500 0, /* todo_flags_start */
3501 TODO_rebuild_alias | TODO_dump_func /* todo_flags_finish */