Daily bump.
[official-gcc.git] / gcc / alias.c
blob7a36284cb3af36c02cbb7c49942ed55d295242e0
1 /* Alias analysis for GNU C
2 Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006
3 Free Software Foundation, Inc.
4 Contributed by John Carr (jfc@mit.edu).
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 2, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 #include "config.h"
24 #include "system.h"
25 #include "coretypes.h"
26 #include "tm.h"
27 #include "rtl.h"
28 #include "tree.h"
29 #include "tm_p.h"
30 #include "function.h"
31 #include "alias.h"
32 #include "emit-rtl.h"
33 #include "regs.h"
34 #include "hard-reg-set.h"
35 #include "basic-block.h"
36 #include "flags.h"
37 #include "output.h"
38 #include "toplev.h"
39 #include "cselib.h"
40 #include "splay-tree.h"
41 #include "ggc.h"
42 #include "langhooks.h"
43 #include "timevar.h"
44 #include "target.h"
45 #include "cgraph.h"
46 #include "varray.h"
47 #include "tree-pass.h"
48 #include "ipa-type-escape.h"
50 /* The aliasing API provided here solves related but different problems:
52 Say there exists (in c)
54 struct X {
55 struct Y y1;
56 struct Z z2;
57 } x1, *px1, *px2;
59 struct Y y2, *py;
60 struct Z z2, *pz;
63 py = &px1.y1;
64 px2 = &x1;
   Consider the four questions:

   Can a store to x1 interfere with px2->y1?
   Can a store to x1 interfere with px2->z2?
   (*px2).z2
   Can a store to x1 change the value pointed to by py?
   Can a store to x1 change the value pointed to by pz?

   The answers to these questions can be yes, yes, yes, and maybe.
76 The first two questions can be answered with a simple examination
77 of the type system. If structure X contains a field of type Y then
78 a store thru a pointer to an X can overwrite any field that is
79 contained (recursively) in an X (unless we know that px1 != px2).
   The last two of the questions can be solved in the same way as the
   first two questions but this is too conservative.  The observation
   is that in some cases we can determine by analysis which (if any)
   fields are addressed and whether those addresses are used in bad
   ways.  This analysis may be language specific.  In C, arbitrary
   operations may be applied to pointers.  However, there is some
   indication that this may be too conservative for some C++ types.
89 The pass ipa-type-escape does this analysis for the types whose
90 instances do not escape across the compilation boundary.
   Historically in GCC, these two problems were combined and a single
   data structure was used to represent the solution to these
   problems.  We now have two similar but different data structures.
   The data structure to solve the last two questions is similar to the
   first, but does not contain the fields whose addresses are never
   taken.  For types that do escape the compilation unit, the data
   structures will have identical information.
*/
101 /* The alias sets assigned to MEMs assist the back-end in determining
102 which MEMs can alias which other MEMs. In general, two MEMs in
103 different alias sets cannot alias each other, with one important
104 exception. Consider something like:
106 struct S { int i; double d; };
108 a store to an `S' can alias something of either type `int' or type
109 `double'. (However, a store to an `int' cannot alias a `double'
110 and vice versa.) We indicate this via a tree structure that looks
111 like:
                struct S
                  /   \
                 /     \
               |/_     _\|
               int    double
118 (The arrows are directed and point downwards.)
119 In this situation we say the alias set for `struct S' is the
120 `superset' and that those for `int' and `double' are `subsets'.
122 To see whether two alias sets can point to the same memory, we must
123 see if either alias set is a subset of the other. We need not trace
124 past immediate descendants, however, since we propagate all
125 grandchildren up one level.
   Alias set zero is implicitly a superset of all other alias sets.
   However, there is no actual entry for alias set zero.  It is an
   error to attempt to explicitly construct a subset of zero.  */
131 struct alias_set_entry GTY(())
133 /* The alias set number, as stored in MEM_ALIAS_SET. */
134 HOST_WIDE_INT alias_set;
136 /* The children of the alias set. These are not just the immediate
137 children, but, in fact, all descendants. So, if we have:
139 struct T { struct S s; float f; }
141 continuing our example above, the children here will be all of
142 `int', `double', `float', and `struct S'. */
143 splay_tree GTY((param1_is (int), param2_is (int))) children;
145 /* Nonzero if would have a child of zero: this effectively makes this
146 alias set the same as alias set zero. */
147 int has_zero_child;
149 typedef struct alias_set_entry *alias_set_entry;
151 static int rtx_equal_for_memref_p (rtx, rtx);
152 static rtx find_symbolic_term (rtx);
153 static int memrefs_conflict_p (int, rtx, int, rtx, HOST_WIDE_INT);
154 static void record_set (rtx, rtx, void *);
155 static int base_alias_check (rtx, rtx, enum machine_mode,
156 enum machine_mode);
157 static rtx find_base_value (rtx);
158 static int mems_in_disjoint_alias_sets_p (rtx, rtx);
159 static int insert_subset_children (splay_tree_node, void*);
160 static tree find_base_decl (tree);
161 static alias_set_entry get_alias_set_entry (HOST_WIDE_INT);
162 static rtx fixed_scalar_and_varying_struct_p (rtx, rtx, rtx, rtx,
163 int (*) (rtx, int));
164 static int aliases_everything_p (rtx);
165 static bool nonoverlapping_component_refs_p (tree, tree);
166 static tree decl_for_component_ref (tree);
167 static rtx adjust_offset_for_component_ref (tree, rtx);
168 static int nonoverlapping_memrefs_p (rtx, rtx);
169 static int write_dependence_p (rtx, rtx, int);
171 static void memory_modified_1 (rtx, rtx, void *);
172 static void record_alias_subset (HOST_WIDE_INT, HOST_WIDE_INT);
174 /* Set up all info needed to perform alias analysis on memory references. */
/* Size, in bytes, of the machine mode of X.  */
#define SIZE_FOR_MODE(X) (GET_MODE_SIZE (GET_MODE (X)))

/* Nonzero when MEM1 and MEM2 do not alias because they belong to
   different alias sets.  The macro simply forwards to
   mems_in_disjoint_alias_sets_p.
   NOTE(review): the previous comment said alias sets are ignored in
   functions that use variable arguments (because the va_arg macros on
   some systems are not legal ANSI C); nothing in this expansion does
   that -- confirm whether that remark is still relevant.  */
#define DIFFERENT_ALIAS_SETS_P(MEM1, MEM2)	\
  mems_in_disjoint_alias_sets_p (MEM1, MEM2)

/* Upper bound on the number of passes made over the insns while
   propagating alias information through set chains.  The value 10 is
   a completely arbitrary choice.  */
#define MAX_ALIAS_LOOP_PASSES 10
190 /* reg_base_value[N] gives an address to which register N is related.
191 If all sets after the first add or subtract to the current value
192 or otherwise modify it so it does not point to a different top level
193 object, reg_base_value[N] is equal to the address part of the source
194 of the first set.
196 A base address can be an ADDRESS, SYMBOL_REF, or LABEL_REF. ADDRESS
197 expressions represent certain special values: function arguments and
198 the stack, frame, and argument pointers.
200 The contents of an ADDRESS is not normally used, the mode of the
201 ADDRESS determines whether the ADDRESS is a function argument or some
202 other special value. Pointer equality, not rtx_equal_p, determines whether
203 two ADDRESS expressions refer to the same base address.
205 The only use of the contents of an ADDRESS is for determining if the
206 current function performs nonlocal memory memory references for the
207 purposes of marking the function as a constant function. */
209 static GTY(()) VEC(rtx,gc) *reg_base_value;
210 static rtx *new_reg_base_value;
212 /* We preserve the copy of old array around to avoid amount of garbage
213 produced. About 8% of garbage produced were attributed to this
214 array. */
215 static GTY((deletable)) VEC(rtx,gc) *old_reg_base_value;
217 /* Static hunks of RTL used by the aliasing code; these are initialized
218 once per function to avoid unnecessary RTL allocations. */
219 static GTY (()) rtx static_reg_base_value[FIRST_PSEUDO_REGISTER];
221 #define REG_BASE_VALUE(X) \
222 (REGNO (X) < VEC_length (rtx, reg_base_value) \
223 ? VEC_index (rtx, reg_base_value, REGNO (X)) : 0)
225 /* Vector indexed by N giving the initial (unchanging) value known for
226 pseudo-register N. This array is initialized in init_alias_analysis,
227 and does not change until end_alias_analysis is called. */
228 static GTY((length("reg_known_value_size"))) rtx *reg_known_value;
230 /* Indicates number of valid entries in reg_known_value. */
231 static GTY(()) unsigned int reg_known_value_size;
233 /* Vector recording for each reg_known_value whether it is due to a
234 REG_EQUIV note. Future passes (viz., reload) may replace the
235 pseudo with the equivalent expression and so we account for the
236 dependences that would be introduced if that happens.
238 The REG_EQUIV notes created in assign_parms may mention the arg
239 pointer, and there are explicit insns in the RTL that modify the
240 arg pointer. Thus we must ensure that such insns don't get
241 scheduled across each other because that would invalidate the
242 REG_EQUIV notes. One could argue that the REG_EQUIV notes are
243 wrong, but solving the problem in the scheduler will likely give
244 better code, so we do it here. */
245 static bool *reg_known_equiv_p;
247 /* True when scanning insns from the start of the rtl to the
248 NOTE_INSN_FUNCTION_BEG note. */
249 static bool copying_arguments;
251 DEF_VEC_P(alias_set_entry);
252 DEF_VEC_ALLOC_P(alias_set_entry,gc);
254 /* The splay-tree used to store the various alias set entries. */
255 static GTY (()) VEC(alias_set_entry,gc) *alias_sets;
257 /* Returns a pointer to the alias set entry for ALIAS_SET, if there is
258 such an entry, or NULL otherwise. */
260 static inline alias_set_entry
261 get_alias_set_entry (HOST_WIDE_INT alias_set)
263 return VEC_index (alias_set_entry, alias_sets, alias_set);
266 /* Returns nonzero if the alias sets for MEM1 and MEM2 are such that
267 the two MEMs cannot alias each other. */
269 static inline int
270 mems_in_disjoint_alias_sets_p (rtx mem1, rtx mem2)
272 /* Perform a basic sanity check. Namely, that there are no alias sets
273 if we're not using strict aliasing. This helps to catch bugs
274 whereby someone uses PUT_CODE, but doesn't clear MEM_ALIAS_SET, or
275 where a MEM is allocated in some way other than by the use of
276 gen_rtx_MEM, and the MEM_ALIAS_SET is not cleared. If we begin to
277 use alias sets to indicate that spilled registers cannot alias each
278 other, we might need to remove this check. */
279 gcc_assert (flag_strict_aliasing
280 || (!MEM_ALIAS_SET (mem1) && !MEM_ALIAS_SET (mem2)));
282 return ! alias_sets_conflict_p (MEM_ALIAS_SET (mem1), MEM_ALIAS_SET (mem2));
285 /* Insert the NODE into the splay tree given by DATA. Used by
286 record_alias_subset via splay_tree_foreach. */
288 static int
289 insert_subset_children (splay_tree_node node, void *data)
291 splay_tree_insert ((splay_tree) data, node->key, node->value);
293 return 0;
296 /* Return 1 if the two specified alias sets may conflict. */
299 alias_sets_conflict_p (HOST_WIDE_INT set1, HOST_WIDE_INT set2)
301 alias_set_entry ase;
303 /* If have no alias set information for one of the operands, we have
304 to assume it can alias anything. */
305 if (set1 == 0 || set2 == 0
306 /* If the two alias sets are the same, they may alias. */
307 || set1 == set2)
308 return 1;
310 /* See if the first alias set is a subset of the second. */
311 ase = get_alias_set_entry (set1);
312 if (ase != 0
313 && (ase->has_zero_child
314 || splay_tree_lookup (ase->children,
315 (splay_tree_key) set2)))
316 return 1;
318 /* Now do the same, but with the alias sets reversed. */
319 ase = get_alias_set_entry (set2);
320 if (ase != 0
321 && (ase->has_zero_child
322 || splay_tree_lookup (ase->children,
323 (splay_tree_key) set1)))
324 return 1;
326 /* The two alias sets are distinct and neither one is the
327 child of the other. Therefore, they cannot alias. */
328 return 0;
331 /* Return 1 if the two specified alias sets might conflict, or if any subtype
332 of these alias sets might conflict. */
335 alias_sets_might_conflict_p (HOST_WIDE_INT set1, HOST_WIDE_INT set2)
337 if (set1 == 0 || set2 == 0 || set1 == set2)
338 return 1;
340 return 0;
344 /* Return 1 if any MEM object of type T1 will always conflict (using the
345 dependency routines in this file) with any MEM object of type T2.
346 This is used when allocating temporary storage. If T1 and/or T2 are
347 NULL_TREE, it means we know nothing about the storage. */
350 objects_must_conflict_p (tree t1, tree t2)
352 HOST_WIDE_INT set1, set2;
354 /* If neither has a type specified, we don't know if they'll conflict
355 because we may be using them to store objects of various types, for
356 example the argument and local variables areas of inlined functions. */
357 if (t1 == 0 && t2 == 0)
358 return 0;
360 /* If they are the same type, they must conflict. */
361 if (t1 == t2
362 /* Likewise if both are volatile. */
363 || (t1 != 0 && TYPE_VOLATILE (t1) && t2 != 0 && TYPE_VOLATILE (t2)))
364 return 1;
366 set1 = t1 ? get_alias_set (t1) : 0;
367 set2 = t2 ? get_alias_set (t2) : 0;
369 /* Otherwise they conflict if they have no alias set or the same. We
370 can't simply use alias_sets_conflict_p here, because we must make
371 sure that every subtype of t1 will conflict with every subtype of
372 t2 for which a pair of subobjects of these respective subtypes
373 overlaps on the stack. */
374 return set1 == 0 || set2 == 0 || set1 == set2;
377 /* T is an expression with pointer type. Find the DECL on which this
378 expression is based. (For example, in `a[i]' this would be `a'.)
379 If there is no such DECL, or a unique decl cannot be determined,
380 NULL_TREE is returned. */
382 static tree
383 find_base_decl (tree t)
385 tree d0, d1;
387 if (t == 0 || t == error_mark_node || ! POINTER_TYPE_P (TREE_TYPE (t)))
388 return 0;
390 /* If this is a declaration, return it. If T is based on a restrict
391 qualified decl, return that decl. */
392 if (DECL_P (t))
394 if (TREE_CODE (t) == VAR_DECL && DECL_BASED_ON_RESTRICT_P (t))
395 t = DECL_GET_RESTRICT_BASE (t);
396 return t;
399 /* Handle general expressions. It would be nice to deal with
400 COMPONENT_REFs here. If we could tell that `a' and `b' were the
401 same, then `a->f' and `b->f' are also the same. */
402 switch (TREE_CODE_CLASS (TREE_CODE (t)))
404 case tcc_unary:
405 return find_base_decl (TREE_OPERAND (t, 0));
407 case tcc_binary:
408 /* Return 0 if found in neither or both are the same. */
409 d0 = find_base_decl (TREE_OPERAND (t, 0));
410 d1 = find_base_decl (TREE_OPERAND (t, 1));
411 if (d0 == d1)
412 return d0;
413 else if (d0 == 0)
414 return d1;
415 else if (d1 == 0)
416 return d0;
417 else
418 return 0;
420 default:
421 return 0;
425 /* Return true if all nested component references handled by
426 get_inner_reference in T are such that we should use the alias set
427 provided by the object at the heart of T.
429 This is true for non-addressable components (which don't have their
430 own alias set), as well as components of objects in alias set zero.
431 This later point is a special case wherein we wish to override the
432 alias set used by the component, but we don't have per-FIELD_DECL
433 assignable alias sets. */
435 bool
436 component_uses_parent_alias_set (tree t)
438 while (1)
440 /* If we're at the end, it vacuously uses its own alias set. */
441 if (!handled_component_p (t))
442 return false;
444 switch (TREE_CODE (t))
446 case COMPONENT_REF:
447 if (DECL_NONADDRESSABLE_P (TREE_OPERAND (t, 1)))
448 return true;
449 break;
451 case ARRAY_REF:
452 case ARRAY_RANGE_REF:
453 if (TYPE_NONALIASED_COMPONENT (TREE_TYPE (TREE_OPERAND (t, 0))))
454 return true;
455 break;
457 case REALPART_EXPR:
458 case IMAGPART_EXPR:
459 break;
461 default:
462 /* Bitfields and casts are never addressable. */
463 return true;
466 t = TREE_OPERAND (t, 0);
467 if (get_alias_set (TREE_TYPE (t)) == 0)
468 return true;
472 /* Return the alias set for T, which may be either a type or an
473 expression. Call language-specific routine for help, if needed. */
475 HOST_WIDE_INT
476 get_alias_set (tree t)
478 HOST_WIDE_INT set;
480 /* If we're not doing any alias analysis, just assume everything
481 aliases everything else. Also return 0 if this or its type is
482 an error. */
483 if (! flag_strict_aliasing || t == error_mark_node
484 || (! TYPE_P (t)
485 && (TREE_TYPE (t) == 0 || TREE_TYPE (t) == error_mark_node)))
486 return 0;
488 /* We can be passed either an expression or a type. This and the
489 language-specific routine may make mutually-recursive calls to each other
490 to figure out what to do. At each juncture, we see if this is a tree
491 that the language may need to handle specially. First handle things that
492 aren't types. */
493 if (! TYPE_P (t))
495 tree inner = t;
497 /* Remove any nops, then give the language a chance to do
498 something with this tree before we look at it. */
499 STRIP_NOPS (t);
500 set = lang_hooks.get_alias_set (t);
501 if (set != -1)
502 return set;
504 /* First see if the actual object referenced is an INDIRECT_REF from a
505 restrict-qualified pointer or a "void *". */
506 while (handled_component_p (inner))
508 inner = TREE_OPERAND (inner, 0);
509 STRIP_NOPS (inner);
512 /* Check for accesses through restrict-qualified pointers. */
513 if (INDIRECT_REF_P (inner))
515 tree decl = find_base_decl (TREE_OPERAND (inner, 0));
517 if (decl && DECL_POINTER_ALIAS_SET_KNOWN_P (decl))
519 /* If we haven't computed the actual alias set, do it now. */
520 if (DECL_POINTER_ALIAS_SET (decl) == -2)
522 tree pointed_to_type = TREE_TYPE (TREE_TYPE (decl));
524 /* No two restricted pointers can point at the same thing.
525 However, a restricted pointer can point at the same thing
526 as an unrestricted pointer, if that unrestricted pointer
527 is based on the restricted pointer. So, we make the
528 alias set for the restricted pointer a subset of the
529 alias set for the type pointed to by the type of the
530 decl. */
531 HOST_WIDE_INT pointed_to_alias_set
532 = get_alias_set (pointed_to_type);
534 if (pointed_to_alias_set == 0)
535 /* It's not legal to make a subset of alias set zero. */
536 DECL_POINTER_ALIAS_SET (decl) = 0;
537 else if (AGGREGATE_TYPE_P (pointed_to_type))
538 /* For an aggregate, we must treat the restricted
539 pointer the same as an ordinary pointer. If we
540 were to make the type pointed to by the
541 restricted pointer a subset of the pointed-to
542 type, then we would believe that other subsets
543 of the pointed-to type (such as fields of that
544 type) do not conflict with the type pointed to
545 by the restricted pointer. */
546 DECL_POINTER_ALIAS_SET (decl)
547 = pointed_to_alias_set;
548 else
550 DECL_POINTER_ALIAS_SET (decl) = new_alias_set ();
551 record_alias_subset (pointed_to_alias_set,
552 DECL_POINTER_ALIAS_SET (decl));
556 /* We use the alias set indicated in the declaration. */
557 return DECL_POINTER_ALIAS_SET (decl);
560 /* If we have an INDIRECT_REF via a void pointer, we don't
561 know anything about what that might alias. Likewise if the
562 pointer is marked that way. */
563 else if (TREE_CODE (TREE_TYPE (inner)) == VOID_TYPE
564 || (TYPE_REF_CAN_ALIAS_ALL
565 (TREE_TYPE (TREE_OPERAND (inner, 0)))))
566 return 0;
569 /* Otherwise, pick up the outermost object that we could have a pointer
570 to, processing conversions as above. */
571 while (component_uses_parent_alias_set (t))
573 t = TREE_OPERAND (t, 0);
574 STRIP_NOPS (t);
577 /* If we've already determined the alias set for a decl, just return
578 it. This is necessary for C++ anonymous unions, whose component
579 variables don't look like union members (boo!). */
580 if (TREE_CODE (t) == VAR_DECL
581 && DECL_RTL_SET_P (t) && MEM_P (DECL_RTL (t)))
582 return MEM_ALIAS_SET (DECL_RTL (t));
584 /* Now all we care about is the type. */
585 t = TREE_TYPE (t);
588 /* Variant qualifiers don't affect the alias set, so get the main
589 variant. If this is a type with a known alias set, return it. */
590 t = TYPE_MAIN_VARIANT (t);
591 if (TYPE_ALIAS_SET_KNOWN_P (t))
592 return TYPE_ALIAS_SET (t);
594 /* See if the language has special handling for this type. */
595 set = lang_hooks.get_alias_set (t);
596 if (set != -1)
597 return set;
599 /* There are no objects of FUNCTION_TYPE, so there's no point in
600 using up an alias set for them. (There are, of course, pointers
601 and references to functions, but that's different.) */
602 else if (TREE_CODE (t) == FUNCTION_TYPE)
603 set = 0;
605 /* Unless the language specifies otherwise, let vector types alias
606 their components. This avoids some nasty type punning issues in
607 normal usage. And indeed lets vectors be treated more like an
608 array slice. */
609 else if (TREE_CODE (t) == VECTOR_TYPE)
610 set = get_alias_set (TREE_TYPE (t));
612 else
613 /* Otherwise make a new alias set for this type. */
614 set = new_alias_set ();
616 TYPE_ALIAS_SET (t) = set;
618 /* If this is an aggregate type, we must record any component aliasing
619 information. */
620 if (AGGREGATE_TYPE_P (t) || TREE_CODE (t) == COMPLEX_TYPE)
621 record_component_aliases (t);
623 return set;
626 /* Return a brand-new alias set. */
628 HOST_WIDE_INT
629 new_alias_set (void)
631 if (flag_strict_aliasing)
633 if (alias_sets == 0)
634 VEC_safe_push (alias_set_entry, gc, alias_sets, 0);
635 VEC_safe_push (alias_set_entry, gc, alias_sets, 0);
636 return VEC_length (alias_set_entry, alias_sets) - 1;
638 else
639 return 0;
642 /* Indicate that things in SUBSET can alias things in SUPERSET, but that
643 not everything that aliases SUPERSET also aliases SUBSET. For example,
644 in C, a store to an `int' can alias a load of a structure containing an
645 `int', and vice versa. But it can't alias a load of a 'double' member
646 of the same structure. Here, the structure would be the SUPERSET and
647 `int' the SUBSET. This relationship is also described in the comment at
648 the beginning of this file.
650 This function should be called only once per SUPERSET/SUBSET pair.
652 It is illegal for SUPERSET to be zero; everything is implicitly a
653 subset of alias set zero. */
655 static void
656 record_alias_subset (HOST_WIDE_INT superset, HOST_WIDE_INT subset)
658 alias_set_entry superset_entry;
659 alias_set_entry subset_entry;
661 /* It is possible in complex type situations for both sets to be the same,
662 in which case we can ignore this operation. */
663 if (superset == subset)
664 return;
666 gcc_assert (superset);
668 superset_entry = get_alias_set_entry (superset);
669 if (superset_entry == 0)
671 /* Create an entry for the SUPERSET, so that we have a place to
672 attach the SUBSET. */
673 superset_entry = ggc_alloc (sizeof (struct alias_set_entry));
674 superset_entry->alias_set = superset;
675 superset_entry->children
676 = splay_tree_new_ggc (splay_tree_compare_ints);
677 superset_entry->has_zero_child = 0;
678 VEC_replace (alias_set_entry, alias_sets, superset, superset_entry);
681 if (subset == 0)
682 superset_entry->has_zero_child = 1;
683 else
685 subset_entry = get_alias_set_entry (subset);
686 /* If there is an entry for the subset, enter all of its children
687 (if they are not already present) as children of the SUPERSET. */
688 if (subset_entry)
690 if (subset_entry->has_zero_child)
691 superset_entry->has_zero_child = 1;
693 splay_tree_foreach (subset_entry->children, insert_subset_children,
694 superset_entry->children);
697 /* Enter the SUBSET itself as a child of the SUPERSET. */
698 splay_tree_insert (superset_entry->children,
699 (splay_tree_key) subset, 0);
703 /* Record that component types of TYPE, if any, are part of that type for
704 aliasing purposes. For record types, we only record component types
705 for fields that are marked addressable. For array types, we always
706 record the component types, so the front end should not call this
707 function if the individual component aren't addressable. */
709 void
710 record_component_aliases (tree type)
712 HOST_WIDE_INT superset = get_alias_set (type);
713 tree field;
715 if (superset == 0)
716 return;
718 switch (TREE_CODE (type))
720 case ARRAY_TYPE:
721 if (! TYPE_NONALIASED_COMPONENT (type))
722 record_alias_subset (superset, get_alias_set (TREE_TYPE (type)));
723 break;
725 case RECORD_TYPE:
726 case UNION_TYPE:
727 case QUAL_UNION_TYPE:
728 /* Recursively record aliases for the base classes, if there are any. */
729 if (TYPE_BINFO (type))
731 int i;
732 tree binfo, base_binfo;
734 for (binfo = TYPE_BINFO (type), i = 0;
735 BINFO_BASE_ITERATE (binfo, i, base_binfo); i++)
736 record_alias_subset (superset,
737 get_alias_set (BINFO_TYPE (base_binfo)));
739 for (field = TYPE_FIELDS (type); field != 0; field = TREE_CHAIN (field))
740 if (TREE_CODE (field) == FIELD_DECL && ! DECL_NONADDRESSABLE_P (field))
741 record_alias_subset (superset, get_alias_set (TREE_TYPE (field)));
742 break;
744 case COMPLEX_TYPE:
745 record_alias_subset (superset, get_alias_set (TREE_TYPE (type)));
746 break;
748 default:
749 break;
753 /* Allocate an alias set for use in storing and reading from the varargs
754 spill area. */
756 static GTY(()) HOST_WIDE_INT varargs_set = -1;
758 HOST_WIDE_INT
759 get_varargs_alias_set (void)
761 #if 1
762 /* We now lower VA_ARG_EXPR, and there's currently no way to attach the
763 varargs alias set to an INDIRECT_REF (FIXME!), so we can't
764 consistently use the varargs alias set for loads from the varargs
765 area. So don't use it anywhere. */
766 return 0;
767 #else
768 if (varargs_set == -1)
769 varargs_set = new_alias_set ();
771 return varargs_set;
772 #endif
775 /* Likewise, but used for the fixed portions of the frame, e.g., register
776 save areas. */
778 static GTY(()) HOST_WIDE_INT frame_set = -1;
780 HOST_WIDE_INT
781 get_frame_alias_set (void)
783 if (frame_set == -1)
784 frame_set = new_alias_set ();
786 return frame_set;
789 /* Inside SRC, the source of a SET, find a base address. */
791 static rtx
792 find_base_value (rtx src)
794 unsigned int regno;
796 switch (GET_CODE (src))
798 case SYMBOL_REF:
799 case LABEL_REF:
800 return src;
802 case REG:
803 regno = REGNO (src);
804 /* At the start of a function, argument registers have known base
805 values which may be lost later. Returning an ADDRESS
806 expression here allows optimization based on argument values
807 even when the argument registers are used for other purposes. */
808 if (regno < FIRST_PSEUDO_REGISTER && copying_arguments)
809 return new_reg_base_value[regno];
811 /* If a pseudo has a known base value, return it. Do not do this
812 for non-fixed hard regs since it can result in a circular
813 dependency chain for registers which have values at function entry.
815 The test above is not sufficient because the scheduler may move
816 a copy out of an arg reg past the NOTE_INSN_FUNCTION_BEGIN. */
817 if ((regno >= FIRST_PSEUDO_REGISTER || fixed_regs[regno])
818 && regno < VEC_length (rtx, reg_base_value))
820 /* If we're inside init_alias_analysis, use new_reg_base_value
821 to reduce the number of relaxation iterations. */
822 if (new_reg_base_value && new_reg_base_value[regno]
823 && REG_N_SETS (regno) == 1)
824 return new_reg_base_value[regno];
826 if (VEC_index (rtx, reg_base_value, regno))
827 return VEC_index (rtx, reg_base_value, regno);
830 return 0;
832 case MEM:
833 /* Check for an argument passed in memory. Only record in the
834 copying-arguments block; it is too hard to track changes
835 otherwise. */
836 if (copying_arguments
837 && (XEXP (src, 0) == arg_pointer_rtx
838 || (GET_CODE (XEXP (src, 0)) == PLUS
839 && XEXP (XEXP (src, 0), 0) == arg_pointer_rtx)))
840 return gen_rtx_ADDRESS (VOIDmode, src);
841 return 0;
843 case CONST:
844 src = XEXP (src, 0);
845 if (GET_CODE (src) != PLUS && GET_CODE (src) != MINUS)
846 break;
848 /* ... fall through ... */
850 case PLUS:
851 case MINUS:
853 rtx temp, src_0 = XEXP (src, 0), src_1 = XEXP (src, 1);
855 /* If either operand is a REG that is a known pointer, then it
856 is the base. */
857 if (REG_P (src_0) && REG_POINTER (src_0))
858 return find_base_value (src_0);
859 if (REG_P (src_1) && REG_POINTER (src_1))
860 return find_base_value (src_1);
862 /* If either operand is a REG, then see if we already have
863 a known value for it. */
864 if (REG_P (src_0))
866 temp = find_base_value (src_0);
867 if (temp != 0)
868 src_0 = temp;
871 if (REG_P (src_1))
873 temp = find_base_value (src_1);
874 if (temp!= 0)
875 src_1 = temp;
878 /* If either base is named object or a special address
879 (like an argument or stack reference), then use it for the
880 base term. */
881 if (src_0 != 0
882 && (GET_CODE (src_0) == SYMBOL_REF
883 || GET_CODE (src_0) == LABEL_REF
884 || (GET_CODE (src_0) == ADDRESS
885 && GET_MODE (src_0) != VOIDmode)))
886 return src_0;
888 if (src_1 != 0
889 && (GET_CODE (src_1) == SYMBOL_REF
890 || GET_CODE (src_1) == LABEL_REF
891 || (GET_CODE (src_1) == ADDRESS
892 && GET_MODE (src_1) != VOIDmode)))
893 return src_1;
895 /* Guess which operand is the base address:
896 If either operand is a symbol, then it is the base. If
897 either operand is a CONST_INT, then the other is the base. */
898 if (GET_CODE (src_1) == CONST_INT || CONSTANT_P (src_0))
899 return find_base_value (src_0);
900 else if (GET_CODE (src_0) == CONST_INT || CONSTANT_P (src_1))
901 return find_base_value (src_1);
903 return 0;
906 case LO_SUM:
907 /* The standard form is (lo_sum reg sym) so look only at the
908 second operand. */
909 return find_base_value (XEXP (src, 1));
911 case AND:
912 /* If the second operand is constant set the base
913 address to the first operand. */
914 if (GET_CODE (XEXP (src, 1)) == CONST_INT && INTVAL (XEXP (src, 1)) != 0)
915 return find_base_value (XEXP (src, 0));
916 return 0;
918 case TRUNCATE:
919 if (GET_MODE_SIZE (GET_MODE (src)) < GET_MODE_SIZE (Pmode))
920 break;
921 /* Fall through. */
922 case HIGH:
923 case PRE_INC:
924 case PRE_DEC:
925 case POST_INC:
926 case POST_DEC:
927 case PRE_MODIFY:
928 case POST_MODIFY:
929 return find_base_value (XEXP (src, 0));
931 case ZERO_EXTEND:
932 case SIGN_EXTEND: /* used for NT/Alpha pointers */
934 rtx temp = find_base_value (XEXP (src, 0));
936 if (temp != 0 && CONSTANT_P (temp))
937 temp = convert_memory_address (Pmode, temp);
939 return temp;
942 default:
943 break;
946 return 0;
949 /* Called from init_alias_analysis indirectly through note_stores. */
/* While insns are scanned to find base values, reg_seen[N] is nonzero
   once register N has been set in this function.  */
static char *reg_seen;

/* Counter supplying the unique integers that identify addresses known
   not to alias anything else.  */
static int unique_id;
959 static void
960 record_set (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
962 unsigned regno;
963 rtx src;
964 int n;
966 if (!REG_P (dest))
967 return;
969 regno = REGNO (dest);
971 gcc_assert (regno < VEC_length (rtx, reg_base_value));
973 /* If this spans multiple hard registers, then we must indicate that every
974 register has an unusable value. */
975 if (regno < FIRST_PSEUDO_REGISTER)
976 n = hard_regno_nregs[regno][GET_MODE (dest)];
977 else
978 n = 1;
979 if (n != 1)
981 while (--n >= 0)
983 reg_seen[regno + n] = 1;
984 new_reg_base_value[regno + n] = 0;
986 return;
989 if (set)
991 /* A CLOBBER wipes out any old value but does not prevent a previously
992 unset register from acquiring a base address (i.e. reg_seen is not
993 set). */
994 if (GET_CODE (set) == CLOBBER)
996 new_reg_base_value[regno] = 0;
997 return;
999 src = SET_SRC (set);
1001 else
1003 if (reg_seen[regno])
1005 new_reg_base_value[regno] = 0;
1006 return;
1008 reg_seen[regno] = 1;
1009 new_reg_base_value[regno] = gen_rtx_ADDRESS (Pmode,
1010 GEN_INT (unique_id++));
1011 return;
1014 /* If this is not the first set of REGNO, see whether the new value
1015 is related to the old one. There are two cases of interest:
1017 (1) The register might be assigned an entirely new value
1018 that has the same base term as the original set.
1020 (2) The set might be a simple self-modification that
1021 cannot change REGNO's base value.
1023 If neither case holds, reject the original base value as invalid.
1024 Note that the following situation is not detected:
1026 extern int x, y; int *p = &x; p += (&y-&x);
1028 ANSI C does not allow computing the difference of addresses
1029 of distinct top level objects. */
1030 if (new_reg_base_value[regno] != 0
1031 && find_base_value (src) != new_reg_base_value[regno])
1032 switch (GET_CODE (src))
1034 case LO_SUM:
1035 case MINUS:
1036 if (XEXP (src, 0) != dest && XEXP (src, 1) != dest)
1037 new_reg_base_value[regno] = 0;
1038 break;
1039 case PLUS:
1040 /* If the value we add in the PLUS is also a valid base value,
1041 this might be the actual base value, and the original value
1042 an index. */
1044 rtx other = NULL_RTX;
1046 if (XEXP (src, 0) == dest)
1047 other = XEXP (src, 1);
1048 else if (XEXP (src, 1) == dest)
1049 other = XEXP (src, 0);
1051 if (! other || find_base_value (other))
1052 new_reg_base_value[regno] = 0;
1053 break;
1055 case AND:
1056 if (XEXP (src, 0) != dest || GET_CODE (XEXP (src, 1)) != CONST_INT)
1057 new_reg_base_value[regno] = 0;
1058 break;
1059 default:
1060 new_reg_base_value[regno] = 0;
1061 break;
1063 /* If this is the first set of a register, record the value. */
1064 else if ((regno >= FIRST_PSEUDO_REGISTER || ! fixed_regs[regno])
1065 && ! reg_seen[regno] && new_reg_base_value[regno] == 0)
1066 new_reg_base_value[regno] = find_base_value (src);
1068 reg_seen[regno] = 1;
1071 /* Clear alias info for a register. This is used if an RTL transformation
1072 changes the value of a register. This is used in flow by AUTO_INC_DEC
1073 optimizations. We don't need to clear reg_base_value, since flow only
1074 changes the offset. */
1076 void
1077 clear_reg_alias_info (rtx reg)
1079 unsigned int regno = REGNO (reg);
1081 if (regno >= FIRST_PSEUDO_REGISTER)
1083 regno -= FIRST_PSEUDO_REGISTER;
1084 if (regno < reg_known_value_size)
1086 reg_known_value[regno] = reg;
1087 reg_known_equiv_p[regno] = false;
1092 /* If a value is known for REGNO, return it. */
1095 get_reg_known_value (unsigned int regno)
1097 if (regno >= FIRST_PSEUDO_REGISTER)
1099 regno -= FIRST_PSEUDO_REGISTER;
1100 if (regno < reg_known_value_size)
1101 return reg_known_value[regno];
1103 return NULL;
1106 /* Set it. */
1108 static void
1109 set_reg_known_value (unsigned int regno, rtx val)
1111 if (regno >= FIRST_PSEUDO_REGISTER)
1113 regno -= FIRST_PSEUDO_REGISTER;
1114 if (regno < reg_known_value_size)
1115 reg_known_value[regno] = val;
1119 /* Similarly for reg_known_equiv_p. */
1121 bool
1122 get_reg_known_equiv_p (unsigned int regno)
1124 if (regno >= FIRST_PSEUDO_REGISTER)
1126 regno -= FIRST_PSEUDO_REGISTER;
1127 if (regno < reg_known_value_size)
1128 return reg_known_equiv_p[regno];
1130 return false;
1133 static void
1134 set_reg_known_equiv_p (unsigned int regno, bool val)
1136 if (regno >= FIRST_PSEUDO_REGISTER)
1138 regno -= FIRST_PSEUDO_REGISTER;
1139 if (regno < reg_known_value_size)
1140 reg_known_equiv_p[regno] = val;
1145 /* Returns a canonical version of X, from the point of view alias
1146 analysis. (For example, if X is a MEM whose address is a register,
1147 and the register has a known value (say a SYMBOL_REF), then a MEM
1148 whose address is the SYMBOL_REF is returned.) */
1151 canon_rtx (rtx x)
1153 /* Recursively look for equivalences. */
1154 if (REG_P (x) && REGNO (x) >= FIRST_PSEUDO_REGISTER)
1156 rtx t = get_reg_known_value (REGNO (x));
1157 if (t == x)
1158 return x;
1159 if (t)
1160 return canon_rtx (t);
1163 if (GET_CODE (x) == PLUS)
1165 rtx x0 = canon_rtx (XEXP (x, 0));
1166 rtx x1 = canon_rtx (XEXP (x, 1));
1168 if (x0 != XEXP (x, 0) || x1 != XEXP (x, 1))
1170 if (GET_CODE (x0) == CONST_INT)
1171 return plus_constant (x1, INTVAL (x0));
1172 else if (GET_CODE (x1) == CONST_INT)
1173 return plus_constant (x0, INTVAL (x1));
1174 return gen_rtx_PLUS (GET_MODE (x), x0, x1);
1178 /* This gives us much better alias analysis when called from
1179 the loop optimizer. Note we want to leave the original
1180 MEM alone, but need to return the canonicalized MEM with
1181 all the flags with their original values. */
1182 else if (MEM_P (x))
1183 x = replace_equiv_address_nv (x, canon_rtx (XEXP (x, 0)));
1185 return x;
1188 /* Return 1 if X and Y are identical-looking rtx's.
1189 Expect that X and Y has been already canonicalized.
1191 We use the data in reg_known_value above to see if two registers with
1192 different numbers are, in fact, equivalent. */
1194 static int
1195 rtx_equal_for_memref_p (rtx x, rtx y)
1197 int i;
1198 int j;
1199 enum rtx_code code;
1200 const char *fmt;
1202 if (x == 0 && y == 0)
1203 return 1;
1204 if (x == 0 || y == 0)
1205 return 0;
1207 if (x == y)
1208 return 1;
1210 code = GET_CODE (x);
1211 /* Rtx's of different codes cannot be equal. */
1212 if (code != GET_CODE (y))
1213 return 0;
1215 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
1216 (REG:SI x) and (REG:HI x) are NOT equivalent. */
1218 if (GET_MODE (x) != GET_MODE (y))
1219 return 0;
1221 /* Some RTL can be compared without a recursive examination. */
1222 switch (code)
1224 case REG:
1225 return REGNO (x) == REGNO (y);
1227 case LABEL_REF:
1228 return XEXP (x, 0) == XEXP (y, 0);
1230 case SYMBOL_REF:
1231 return XSTR (x, 0) == XSTR (y, 0);
1233 case VALUE:
1234 case CONST_INT:
1235 case CONST_DOUBLE:
1236 /* There's no need to compare the contents of CONST_DOUBLEs or
1237 CONST_INTs because pointer equality is a good enough
1238 comparison for these nodes. */
1239 return 0;
1241 default:
1242 break;
1245 /* canon_rtx knows how to handle plus. No need to canonicalize. */
1246 if (code == PLUS)
1247 return ((rtx_equal_for_memref_p (XEXP (x, 0), XEXP (y, 0))
1248 && rtx_equal_for_memref_p (XEXP (x, 1), XEXP (y, 1)))
1249 || (rtx_equal_for_memref_p (XEXP (x, 0), XEXP (y, 1))
1250 && rtx_equal_for_memref_p (XEXP (x, 1), XEXP (y, 0))));
1251 /* For commutative operations, the RTX match if the operand match in any
1252 order. Also handle the simple binary and unary cases without a loop. */
1253 if (COMMUTATIVE_P (x))
1255 rtx xop0 = canon_rtx (XEXP (x, 0));
1256 rtx yop0 = canon_rtx (XEXP (y, 0));
1257 rtx yop1 = canon_rtx (XEXP (y, 1));
1259 return ((rtx_equal_for_memref_p (xop0, yop0)
1260 && rtx_equal_for_memref_p (canon_rtx (XEXP (x, 1)), yop1))
1261 || (rtx_equal_for_memref_p (xop0, yop1)
1262 && rtx_equal_for_memref_p (canon_rtx (XEXP (x, 1)), yop0)));
1264 else if (NON_COMMUTATIVE_P (x))
1266 return (rtx_equal_for_memref_p (canon_rtx (XEXP (x, 0)),
1267 canon_rtx (XEXP (y, 0)))
1268 && rtx_equal_for_memref_p (canon_rtx (XEXP (x, 1)),
1269 canon_rtx (XEXP (y, 1))));
1271 else if (UNARY_P (x))
1272 return rtx_equal_for_memref_p (canon_rtx (XEXP (x, 0)),
1273 canon_rtx (XEXP (y, 0)));
1275 /* Compare the elements. If any pair of corresponding elements
1276 fail to match, return 0 for the whole things.
1278 Limit cases to types which actually appear in addresses. */
1280 fmt = GET_RTX_FORMAT (code);
1281 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1283 switch (fmt[i])
1285 case 'i':
1286 if (XINT (x, i) != XINT (y, i))
1287 return 0;
1288 break;
1290 case 'E':
1291 /* Two vectors must have the same length. */
1292 if (XVECLEN (x, i) != XVECLEN (y, i))
1293 return 0;
1295 /* And the corresponding elements must match. */
1296 for (j = 0; j < XVECLEN (x, i); j++)
1297 if (rtx_equal_for_memref_p (canon_rtx (XVECEXP (x, i, j)),
1298 canon_rtx (XVECEXP (y, i, j))) == 0)
1299 return 0;
1300 break;
1302 case 'e':
1303 if (rtx_equal_for_memref_p (canon_rtx (XEXP (x, i)),
1304 canon_rtx (XEXP (y, i))) == 0)
1305 return 0;
1306 break;
1308 /* This can happen for asm operands. */
1309 case 's':
1310 if (strcmp (XSTR (x, i), XSTR (y, i)))
1311 return 0;
1312 break;
1314 /* This can happen for an asm which clobbers memory. */
1315 case '0':
1316 break;
1318 /* It is believed that rtx's at this level will never
1319 contain anything but integers and other rtx's,
1320 except for within LABEL_REFs and SYMBOL_REFs. */
1321 default:
1322 gcc_unreachable ();
1325 return 1;
1328 /* Given an rtx X, find a SYMBOL_REF or LABEL_REF within
1329 X and return it, or return 0 if none found. */
1331 static rtx
1332 find_symbolic_term (rtx x)
1334 int i;
1335 enum rtx_code code;
1336 const char *fmt;
1338 code = GET_CODE (x);
1339 if (code == SYMBOL_REF || code == LABEL_REF)
1340 return x;
1341 if (OBJECT_P (x))
1342 return 0;
1344 fmt = GET_RTX_FORMAT (code);
1345 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1347 rtx t;
1349 if (fmt[i] == 'e')
1351 t = find_symbolic_term (XEXP (x, i));
1352 if (t != 0)
1353 return t;
1355 else if (fmt[i] == 'E')
1356 break;
1358 return 0;
1362 find_base_term (rtx x)
1364 cselib_val *val;
1365 struct elt_loc_list *l;
1367 #if defined (FIND_BASE_TERM)
1368 /* Try machine-dependent ways to find the base term. */
1369 x = FIND_BASE_TERM (x);
1370 #endif
1372 switch (GET_CODE (x))
1374 case REG:
1375 return REG_BASE_VALUE (x);
1377 case TRUNCATE:
1378 if (GET_MODE_SIZE (GET_MODE (x)) < GET_MODE_SIZE (Pmode))
1379 return 0;
1380 /* Fall through. */
1381 case HIGH:
1382 case PRE_INC:
1383 case PRE_DEC:
1384 case POST_INC:
1385 case POST_DEC:
1386 case PRE_MODIFY:
1387 case POST_MODIFY:
1388 return find_base_term (XEXP (x, 0));
1390 case ZERO_EXTEND:
1391 case SIGN_EXTEND: /* Used for Alpha/NT pointers */
1393 rtx temp = find_base_term (XEXP (x, 0));
1395 if (temp != 0 && CONSTANT_P (temp))
1396 temp = convert_memory_address (Pmode, temp);
1398 return temp;
1401 case VALUE:
1402 val = CSELIB_VAL_PTR (x);
1403 if (!val)
1404 return 0;
1405 for (l = val->locs; l; l = l->next)
1406 if ((x = find_base_term (l->loc)) != 0)
1407 return x;
1408 return 0;
1410 case CONST:
1411 x = XEXP (x, 0);
1412 if (GET_CODE (x) != PLUS && GET_CODE (x) != MINUS)
1413 return 0;
1414 /* Fall through. */
1415 case LO_SUM:
1416 case PLUS:
1417 case MINUS:
1419 rtx tmp1 = XEXP (x, 0);
1420 rtx tmp2 = XEXP (x, 1);
1422 /* This is a little bit tricky since we have to determine which of
1423 the two operands represents the real base address. Otherwise this
1424 routine may return the index register instead of the base register.
1426 That may cause us to believe no aliasing was possible, when in
1427 fact aliasing is possible.
1429 We use a few simple tests to guess the base register. Additional
1430 tests can certainly be added. For example, if one of the operands
1431 is a shift or multiply, then it must be the index register and the
1432 other operand is the base register. */
1434 if (tmp1 == pic_offset_table_rtx && CONSTANT_P (tmp2))
1435 return find_base_term (tmp2);
1437 /* If either operand is known to be a pointer, then use it
1438 to determine the base term. */
1439 if (REG_P (tmp1) && REG_POINTER (tmp1))
1440 return find_base_term (tmp1);
1442 if (REG_P (tmp2) && REG_POINTER (tmp2))
1443 return find_base_term (tmp2);
1445 /* Neither operand was known to be a pointer. Go ahead and find the
1446 base term for both operands. */
1447 tmp1 = find_base_term (tmp1);
1448 tmp2 = find_base_term (tmp2);
1450 /* If either base term is named object or a special address
1451 (like an argument or stack reference), then use it for the
1452 base term. */
1453 if (tmp1 != 0
1454 && (GET_CODE (tmp1) == SYMBOL_REF
1455 || GET_CODE (tmp1) == LABEL_REF
1456 || (GET_CODE (tmp1) == ADDRESS
1457 && GET_MODE (tmp1) != VOIDmode)))
1458 return tmp1;
1460 if (tmp2 != 0
1461 && (GET_CODE (tmp2) == SYMBOL_REF
1462 || GET_CODE (tmp2) == LABEL_REF
1463 || (GET_CODE (tmp2) == ADDRESS
1464 && GET_MODE (tmp2) != VOIDmode)))
1465 return tmp2;
1467 /* We could not determine which of the two operands was the
1468 base register and which was the index. So we can determine
1469 nothing from the base alias check. */
1470 return 0;
1473 case AND:
1474 if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) != 0)
1475 return find_base_term (XEXP (x, 0));
1476 return 0;
1478 case SYMBOL_REF:
1479 case LABEL_REF:
1480 return x;
1482 default:
1483 return 0;
1487 /* Return 0 if the addresses X and Y are known to point to different
1488 objects, 1 if they might be pointers to the same object. */
1490 static int
1491 base_alias_check (rtx x, rtx y, enum machine_mode x_mode,
1492 enum machine_mode y_mode)
1494 rtx x_base = find_base_term (x);
1495 rtx y_base = find_base_term (y);
1497 /* If the address itself has no known base see if a known equivalent
1498 value has one. If either address still has no known base, nothing
1499 is known about aliasing. */
1500 if (x_base == 0)
1502 rtx x_c;
1504 if (! flag_expensive_optimizations || (x_c = canon_rtx (x)) == x)
1505 return 1;
1507 x_base = find_base_term (x_c);
1508 if (x_base == 0)
1509 return 1;
1512 if (y_base == 0)
1514 rtx y_c;
1515 if (! flag_expensive_optimizations || (y_c = canon_rtx (y)) == y)
1516 return 1;
1518 y_base = find_base_term (y_c);
1519 if (y_base == 0)
1520 return 1;
1523 /* If the base addresses are equal nothing is known about aliasing. */
1524 if (rtx_equal_p (x_base, y_base))
1525 return 1;
1527 /* The base addresses of the read and write are different expressions.
1528 If they are both symbols and they are not accessed via AND, there is
1529 no conflict. We can bring knowledge of object alignment into play
1530 here. For example, on alpha, "char a, b;" can alias one another,
1531 though "char a; long b;" cannot. */
1532 if (GET_CODE (x_base) != ADDRESS && GET_CODE (y_base) != ADDRESS)
1534 if (GET_CODE (x) == AND && GET_CODE (y) == AND)
1535 return 1;
1536 if (GET_CODE (x) == AND
1537 && (GET_CODE (XEXP (x, 1)) != CONST_INT
1538 || (int) GET_MODE_UNIT_SIZE (y_mode) < -INTVAL (XEXP (x, 1))))
1539 return 1;
1540 if (GET_CODE (y) == AND
1541 && (GET_CODE (XEXP (y, 1)) != CONST_INT
1542 || (int) GET_MODE_UNIT_SIZE (x_mode) < -INTVAL (XEXP (y, 1))))
1543 return 1;
1544 /* Differing symbols never alias. */
1545 return 0;
1548 /* If one address is a stack reference there can be no alias:
1549 stack references using different base registers do not alias,
1550 a stack reference can not alias a parameter, and a stack reference
1551 can not alias a global. */
1552 if ((GET_CODE (x_base) == ADDRESS && GET_MODE (x_base) == Pmode)
1553 || (GET_CODE (y_base) == ADDRESS && GET_MODE (y_base) == Pmode))
1554 return 0;
1556 if (! flag_argument_noalias)
1557 return 1;
1559 if (flag_argument_noalias > 1)
1560 return 0;
1562 /* Weak noalias assertion (arguments are distinct, but may match globals). */
1563 return ! (GET_MODE (x_base) == VOIDmode && GET_MODE (y_base) == VOIDmode);
1566 /* Convert the address X into something we can use. This is done by returning
1567 it unchanged unless it is a value; in the latter case we call cselib to get
1568 a more useful rtx. */
1571 get_addr (rtx x)
1573 cselib_val *v;
1574 struct elt_loc_list *l;
1576 if (GET_CODE (x) != VALUE)
1577 return x;
1578 v = CSELIB_VAL_PTR (x);
1579 if (v)
1581 for (l = v->locs; l; l = l->next)
1582 if (CONSTANT_P (l->loc))
1583 return l->loc;
1584 for (l = v->locs; l; l = l->next)
1585 if (!REG_P (l->loc) && !MEM_P (l->loc))
1586 return l->loc;
1587 if (v->locs)
1588 return v->locs->loc;
1590 return x;
1593 /* Return the address of the (N_REFS + 1)th memory reference to ADDR
1594 where SIZE is the size in bytes of the memory reference. If ADDR
1595 is not modified by the memory reference then ADDR is returned. */
1597 static rtx
1598 addr_side_effect_eval (rtx addr, int size, int n_refs)
1600 int offset = 0;
1602 switch (GET_CODE (addr))
1604 case PRE_INC:
1605 offset = (n_refs + 1) * size;
1606 break;
1607 case PRE_DEC:
1608 offset = -(n_refs + 1) * size;
1609 break;
1610 case POST_INC:
1611 offset = n_refs * size;
1612 break;
1613 case POST_DEC:
1614 offset = -n_refs * size;
1615 break;
1617 default:
1618 return addr;
1621 if (offset)
1622 addr = gen_rtx_PLUS (GET_MODE (addr), XEXP (addr, 0),
1623 GEN_INT (offset));
1624 else
1625 addr = XEXP (addr, 0);
1626 addr = canon_rtx (addr);
1628 return addr;
1631 /* Return nonzero if X and Y (memory addresses) could reference the
1632 same location in memory. C is an offset accumulator. When
1633 C is nonzero, we are testing aliases between X and Y + C.
1634 XSIZE is the size in bytes of the X reference,
1635 similarly YSIZE is the size in bytes for Y.
1636 Expect that canon_rtx has been already called for X and Y.
1638 If XSIZE or YSIZE is zero, we do not know the amount of memory being
1639 referenced (the reference was BLKmode), so make the most pessimistic
1640 assumptions.
1642 If XSIZE or YSIZE is negative, we may access memory outside the object
1643 being referenced as a side effect. This can happen when using AND to
1644 align memory references, as is done on the Alpha.
1646 Nice to notice that varying addresses cannot conflict with fp if no
1647 local variables had their addresses taken, but that's too hard now. */
1649 static int
1650 memrefs_conflict_p (int xsize, rtx x, int ysize, rtx y, HOST_WIDE_INT c)
1652 if (GET_CODE (x) == VALUE)
1653 x = get_addr (x);
1654 if (GET_CODE (y) == VALUE)
1655 y = get_addr (y);
1656 if (GET_CODE (x) == HIGH)
1657 x = XEXP (x, 0);
1658 else if (GET_CODE (x) == LO_SUM)
1659 x = XEXP (x, 1);
1660 else
1661 x = addr_side_effect_eval (x, xsize, 0);
1662 if (GET_CODE (y) == HIGH)
1663 y = XEXP (y, 0);
1664 else if (GET_CODE (y) == LO_SUM)
1665 y = XEXP (y, 1);
1666 else
1667 y = addr_side_effect_eval (y, ysize, 0);
1669 if (rtx_equal_for_memref_p (x, y))
1671 if (xsize <= 0 || ysize <= 0)
1672 return 1;
1673 if (c >= 0 && xsize > c)
1674 return 1;
1675 if (c < 0 && ysize+c > 0)
1676 return 1;
1677 return 0;
1680 /* This code used to check for conflicts involving stack references and
1681 globals but the base address alias code now handles these cases. */
1683 if (GET_CODE (x) == PLUS)
1685 /* The fact that X is canonicalized means that this
1686 PLUS rtx is canonicalized. */
1687 rtx x0 = XEXP (x, 0);
1688 rtx x1 = XEXP (x, 1);
1690 if (GET_CODE (y) == PLUS)
1692 /* The fact that Y is canonicalized means that this
1693 PLUS rtx is canonicalized. */
1694 rtx y0 = XEXP (y, 0);
1695 rtx y1 = XEXP (y, 1);
1697 if (rtx_equal_for_memref_p (x1, y1))
1698 return memrefs_conflict_p (xsize, x0, ysize, y0, c);
1699 if (rtx_equal_for_memref_p (x0, y0))
1700 return memrefs_conflict_p (xsize, x1, ysize, y1, c);
1701 if (GET_CODE (x1) == CONST_INT)
1703 if (GET_CODE (y1) == CONST_INT)
1704 return memrefs_conflict_p (xsize, x0, ysize, y0,
1705 c - INTVAL (x1) + INTVAL (y1));
1706 else
1707 return memrefs_conflict_p (xsize, x0, ysize, y,
1708 c - INTVAL (x1));
1710 else if (GET_CODE (y1) == CONST_INT)
1711 return memrefs_conflict_p (xsize, x, ysize, y0, c + INTVAL (y1));
1713 return 1;
1715 else if (GET_CODE (x1) == CONST_INT)
1716 return memrefs_conflict_p (xsize, x0, ysize, y, c - INTVAL (x1));
1718 else if (GET_CODE (y) == PLUS)
1720 /* The fact that Y is canonicalized means that this
1721 PLUS rtx is canonicalized. */
1722 rtx y0 = XEXP (y, 0);
1723 rtx y1 = XEXP (y, 1);
1725 if (GET_CODE (y1) == CONST_INT)
1726 return memrefs_conflict_p (xsize, x, ysize, y0, c + INTVAL (y1));
1727 else
1728 return 1;
1731 if (GET_CODE (x) == GET_CODE (y))
1732 switch (GET_CODE (x))
1734 case MULT:
1736 /* Handle cases where we expect the second operands to be the
1737 same, and check only whether the first operand would conflict
1738 or not. */
1739 rtx x0, y0;
1740 rtx x1 = canon_rtx (XEXP (x, 1));
1741 rtx y1 = canon_rtx (XEXP (y, 1));
1742 if (! rtx_equal_for_memref_p (x1, y1))
1743 return 1;
1744 x0 = canon_rtx (XEXP (x, 0));
1745 y0 = canon_rtx (XEXP (y, 0));
1746 if (rtx_equal_for_memref_p (x0, y0))
1747 return (xsize == 0 || ysize == 0
1748 || (c >= 0 && xsize > c) || (c < 0 && ysize+c > 0));
1750 /* Can't properly adjust our sizes. */
1751 if (GET_CODE (x1) != CONST_INT)
1752 return 1;
1753 xsize /= INTVAL (x1);
1754 ysize /= INTVAL (x1);
1755 c /= INTVAL (x1);
1756 return memrefs_conflict_p (xsize, x0, ysize, y0, c);
1759 default:
1760 break;
1763 /* Treat an access through an AND (e.g. a subword access on an Alpha)
1764 as an access with indeterminate size. Assume that references
1765 besides AND are aligned, so if the size of the other reference is
1766 at least as large as the alignment, assume no other overlap. */
1767 if (GET_CODE (x) == AND && GET_CODE (XEXP (x, 1)) == CONST_INT)
1769 if (GET_CODE (y) == AND || ysize < -INTVAL (XEXP (x, 1)))
1770 xsize = -1;
1771 return memrefs_conflict_p (xsize, canon_rtx (XEXP (x, 0)), ysize, y, c);
1773 if (GET_CODE (y) == AND && GET_CODE (XEXP (y, 1)) == CONST_INT)
1775 /* ??? If we are indexing far enough into the array/structure, we
1776 may yet be able to determine that we can not overlap. But we
1777 also need to that we are far enough from the end not to overlap
1778 a following reference, so we do nothing with that for now. */
1779 if (GET_CODE (x) == AND || xsize < -INTVAL (XEXP (y, 1)))
1780 ysize = -1;
1781 return memrefs_conflict_p (xsize, x, ysize, canon_rtx (XEXP (y, 0)), c);
1784 if (CONSTANT_P (x))
1786 if (GET_CODE (x) == CONST_INT && GET_CODE (y) == CONST_INT)
1788 c += (INTVAL (y) - INTVAL (x));
1789 return (xsize <= 0 || ysize <= 0
1790 || (c >= 0 && xsize > c) || (c < 0 && ysize+c > 0));
1793 if (GET_CODE (x) == CONST)
1795 if (GET_CODE (y) == CONST)
1796 return memrefs_conflict_p (xsize, canon_rtx (XEXP (x, 0)),
1797 ysize, canon_rtx (XEXP (y, 0)), c);
1798 else
1799 return memrefs_conflict_p (xsize, canon_rtx (XEXP (x, 0)),
1800 ysize, y, c);
1802 if (GET_CODE (y) == CONST)
1803 return memrefs_conflict_p (xsize, x, ysize,
1804 canon_rtx (XEXP (y, 0)), c);
1806 if (CONSTANT_P (y))
1807 return (xsize <= 0 || ysize <= 0
1808 || (rtx_equal_for_memref_p (x, y)
1809 && ((c >= 0 && xsize > c) || (c < 0 && ysize+c > 0))));
1811 return 1;
1813 return 1;
1816 /* Functions to compute memory dependencies.
1818 Since we process the insns in execution order, we can build tables
1819 to keep track of what registers are fixed (and not aliased), what registers
1820 are varying in known ways, and what registers are varying in unknown
1821 ways.
1823 If both memory references are volatile, then there must always be a
1824 dependence between the two references, since their order can not be
1825 changed. A volatile and non-volatile reference can be interchanged
1826 though.
1828 A MEM_IN_STRUCT reference at a non-AND varying address can never
1829 conflict with a non-MEM_IN_STRUCT reference at a fixed address. We
1830 also must allow AND addresses, because they may generate accesses
1831 outside the object being referenced. This is used to generate
1832 aligned addresses from unaligned addresses, for instance, the alpha
1833 storeqi_unaligned pattern. */
1835 /* Read dependence: X is read after read in MEM takes place. There can
1836 only be a dependence here if both reads are volatile. */
1839 read_dependence (rtx mem, rtx x)
1841 return MEM_VOLATILE_P (x) && MEM_VOLATILE_P (mem);
1844 /* Returns MEM1 if and only if MEM1 is a scalar at a fixed address and
1845 MEM2 is a reference to a structure at a varying address, or returns
1846 MEM2 if vice versa. Otherwise, returns NULL_RTX. If a non-NULL
1847 value is returned MEM1 and MEM2 can never alias. VARIES_P is used
1848 to decide whether or not an address may vary; it should return
1849 nonzero whenever variation is possible.
1850 MEM1_ADDR and MEM2_ADDR are the addresses of MEM1 and MEM2. */
1852 static rtx
1853 fixed_scalar_and_varying_struct_p (rtx mem1, rtx mem2, rtx mem1_addr,
1854 rtx mem2_addr,
1855 int (*varies_p) (rtx, int))
1857 if (! flag_strict_aliasing)
1858 return NULL_RTX;
1860 if (MEM_ALIAS_SET (mem2)
1861 && MEM_SCALAR_P (mem1) && MEM_IN_STRUCT_P (mem2)
1862 && !varies_p (mem1_addr, 1) && varies_p (mem2_addr, 1))
1863 /* MEM1 is a scalar at a fixed address; MEM2 is a struct at a
1864 varying address. */
1865 return mem1;
1867 if (MEM_ALIAS_SET (mem1)
1868 && MEM_IN_STRUCT_P (mem1) && MEM_SCALAR_P (mem2)
1869 && varies_p (mem1_addr, 1) && !varies_p (mem2_addr, 1))
1870 /* MEM2 is a scalar at a fixed address; MEM1 is a struct at a
1871 varying address. */
1872 return mem2;
1874 return NULL_RTX;
1877 /* Returns nonzero if something about the mode or address format MEM1
1878 indicates that it might well alias *anything*. */
1880 static int
1881 aliases_everything_p (rtx mem)
1883 if (GET_CODE (XEXP (mem, 0)) == AND)
1884 /* If the address is an AND, it's very hard to know at what it is
1885 actually pointing. */
1886 return 1;
1888 return 0;
1891 /* Return true if we can determine that the fields referenced cannot
1892 overlap for any pair of objects. */
1894 static bool
1895 nonoverlapping_component_refs_p (tree x, tree y)
1897 tree fieldx, fieldy, typex, typey, orig_y;
1901 /* The comparison has to be done at a common type, since we don't
1902 know how the inheritance hierarchy works. */
1903 orig_y = y;
1906 fieldx = TREE_OPERAND (x, 1);
1907 typex = TYPE_MAIN_VARIANT (DECL_FIELD_CONTEXT (fieldx));
1909 y = orig_y;
1912 fieldy = TREE_OPERAND (y, 1);
1913 typey = TYPE_MAIN_VARIANT (DECL_FIELD_CONTEXT (fieldy));
1915 if (typex == typey)
1916 goto found;
1918 y = TREE_OPERAND (y, 0);
1920 while (y && TREE_CODE (y) == COMPONENT_REF);
1922 x = TREE_OPERAND (x, 0);
1924 while (x && TREE_CODE (x) == COMPONENT_REF);
1925 /* Never found a common type. */
1926 return false;
1928 found:
1929 /* If we're left with accessing different fields of a structure,
1930 then no overlap. */
1931 if (TREE_CODE (typex) == RECORD_TYPE
1932 && fieldx != fieldy)
1933 return true;
1935 /* The comparison on the current field failed. If we're accessing
1936 a very nested structure, look at the next outer level. */
1937 x = TREE_OPERAND (x, 0);
1938 y = TREE_OPERAND (y, 0);
1940 while (x && y
1941 && TREE_CODE (x) == COMPONENT_REF
1942 && TREE_CODE (y) == COMPONENT_REF);
1944 return false;
1947 /* Look at the bottom of the COMPONENT_REF list for a DECL, and return it. */
1949 static tree
1950 decl_for_component_ref (tree x)
1954 x = TREE_OPERAND (x, 0);
1956 while (x && TREE_CODE (x) == COMPONENT_REF);
1958 return x && DECL_P (x) ? x : NULL_TREE;
1961 /* Walk up the COMPONENT_REF list and adjust OFFSET to compensate for the
1962 offset of the field reference. */
1964 static rtx
1965 adjust_offset_for_component_ref (tree x, rtx offset)
1967 HOST_WIDE_INT ioffset;
1969 if (! offset)
1970 return NULL_RTX;
1972 ioffset = INTVAL (offset);
1975 tree offset = component_ref_field_offset (x);
1976 tree field = TREE_OPERAND (x, 1);
1978 if (! host_integerp (offset, 1))
1979 return NULL_RTX;
1980 ioffset += (tree_low_cst (offset, 1)
1981 + (tree_low_cst (DECL_FIELD_BIT_OFFSET (field), 1)
1982 / BITS_PER_UNIT));
1984 x = TREE_OPERAND (x, 0);
1986 while (x && TREE_CODE (x) == COMPONENT_REF);
1988 return GEN_INT (ioffset);
1991 /* Return nonzero if we can determine the exprs corresponding to memrefs
1992 X and Y and they do not overlap. */
1994 static int
1995 nonoverlapping_memrefs_p (rtx x, rtx y)
1997 tree exprx = MEM_EXPR (x), expry = MEM_EXPR (y);
1998 rtx rtlx, rtly;
1999 rtx basex, basey;
2000 rtx moffsetx, moffsety;
2001 HOST_WIDE_INT offsetx = 0, offsety = 0, sizex, sizey, tem;
2003 /* Unless both have exprs, we can't tell anything. */
2004 if (exprx == 0 || expry == 0)
2005 return 0;
2007 /* If both are field references, we may be able to determine something. */
2008 if (TREE_CODE (exprx) == COMPONENT_REF
2009 && TREE_CODE (expry) == COMPONENT_REF
2010 && nonoverlapping_component_refs_p (exprx, expry))
2011 return 1;
2014 /* If the field reference test failed, look at the DECLs involved. */
2015 moffsetx = MEM_OFFSET (x);
2016 if (TREE_CODE (exprx) == COMPONENT_REF)
2018 if (TREE_CODE (expry) == VAR_DECL
2019 && POINTER_TYPE_P (TREE_TYPE (expry)))
2021 tree field = TREE_OPERAND (exprx, 1);
2022 tree fieldcontext = DECL_FIELD_CONTEXT (field);
2023 if (ipa_type_escape_field_does_not_clobber_p (fieldcontext,
2024 TREE_TYPE (field)))
2025 return 1;
2028 tree t = decl_for_component_ref (exprx);
2029 if (! t)
2030 return 0;
2031 moffsetx = adjust_offset_for_component_ref (exprx, moffsetx);
2032 exprx = t;
2035 else if (INDIRECT_REF_P (exprx))
2037 exprx = TREE_OPERAND (exprx, 0);
2038 if (flag_argument_noalias < 2
2039 || TREE_CODE (exprx) != PARM_DECL)
2040 return 0;
2043 moffsety = MEM_OFFSET (y);
2044 if (TREE_CODE (expry) == COMPONENT_REF)
2046 if (TREE_CODE (exprx) == VAR_DECL
2047 && POINTER_TYPE_P (TREE_TYPE (exprx)))
2049 tree field = TREE_OPERAND (expry, 1);
2050 tree fieldcontext = DECL_FIELD_CONTEXT (field);
2051 if (ipa_type_escape_field_does_not_clobber_p (fieldcontext,
2052 TREE_TYPE (field)))
2053 return 1;
2056 tree t = decl_for_component_ref (expry);
2057 if (! t)
2058 return 0;
2059 moffsety = adjust_offset_for_component_ref (expry, moffsety);
2060 expry = t;
2063 else if (INDIRECT_REF_P (expry))
2065 expry = TREE_OPERAND (expry, 0);
2066 if (flag_argument_noalias < 2
2067 || TREE_CODE (expry) != PARM_DECL)
2068 return 0;
2071 if (! DECL_P (exprx) || ! DECL_P (expry))
2072 return 0;
2074 rtlx = DECL_RTL (exprx);
2075 rtly = DECL_RTL (expry);
2077 /* If either RTL is not a MEM, it must be a REG or CONCAT, meaning they
2078 can't overlap unless they are the same because we never reuse that part
2079 of the stack frame used for locals for spilled pseudos. */
2080 if ((!MEM_P (rtlx) || !MEM_P (rtly))
2081 && ! rtx_equal_p (rtlx, rtly))
2082 return 1;
2084 /* Get the base and offsets of both decls. If either is a register, we
2085 know both are and are the same, so use that as the base. The only
2086 we can avoid overlap is if we can deduce that they are nonoverlapping
2087 pieces of that decl, which is very rare. */
2088 basex = MEM_P (rtlx) ? XEXP (rtlx, 0) : rtlx;
2089 if (GET_CODE (basex) == PLUS && GET_CODE (XEXP (basex, 1)) == CONST_INT)
2090 offsetx = INTVAL (XEXP (basex, 1)), basex = XEXP (basex, 0);
2092 basey = MEM_P (rtly) ? XEXP (rtly, 0) : rtly;
2093 if (GET_CODE (basey) == PLUS && GET_CODE (XEXP (basey, 1)) == CONST_INT)
2094 offsety = INTVAL (XEXP (basey, 1)), basey = XEXP (basey, 0);
2096 /* If the bases are different, we know they do not overlap if both
2097 are constants or if one is a constant and the other a pointer into the
2098 stack frame. Otherwise a different base means we can't tell if they
2099 overlap or not. */
2100 if (! rtx_equal_p (basex, basey))
2101 return ((CONSTANT_P (basex) && CONSTANT_P (basey))
2102 || (CONSTANT_P (basex) && REG_P (basey)
2103 && REGNO_PTR_FRAME_P (REGNO (basey)))
2104 || (CONSTANT_P (basey) && REG_P (basex)
2105 && REGNO_PTR_FRAME_P (REGNO (basex))));
2107 sizex = (!MEM_P (rtlx) ? (int) GET_MODE_SIZE (GET_MODE (rtlx))
2108 : MEM_SIZE (rtlx) ? INTVAL (MEM_SIZE (rtlx))
2109 : -1);
2110 sizey = (!MEM_P (rtly) ? (int) GET_MODE_SIZE (GET_MODE (rtly))
2111 : MEM_SIZE (rtly) ? INTVAL (MEM_SIZE (rtly)) :
2112 -1);
2114 /* If we have an offset for either memref, it can update the values computed
2115 above. */
2116 if (moffsetx)
2117 offsetx += INTVAL (moffsetx), sizex -= INTVAL (moffsetx);
2118 if (moffsety)
2119 offsety += INTVAL (moffsety), sizey -= INTVAL (moffsety);
2121 /* If a memref has both a size and an offset, we can use the smaller size.
2122 We can't do this if the offset isn't known because we must view this
2123 memref as being anywhere inside the DECL's MEM. */
2124 if (MEM_SIZE (x) && moffsetx)
2125 sizex = INTVAL (MEM_SIZE (x));
2126 if (MEM_SIZE (y) && moffsety)
2127 sizey = INTVAL (MEM_SIZE (y));
2129 /* Put the values of the memref with the lower offset in X's values. */
2130 if (offsetx > offsety)
2132 tem = offsetx, offsetx = offsety, offsety = tem;
2133 tem = sizex, sizex = sizey, sizey = tem;
2136 /* If we don't know the size of the lower-offset value, we can't tell
2137 if they conflict. Otherwise, we do the test. */
2138 return sizex >= 0 && offsety >= offsetx + sizex;
2141 /* True dependence: X is read after store in MEM takes place. */
2144 true_dependence (rtx mem, enum machine_mode mem_mode, rtx x,
2145 int (*varies) (rtx, int))
2147 rtx x_addr, mem_addr;
2148 rtx base;
2150 if (MEM_VOLATILE_P (x) && MEM_VOLATILE_P (mem))
2151 return 1;
2153 /* (mem:BLK (scratch)) is a special mechanism to conflict with everything.
2154 This is used in epilogue deallocation functions, and in cselib. */
2155 if (GET_MODE (x) == BLKmode && GET_CODE (XEXP (x, 0)) == SCRATCH)
2156 return 1;
2157 if (GET_MODE (mem) == BLKmode && GET_CODE (XEXP (mem, 0)) == SCRATCH)
2158 return 1;
2159 if (MEM_ALIAS_SET (x) == ALIAS_SET_MEMORY_BARRIER
2160 || MEM_ALIAS_SET (mem) == ALIAS_SET_MEMORY_BARRIER)
2161 return 1;
2163 if (DIFFERENT_ALIAS_SETS_P (x, mem))
2164 return 0;
2166 /* Read-only memory is by definition never modified, and therefore can't
2167 conflict with anything. We don't expect to find read-only set on MEM,
2168 but stupid user tricks can produce them, so don't die. */
2169 if (MEM_READONLY_P (x))
2170 return 0;
2172 if (nonoverlapping_memrefs_p (mem, x))
2173 return 0;
2175 if (mem_mode == VOIDmode)
2176 mem_mode = GET_MODE (mem);
2178 x_addr = get_addr (XEXP (x, 0));
2179 mem_addr = get_addr (XEXP (mem, 0));
2181 base = find_base_term (x_addr);
2182 if (base && (GET_CODE (base) == LABEL_REF
2183 || (GET_CODE (base) == SYMBOL_REF
2184 && CONSTANT_POOL_ADDRESS_P (base))))
2185 return 0;
2187 if (! base_alias_check (x_addr, mem_addr, GET_MODE (x), mem_mode))
2188 return 0;
2190 x_addr = canon_rtx (x_addr);
2191 mem_addr = canon_rtx (mem_addr);
2193 if (! memrefs_conflict_p (GET_MODE_SIZE (mem_mode), mem_addr,
2194 SIZE_FOR_MODE (x), x_addr, 0))
2195 return 0;
2197 if (aliases_everything_p (x))
2198 return 1;
2200 /* We cannot use aliases_everything_p to test MEM, since we must look
2201 at MEM_MODE, rather than GET_MODE (MEM). */
2202 if (mem_mode == QImode || GET_CODE (mem_addr) == AND)
2203 return 1;
2205 /* In true_dependence we also allow BLKmode to alias anything. Why
2206 don't we do this in anti_dependence and output_dependence? */
2207 if (mem_mode == BLKmode || GET_MODE (x) == BLKmode)
2208 return 1;
2210 return ! fixed_scalar_and_varying_struct_p (mem, x, mem_addr, x_addr,
2211 varies);
2214 /* Canonical true dependence: X is read after store in MEM takes place.
2215 Variant of true_dependence which assumes MEM has already been
2216 canonicalized (hence we no longer do that here).
2217 The mem_addr argument has been added, since true_dependence computed
2218 this value prior to canonicalizing. */
2221 canon_true_dependence (rtx mem, enum machine_mode mem_mode, rtx mem_addr,
2222 rtx x, int (*varies) (rtx, int))
2224 rtx x_addr;
2226 if (MEM_VOLATILE_P (x) && MEM_VOLATILE_P (mem))
2227 return 1;
2229 /* (mem:BLK (scratch)) is a special mechanism to conflict with everything.
2230 This is used in epilogue deallocation functions. */
2231 if (GET_MODE (x) == BLKmode && GET_CODE (XEXP (x, 0)) == SCRATCH)
2232 return 1;
2233 if (GET_MODE (mem) == BLKmode && GET_CODE (XEXP (mem, 0)) == SCRATCH)
2234 return 1;
2235 if (MEM_ALIAS_SET (x) == ALIAS_SET_MEMORY_BARRIER
2236 || MEM_ALIAS_SET (mem) == ALIAS_SET_MEMORY_BARRIER)
2237 return 1;
2239 if (DIFFERENT_ALIAS_SETS_P (x, mem))
2240 return 0;
2242 /* Read-only memory is by definition never modified, and therefore can't
2243 conflict with anything. We don't expect to find read-only set on MEM,
2244 but stupid user tricks can produce them, so don't die. */
2245 if (MEM_READONLY_P (x))
2246 return 0;
2248 if (nonoverlapping_memrefs_p (x, mem))
2249 return 0;
2251 x_addr = get_addr (XEXP (x, 0));
2253 if (! base_alias_check (x_addr, mem_addr, GET_MODE (x), mem_mode))
2254 return 0;
2256 x_addr = canon_rtx (x_addr);
2257 if (! memrefs_conflict_p (GET_MODE_SIZE (mem_mode), mem_addr,
2258 SIZE_FOR_MODE (x), x_addr, 0))
2259 return 0;
2261 if (aliases_everything_p (x))
2262 return 1;
2264 /* We cannot use aliases_everything_p to test MEM, since we must look
2265 at MEM_MODE, rather than GET_MODE (MEM). */
2266 if (mem_mode == QImode || GET_CODE (mem_addr) == AND)
2267 return 1;
2269 /* In true_dependence we also allow BLKmode to alias anything. Why
2270 don't we do this in anti_dependence and output_dependence? */
2271 if (mem_mode == BLKmode || GET_MODE (x) == BLKmode)
2272 return 1;
2274 return ! fixed_scalar_and_varying_struct_p (mem, x, mem_addr, x_addr,
2275 varies);
2278 /* Returns nonzero if a write to X might alias a previous read from
2279 (or, if WRITEP is nonzero, a write to) MEM. */
2281 static int
2282 write_dependence_p (rtx mem, rtx x, int writep)
2284 rtx x_addr, mem_addr;
2285 rtx fixed_scalar;
2286 rtx base;
2288 if (MEM_VOLATILE_P (x) && MEM_VOLATILE_P (mem))
2289 return 1;
2291 /* (mem:BLK (scratch)) is a special mechanism to conflict with everything.
2292 This is used in epilogue deallocation functions. */
2293 if (GET_MODE (x) == BLKmode && GET_CODE (XEXP (x, 0)) == SCRATCH)
2294 return 1;
2295 if (GET_MODE (mem) == BLKmode && GET_CODE (XEXP (mem, 0)) == SCRATCH)
2296 return 1;
2297 if (MEM_ALIAS_SET (x) == ALIAS_SET_MEMORY_BARRIER
2298 || MEM_ALIAS_SET (mem) == ALIAS_SET_MEMORY_BARRIER)
2299 return 1;
2301 if (DIFFERENT_ALIAS_SETS_P (x, mem))
2302 return 0;
2304 /* A read from read-only memory can't conflict with read-write memory. */
2305 if (!writep && MEM_READONLY_P (mem))
2306 return 0;
2308 if (nonoverlapping_memrefs_p (x, mem))
2309 return 0;
2311 x_addr = get_addr (XEXP (x, 0));
2312 mem_addr = get_addr (XEXP (mem, 0));
2314 if (! writep)
2316 base = find_base_term (mem_addr);
2317 if (base && (GET_CODE (base) == LABEL_REF
2318 || (GET_CODE (base) == SYMBOL_REF
2319 && CONSTANT_POOL_ADDRESS_P (base))))
2320 return 0;
2323 if (! base_alias_check (x_addr, mem_addr, GET_MODE (x),
2324 GET_MODE (mem)))
2325 return 0;
2327 x_addr = canon_rtx (x_addr);
2328 mem_addr = canon_rtx (mem_addr);
2330 if (!memrefs_conflict_p (SIZE_FOR_MODE (mem), mem_addr,
2331 SIZE_FOR_MODE (x), x_addr, 0))
2332 return 0;
2334 fixed_scalar
2335 = fixed_scalar_and_varying_struct_p (mem, x, mem_addr, x_addr,
2336 rtx_addr_varies_p);
2338 return (!(fixed_scalar == mem && !aliases_everything_p (x))
2339 && !(fixed_scalar == x && !aliases_everything_p (mem)));
2342 /* Anti dependence: X is written after read in MEM takes place. */
2345 anti_dependence (rtx mem, rtx x)
2347 return write_dependence_p (mem, x, /*writep=*/0);
2350 /* Output dependence: X is written after store in MEM takes place. */
2353 output_dependence (rtx mem, rtx x)
2355 return write_dependence_p (mem, x, /*writep=*/1);
2359 void
2360 init_alias_once (void)
2362 int i;
2364 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
2365 /* Check whether this register can hold an incoming pointer
2366 argument. FUNCTION_ARG_REGNO_P tests outgoing register
2367 numbers, so translate if necessary due to register windows. */
2368 if (FUNCTION_ARG_REGNO_P (OUTGOING_REGNO (i))
2369 && HARD_REGNO_MODE_OK (i, Pmode))
2370 static_reg_base_value[i]
2371 = gen_rtx_ADDRESS (VOIDmode, gen_rtx_REG (Pmode, i));
2373 static_reg_base_value[STACK_POINTER_REGNUM]
2374 = gen_rtx_ADDRESS (Pmode, stack_pointer_rtx);
2375 static_reg_base_value[ARG_POINTER_REGNUM]
2376 = gen_rtx_ADDRESS (Pmode, arg_pointer_rtx);
2377 static_reg_base_value[FRAME_POINTER_REGNUM]
2378 = gen_rtx_ADDRESS (Pmode, frame_pointer_rtx);
2379 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
2380 static_reg_base_value[HARD_FRAME_POINTER_REGNUM]
2381 = gen_rtx_ADDRESS (Pmode, hard_frame_pointer_rtx);
2382 #endif
2385 /* Set MEMORY_MODIFIED when X modifies DATA (that is assumed
2386 to be memory reference. */
2387 static bool memory_modified;
2388 static void
2389 memory_modified_1 (rtx x, rtx pat ATTRIBUTE_UNUSED, void *data)
2391 if (MEM_P (x))
2393 if (anti_dependence (x, (rtx)data) || output_dependence (x, (rtx)data))
2394 memory_modified = true;
2399 /* Return true when INSN possibly modify memory contents of MEM
2400 (i.e. address can be modified). */
2401 bool
2402 memory_modified_in_insn_p (rtx mem, rtx insn)
2404 if (!INSN_P (insn))
2405 return false;
2406 memory_modified = false;
2407 note_stores (PATTERN (insn), memory_modified_1, mem);
2408 return memory_modified;
2411 /* Initialize the aliasing machinery. Initialize the REG_KNOWN_VALUE
2412 array. */
2414 void
2415 init_alias_analysis (void)
2417 unsigned int maxreg = max_reg_num ();
2418 int changed, pass;
2419 int i;
2420 unsigned int ui;
2421 rtx insn;
2423 timevar_push (TV_ALIAS_ANALYSIS);
2425 reg_known_value_size = maxreg - FIRST_PSEUDO_REGISTER;
2426 reg_known_value = ggc_calloc (reg_known_value_size, sizeof (rtx));
2427 reg_known_equiv_p = xcalloc (reg_known_value_size, sizeof (bool));
2429 /* If we have memory allocated from the previous run, use it. */
2430 if (old_reg_base_value)
2431 reg_base_value = old_reg_base_value;
2433 if (reg_base_value)
2434 VEC_truncate (rtx, reg_base_value, 0);
2436 VEC_safe_grow (rtx, gc, reg_base_value, maxreg);
2437 memset (VEC_address (rtx, reg_base_value), 0,
2438 sizeof (rtx) * VEC_length (rtx, reg_base_value));
2440 new_reg_base_value = XNEWVEC (rtx, maxreg);
2441 reg_seen = XNEWVEC (char, maxreg);
2443 /* The basic idea is that each pass through this loop will use the
2444 "constant" information from the previous pass to propagate alias
2445 information through another level of assignments.
2447 This could get expensive if the assignment chains are long. Maybe
2448 we should throttle the number of iterations, possibly based on
2449 the optimization level or flag_expensive_optimizations.
2451 We could propagate more information in the first pass by making use
2452 of REG_N_SETS to determine immediately that the alias information
2453 for a pseudo is "constant".
2455 A program with an uninitialized variable can cause an infinite loop
2456 here. Instead of doing a full dataflow analysis to detect such problems
2457 we just cap the number of iterations for the loop.
2459 The state of the arrays for the set chain in question does not matter
2460 since the program has undefined behavior. */
2462 pass = 0;
2465 /* Assume nothing will change this iteration of the loop. */
2466 changed = 0;
2468 /* We want to assign the same IDs each iteration of this loop, so
2469 start counting from zero each iteration of the loop. */
2470 unique_id = 0;
2472 /* We're at the start of the function each iteration through the
2473 loop, so we're copying arguments. */
2474 copying_arguments = true;
2476 /* Wipe the potential alias information clean for this pass. */
2477 memset (new_reg_base_value, 0, maxreg * sizeof (rtx));
2479 /* Wipe the reg_seen array clean. */
2480 memset (reg_seen, 0, maxreg);
2482 /* Mark all hard registers which may contain an address.
2483 The stack, frame and argument pointers may contain an address.
2484 An argument register which can hold a Pmode value may contain
2485 an address even if it is not in BASE_REGS.
2487 The address expression is VOIDmode for an argument and
2488 Pmode for other registers. */
2490 memcpy (new_reg_base_value, static_reg_base_value,
2491 FIRST_PSEUDO_REGISTER * sizeof (rtx));
2493 /* Walk the insns adding values to the new_reg_base_value array. */
2494 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
2496 if (INSN_P (insn))
2498 rtx note, set;
2500 #if defined (HAVE_prologue) || defined (HAVE_epilogue)
2501 /* The prologue/epilogue insns are not threaded onto the
2502 insn chain until after reload has completed. Thus,
2503 there is no sense wasting time checking if INSN is in
2504 the prologue/epilogue until after reload has completed. */
2505 if (reload_completed
2506 && prologue_epilogue_contains (insn))
2507 continue;
2508 #endif
2510 /* If this insn has a noalias note, process it, Otherwise,
2511 scan for sets. A simple set will have no side effects
2512 which could change the base value of any other register. */
2514 if (GET_CODE (PATTERN (insn)) == SET
2515 && REG_NOTES (insn) != 0
2516 && find_reg_note (insn, REG_NOALIAS, NULL_RTX))
2517 record_set (SET_DEST (PATTERN (insn)), NULL_RTX, NULL);
2518 else
2519 note_stores (PATTERN (insn), record_set, NULL);
2521 set = single_set (insn);
2523 if (set != 0
2524 && REG_P (SET_DEST (set))
2525 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
2527 unsigned int regno = REGNO (SET_DEST (set));
2528 rtx src = SET_SRC (set);
2529 rtx t;
2531 if (REG_NOTES (insn) != 0
2532 && (((note = find_reg_note (insn, REG_EQUAL, 0)) != 0
2533 && REG_N_SETS (regno) == 1)
2534 || (note = find_reg_note (insn, REG_EQUIV, NULL_RTX)) != 0)
2535 && GET_CODE (XEXP (note, 0)) != EXPR_LIST
2536 && ! rtx_varies_p (XEXP (note, 0), 1)
2537 && ! reg_overlap_mentioned_p (SET_DEST (set),
2538 XEXP (note, 0)))
2540 set_reg_known_value (regno, XEXP (note, 0));
2541 set_reg_known_equiv_p (regno,
2542 REG_NOTE_KIND (note) == REG_EQUIV);
2544 else if (REG_N_SETS (regno) == 1
2545 && GET_CODE (src) == PLUS
2546 && REG_P (XEXP (src, 0))
2547 && (t = get_reg_known_value (REGNO (XEXP (src, 0))))
2548 && GET_CODE (XEXP (src, 1)) == CONST_INT)
2550 t = plus_constant (t, INTVAL (XEXP (src, 1)));
2551 set_reg_known_value (regno, t);
2552 set_reg_known_equiv_p (regno, 0);
2554 else if (REG_N_SETS (regno) == 1
2555 && ! rtx_varies_p (src, 1))
2557 set_reg_known_value (regno, src);
2558 set_reg_known_equiv_p (regno, 0);
2562 else if (NOTE_P (insn)
2563 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_FUNCTION_BEG)
2564 copying_arguments = false;
2567 /* Now propagate values from new_reg_base_value to reg_base_value. */
2568 gcc_assert (maxreg == (unsigned int) max_reg_num());
2570 for (ui = 0; ui < maxreg; ui++)
2572 if (new_reg_base_value[ui]
2573 && new_reg_base_value[ui] != VEC_index (rtx, reg_base_value, ui)
2574 && ! rtx_equal_p (new_reg_base_value[ui],
2575 VEC_index (rtx, reg_base_value, ui)))
2577 VEC_replace (rtx, reg_base_value, ui, new_reg_base_value[ui]);
2578 changed = 1;
2582 while (changed && ++pass < MAX_ALIAS_LOOP_PASSES);
2584 /* Fill in the remaining entries. */
2585 for (i = 0; i < (int)reg_known_value_size; i++)
2586 if (reg_known_value[i] == 0)
2587 reg_known_value[i] = regno_reg_rtx[i + FIRST_PSEUDO_REGISTER];
2589 /* Clean up. */
2590 free (new_reg_base_value);
2591 new_reg_base_value = 0;
2592 free (reg_seen);
2593 reg_seen = 0;
2594 timevar_pop (TV_ALIAS_ANALYSIS);
2597 void
2598 end_alias_analysis (void)
2600 old_reg_base_value = reg_base_value;
2601 ggc_free (reg_known_value);
2602 reg_known_value = 0;
2603 reg_known_value_size = 0;
2604 free (reg_known_equiv_p);
2605 reg_known_equiv_p = 0;
2608 #include "gt-alias.h"