2001-08-28 Alexandre Petit-Bianco <apbianco@redhat.com>
[official-gcc.git] / gcc / cselib.c
blob6498d869b16584900909457f821ed7f7484f4d16
1 /* Common subexpression elimination library for GNU compiler.
2 Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
3 1999, 2000, 2001 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
22 #include "config.h"
23 #include "system.h"
25 #include "rtl.h"
26 #include "tm_p.h"
27 #include "regs.h"
28 #include "hard-reg-set.h"
29 #include "flags.h"
30 #include "real.h"
31 #include "insn-config.h"
32 #include "recog.h"
33 #include "function.h"
34 #include "expr.h"
35 #include "toplev.h"
36 #include "output.h"
37 #include "ggc.h"
38 #include "obstack.h"
39 #include "hashtab.h"
40 #include "cselib.h"
42 static int entry_and_rtx_equal_p PARAMS ((const void *, const void *));
43 static unsigned int get_value_hash PARAMS ((const void *));
44 static struct elt_list *new_elt_list PARAMS ((struct elt_list *,
45 cselib_val *));
46 static struct elt_loc_list *new_elt_loc_list PARAMS ((struct elt_loc_list *,
47 rtx));
48 static void unchain_one_value PARAMS ((cselib_val *));
49 static void unchain_one_elt_list PARAMS ((struct elt_list **));
50 static void unchain_one_elt_loc_list PARAMS ((struct elt_loc_list **));
51 static void clear_table PARAMS ((int));
52 static int discard_useless_locs PARAMS ((void **, void *));
53 static int discard_useless_values PARAMS ((void **, void *));
54 static void remove_useless_values PARAMS ((void));
55 static rtx wrap_constant PARAMS ((enum machine_mode, rtx));
56 static unsigned int hash_rtx PARAMS ((rtx, enum machine_mode, int));
57 static cselib_val *new_cselib_val PARAMS ((unsigned int,
58 enum machine_mode));
59 static void add_mem_for_addr PARAMS ((cselib_val *, cselib_val *,
60 rtx));
61 static cselib_val *cselib_lookup_mem PARAMS ((rtx, int));
62 static void cselib_invalidate_regno PARAMS ((unsigned int,
63 enum machine_mode));
64 static int cselib_mem_conflict_p PARAMS ((rtx, rtx));
65 static int cselib_invalidate_mem_1 PARAMS ((void **, void *));
66 static void cselib_invalidate_mem PARAMS ((rtx));
67 static void cselib_invalidate_rtx PARAMS ((rtx, rtx, void *));
68 static void cselib_record_set PARAMS ((rtx, cselib_val *,
69 cselib_val *));
70 static void cselib_record_sets PARAMS ((rtx));
72 /* There are three ways in which cselib can look up an rtx:
73 - for a REG, the reg_values table (which is indexed by regno) is used
74 - for a MEM, we recursively look up its address and then follow the
75 addr_list of that value
76 - for everything else, we compute a hash value and go through the hash
77 table. Since different rtx's can still have the same hash value,
78 this involves walking the table entries for a given value and comparing
79 the locations of the entries with the rtx we are looking up. */
81 /* A table that enables us to look up elts by their value. */
82 static htab_t hash_table;
84 /* This is a global so we don't have to pass this through every function.
85 It is used in new_elt_loc_list to set SETTING_INSN. */
86 static rtx cselib_current_insn;
88 /* Every new unknown value gets a unique number. */
89 static unsigned int next_unknown_value;
91 /* The number of registers we had when the varrays were last resized. */
92 static unsigned int cselib_nregs;
94 /* Count values without known locations. Whenever this grows too big, we
95 remove these useless values from the table. */
96 static int n_useless_values;
98 /* Number of useless values before we remove them from the hash table. */
99 #define MAX_USELESS_VALUES 32
101 /* This table maps from register number to values. It does not contain
102 pointers to cselib_val structures, but rather elt_lists. The purpose is
103 to be able to refer to the same register in different modes. */
104 static varray_type reg_values;
105 #define REG_VALUES(I) VARRAY_ELT_LIST (reg_values, (I))
107 /* Here the set of indices I with REG_VALUES(I) != 0 is saved. This is used
108 in clear_table() for fast emptying. */
109 static varray_type used_regs;
111 /* We pass this to cselib_invalidate_mem to invalidate all of
112 memory for a non-const call instruction. */
113 static rtx callmem;
115 /* Memory for our structures is allocated from this obstack. */
116 static struct obstack cselib_obstack;
118 /* Used to quickly free all memory. */
119 static char *cselib_startobj;
121 /* Caches for unused structures. */
122 static cselib_val *empty_vals;
123 static struct elt_list *empty_elt_lists;
124 static struct elt_loc_list *empty_elt_loc_lists;
126 /* Set by discard_useless_locs if it deleted the last location of any
127 value. */
128 static int values_became_useless;
131 /* Allocate a struct elt_list and fill in its two elements with the
132 arguments. */
134 static struct elt_list *
135 new_elt_list (next, elt)
136 struct elt_list *next;
137 cselib_val *elt;
139 struct elt_list *el = empty_elt_lists;
141 if (el)
142 empty_elt_lists = el->next;
143 else
144 el = (struct elt_list *) obstack_alloc (&cselib_obstack,
145 sizeof (struct elt_list));
146 el->next = next;
147 el->elt = elt;
148 return el;
151 /* Allocate a struct elt_loc_list and fill in its two elements with the
152 arguments. */
154 static struct elt_loc_list *
155 new_elt_loc_list (next, loc)
156 struct elt_loc_list *next;
157 rtx loc;
159 struct elt_loc_list *el = empty_elt_loc_lists;
161 if (el)
162 empty_elt_loc_lists = el->next;
163 else
164 el = (struct elt_loc_list *) obstack_alloc (&cselib_obstack,
165 sizeof (struct elt_loc_list));
166 el->next = next;
167 el->loc = loc;
168 el->setting_insn = cselib_current_insn;
169 return el;
172 /* The elt_list at *PL is no longer needed. Unchain it and free its
173 storage. */
175 static void
176 unchain_one_elt_list (pl)
177 struct elt_list **pl;
179 struct elt_list *l = *pl;
181 *pl = l->next;
182 l->next = empty_elt_lists;
183 empty_elt_lists = l;
186 /* Likewise for elt_loc_lists. */
188 static void
189 unchain_one_elt_loc_list (pl)
190 struct elt_loc_list **pl;
192 struct elt_loc_list *l = *pl;
194 *pl = l->next;
195 l->next = empty_elt_loc_lists;
196 empty_elt_loc_lists = l;
199 /* Likewise for cselib_vals. This also frees the addr_list associated with
200 V. */
202 static void
203 unchain_one_value (v)
204 cselib_val *v;
206 while (v->addr_list)
207 unchain_one_elt_list (&v->addr_list);
209 v->u.next_free = empty_vals;
210 empty_vals = v;
213 /* Remove all entries from the hash table. Also used during
214 initialization. If CLEAR_ALL isn't set, then only clear the entries
215 which are known to have been used. */
217 static void
218 clear_table (clear_all)
219 int clear_all;
221 unsigned int i;
223 if (clear_all)
224 for (i = 0; i < cselib_nregs; i++)
225 REG_VALUES (i) = 0;
226 else
227 for (i = 0; i < VARRAY_ACTIVE_SIZE (used_regs); i++)
228 REG_VALUES (VARRAY_UINT (used_regs, i)) = 0;
230 VARRAY_POP_ALL (used_regs);
232 htab_empty (hash_table);
233 obstack_free (&cselib_obstack, cselib_startobj);
235 empty_vals = 0;
236 empty_elt_lists = 0;
237 empty_elt_loc_lists = 0;
238 n_useless_values = 0;
240 next_unknown_value = 0;
243 /* The equality test for our hash table. The first argument ENTRY is a table
244 element (i.e. a cselib_val), while the second arg X is an rtx. We know
245 that all callers of htab_find_slot_with_hash will wrap CONST_INTs into a
246 CONST of an appropriate mode. */
248 static int
249 entry_and_rtx_equal_p (entry, x_arg)
250 const void *entry, *x_arg;
252 struct elt_loc_list *l;
253 const cselib_val *v = (const cselib_val *) entry;
254 rtx x = (rtx) x_arg;
255 enum machine_mode mode = GET_MODE (x);
257 if (GET_CODE (x) == CONST_INT
258 || (mode == VOIDmode && GET_CODE (x) == CONST_DOUBLE))
259 abort ();
260 if (mode != GET_MODE (v->u.val_rtx))
261 return 0;
263 /* Unwrap X if necessary. */
264 if (GET_CODE (x) == CONST
265 && (GET_CODE (XEXP (x, 0)) == CONST_INT
266 || GET_CODE (XEXP (x, 0)) == CONST_DOUBLE))
267 x = XEXP (x, 0);
269 /* We don't guarantee that distinct rtx's have different hash values,
270 so we need to do a comparison. */
271 for (l = v->locs; l; l = l->next)
272 if (rtx_equal_for_cselib_p (l->loc, x))
273 return 1;
275 return 0;
278 /* The hash function for our hash table. The value is always computed with
279 hash_rtx when adding an element; this function just extracts the hash
280 value from a cselib_val structure. */
282 static unsigned int
283 get_value_hash (entry)
284 const void *entry;
286 const cselib_val *v = (const cselib_val *) entry;
287 return v->value;
290 /* Return true if X contains a VALUE rtx. If ONLY_USELESS is set, we
291 only return true for values which point to a cselib_val whose value
292 element has been set to zero, which implies the cselib_val will be
293 removed. */
296 references_value_p (x, only_useless)
297 rtx x;
298 int only_useless;
300 enum rtx_code code = GET_CODE (x);
301 const char *fmt = GET_RTX_FORMAT (code);
302 int i, j;
304 if (GET_CODE (x) == VALUE
305 && (! only_useless || CSELIB_VAL_PTR (x)->locs == 0))
306 return 1;
308 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
310 if (fmt[i] == 'e' && references_value_p (XEXP (x, i), only_useless))
311 return 1;
312 else if (fmt[i] == 'E')
313 for (j = 0; j < XVECLEN (x, i); j++)
314 if (references_value_p (XVECEXP (x, i, j), only_useless))
315 return 1;
318 return 0;
321 /* For all locations found in X, delete locations that reference useless
322 values (i.e. values without any location). Called through
323 htab_traverse. */
325 static int
326 discard_useless_locs (x, info)
327 void **x;
328 void *info ATTRIBUTE_UNUSED;
330 cselib_val *v = (cselib_val *)*x;
331 struct elt_loc_list **p = &v->locs;
332 int had_locs = v->locs != 0;
334 while (*p)
336 if (references_value_p ((*p)->loc, 1))
337 unchain_one_elt_loc_list (p);
338 else
339 p = &(*p)->next;
342 if (had_locs && v->locs == 0)
344 n_useless_values++;
345 values_became_useless = 1;
347 return 1;
350 /* If X is a value with no locations, remove it from the hashtable. */
352 static int
353 discard_useless_values (x, info)
354 void **x;
355 void *info ATTRIBUTE_UNUSED;
357 cselib_val *v = (cselib_val *)*x;
359 if (v->locs == 0)
361 htab_clear_slot (hash_table, x);
362 unchain_one_value (v);
363 n_useless_values--;
366 return 1;
369 /* Clean out useless values (i.e. those which no longer have locations
370 associated with them) from the hash table. */
372 static void
373 remove_useless_values ()
375 /* First pass: eliminate locations that reference the value. That in
376 turn can make more values useless. */
379 values_became_useless = 0;
380 htab_traverse (hash_table, discard_useless_locs, 0);
382 while (values_became_useless);
384 /* Second pass: actually remove the values. */
385 htab_traverse (hash_table, discard_useless_values, 0);
387 if (n_useless_values != 0)
388 abort ();
391 /* Return nonzero if we can prove that X and Y contain the same value, taking
392 our gathered information into account. */
395 rtx_equal_for_cselib_p (x, y)
396 rtx x, y;
398 enum rtx_code code;
399 const char *fmt;
400 int i;
402 if (GET_CODE (x) == REG || GET_CODE (x) == MEM)
404 cselib_val *e = cselib_lookup (x, GET_MODE (x), 0);
406 if (e)
407 x = e->u.val_rtx;
410 if (GET_CODE (y) == REG || GET_CODE (y) == MEM)
412 cselib_val *e = cselib_lookup (y, GET_MODE (y), 0);
414 if (e)
415 y = e->u.val_rtx;
418 if (x == y)
419 return 1;
421 if (GET_CODE (x) == VALUE && GET_CODE (y) == VALUE)
422 return CSELIB_VAL_PTR (x) == CSELIB_VAL_PTR (y);
424 if (GET_CODE (x) == VALUE)
426 cselib_val *e = CSELIB_VAL_PTR (x);
427 struct elt_loc_list *l;
429 for (l = e->locs; l; l = l->next)
431 rtx t = l->loc;
433 /* Avoid infinite recursion. */
434 if (GET_CODE (t) == REG || GET_CODE (t) == MEM)
435 continue;
436 else if (rtx_equal_for_cselib_p (t, y))
437 return 1;
440 return 0;
443 if (GET_CODE (y) == VALUE)
445 cselib_val *e = CSELIB_VAL_PTR (y);
446 struct elt_loc_list *l;
448 for (l = e->locs; l; l = l->next)
450 rtx t = l->loc;
452 if (GET_CODE (t) == REG || GET_CODE (t) == MEM)
453 continue;
454 else if (rtx_equal_for_cselib_p (x, t))
455 return 1;
458 return 0;
461 if (GET_CODE (x) != GET_CODE (y) || GET_MODE (x) != GET_MODE (y))
462 return 0;
464 /* This won't be handled correctly by the code below. */
465 if (GET_CODE (x) == LABEL_REF)
466 return XEXP (x, 0) == XEXP (y, 0);
468 code = GET_CODE (x);
469 fmt = GET_RTX_FORMAT (code);
471 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
473 int j;
475 switch (fmt[i])
477 case 'w':
478 if (XWINT (x, i) != XWINT (y, i))
479 return 0;
480 break;
482 case 'n':
483 case 'i':
484 if (XINT (x, i) != XINT (y, i))
485 return 0;
486 break;
488 case 'V':
489 case 'E':
490 /* Two vectors must have the same length. */
491 if (XVECLEN (x, i) != XVECLEN (y, i))
492 return 0;
494 /* And the corresponding elements must match. */
495 for (j = 0; j < XVECLEN (x, i); j++)
496 if (! rtx_equal_for_cselib_p (XVECEXP (x, i, j),
497 XVECEXP (y, i, j)))
498 return 0;
499 break;
501 case 'e':
502 if (! rtx_equal_for_cselib_p (XEXP (x, i), XEXP (y, i)))
503 return 0;
504 break;
506 case 'S':
507 case 's':
508 if (strcmp (XSTR (x, i), XSTR (y, i)))
509 return 0;
510 break;
512 case 'u':
513 /* These are just backpointers, so they don't matter. */
514 break;
516 case '0':
517 case 't':
518 break;
520 /* It is believed that rtx's at this level will never
521 contain anything but integers and other rtx's,
522 except for within LABEL_REFs and SYMBOL_REFs. */
523 default:
524 abort ();
527 return 1;
530 /* We need to pass down the mode of constants through the hash table
531 functions. For that purpose, wrap them in a CONST of the appropriate
532 mode. */
533 static rtx
534 wrap_constant (mode, x)
535 enum machine_mode mode;
536 rtx x;
538 if (GET_CODE (x) != CONST_INT
539 && (GET_CODE (x) != CONST_DOUBLE || GET_MODE (x) != VOIDmode))
540 return x;
541 if (mode == VOIDmode)
542 abort ();
543 return gen_rtx_CONST (mode, x);
546 /* Hash an rtx. Return 0 if we couldn't hash the rtx.
547 For registers and memory locations, we look up their cselib_val structure
548 and return its VALUE element.
549 Possible reasons for return 0 are: the object is volatile, or we couldn't
550 find a register or memory location in the table and CREATE is zero. If
551 CREATE is nonzero, table elts are created for regs and mem.
552 MODE is used in hashing for CONST_INTs only;
553 otherwise the mode of X is used. */
555 static unsigned int
556 hash_rtx (x, mode, create)
557 rtx x;
558 enum machine_mode mode;
559 int create;
561 cselib_val *e;
562 int i, j;
563 enum rtx_code code;
564 const char *fmt;
565 unsigned int hash = 0;
567 code = GET_CODE (x);
568 hash += (unsigned) code + (unsigned) GET_MODE (x);
570 switch (code)
572 case MEM:
573 case REG:
574 e = cselib_lookup (x, GET_MODE (x), create);
575 if (! e)
576 return 0;
578 return e->value;
580 case CONST_INT:
581 hash += ((unsigned) CONST_INT << 7) + (unsigned) mode + INTVAL (x);
582 return hash ? hash : (unsigned int) CONST_INT;
584 case CONST_DOUBLE:
585 /* This is like the general case, except that it only counts
586 the integers representing the constant. */
587 hash += (unsigned) code + (unsigned) GET_MODE (x);
588 if (GET_MODE (x) != VOIDmode)
589 for (i = 2; i < GET_RTX_LENGTH (CONST_DOUBLE); i++)
590 hash += XWINT (x, i);
591 else
592 hash += ((unsigned) CONST_DOUBLE_LOW (x)
593 + (unsigned) CONST_DOUBLE_HIGH (x));
594 return hash ? hash : (unsigned int) CONST_DOUBLE;
596 /* Assume there is only one rtx object for any given label. */
597 case LABEL_REF:
598 hash
599 += ((unsigned) LABEL_REF << 7) + (unsigned long) XEXP (x, 0);
600 return hash ? hash : (unsigned int) LABEL_REF;
602 case SYMBOL_REF:
603 hash
604 += ((unsigned) SYMBOL_REF << 7) + (unsigned long) XSTR (x, 0);
605 return hash ? hash : (unsigned int) SYMBOL_REF;
607 case PRE_DEC:
608 case PRE_INC:
609 case POST_DEC:
610 case POST_INC:
611 case POST_MODIFY:
612 case PRE_MODIFY:
613 case PC:
614 case CC0:
615 case CALL:
616 case UNSPEC_VOLATILE:
617 return 0;
619 case ASM_OPERANDS:
620 if (MEM_VOLATILE_P (x))
621 return 0;
623 break;
625 default:
626 break;
629 i = GET_RTX_LENGTH (code) - 1;
630 fmt = GET_RTX_FORMAT (code);
631 for (; i >= 0; i--)
633 if (fmt[i] == 'e')
635 rtx tem = XEXP (x, i);
636 unsigned int tem_hash = hash_rtx (tem, 0, create);
638 if (tem_hash == 0)
639 return 0;
641 hash += tem_hash;
643 else if (fmt[i] == 'E')
644 for (j = 0; j < XVECLEN (x, i); j++)
646 unsigned int tem_hash = hash_rtx (XVECEXP (x, i, j), 0, create);
648 if (tem_hash == 0)
649 return 0;
651 hash += tem_hash;
653 else if (fmt[i] == 's')
655 const unsigned char *p = (const unsigned char *) XSTR (x, i);
657 if (p)
658 while (*p)
659 hash += *p++;
661 else if (fmt[i] == 'i')
662 hash += XINT (x, i);
663 else if (fmt[i] == '0' || fmt[i] == 't')
664 /* unused */;
665 else
666 abort ();
669 return hash ? hash : 1 + (unsigned int) GET_CODE (x);
672 /* Create a new value structure for VALUE and initialize it. The mode of the
673 value is MODE. */
675 static cselib_val *
676 new_cselib_val (value, mode)
677 unsigned int value;
678 enum machine_mode mode;
680 cselib_val *e = empty_vals;
682 if (e)
683 empty_vals = e->u.next_free;
684 else
685 e = (cselib_val *) obstack_alloc (&cselib_obstack, sizeof (cselib_val));
687 if (value == 0)
688 abort ();
690 e->value = value;
691 e->u.val_rtx = gen_rtx_VALUE (mode);
692 CSELIB_VAL_PTR (e->u.val_rtx) = e;
693 e->addr_list = 0;
694 e->locs = 0;
695 return e;
698 /* ADDR_ELT is a value that is used as address. MEM_ELT is the value that
699 contains the data at this address. X is a MEM that represents the
700 value. Update the two value structures to represent this situation. */
702 static void
703 add_mem_for_addr (addr_elt, mem_elt, x)
704 cselib_val *addr_elt, *mem_elt;
705 rtx x;
707 struct elt_loc_list *l;
709 /* Avoid duplicates. */
710 for (l = mem_elt->locs; l; l = l->next)
711 if (GET_CODE (l->loc) == MEM
712 && CSELIB_VAL_PTR (XEXP (l->loc, 0)) == addr_elt)
713 return;
715 addr_elt->addr_list = new_elt_list (addr_elt->addr_list, mem_elt);
716 mem_elt->locs
717 = new_elt_loc_list (mem_elt->locs,
718 replace_equiv_address_nv (x, addr_elt->u.val_rtx));
721 /* Subroutine of cselib_lookup. Return a value for X, which is a MEM rtx.
722 If CREATE, make a new one if we haven't seen it before. */
724 static cselib_val *
725 cselib_lookup_mem (x, create)
726 rtx x;
727 int create;
729 enum machine_mode mode = GET_MODE (x);
730 void **slot;
731 cselib_val *addr;
732 cselib_val *mem_elt;
733 struct elt_list *l;
735 if (MEM_VOLATILE_P (x) || mode == BLKmode
736 || (FLOAT_MODE_P (mode) && flag_float_store))
737 return 0;
739 /* Look up the value for the address. */
740 addr = cselib_lookup (XEXP (x, 0), mode, create);
741 if (! addr)
742 return 0;
744 /* Find a value that describes a value of our mode at that address. */
745 for (l = addr->addr_list; l; l = l->next)
746 if (GET_MODE (l->elt->u.val_rtx) == mode)
747 return l->elt;
749 if (! create)
750 return 0;
752 mem_elt = new_cselib_val (++next_unknown_value, mode);
753 add_mem_for_addr (addr, mem_elt, x);
754 slot = htab_find_slot_with_hash (hash_table, wrap_constant (mode, x),
755 mem_elt->value, INSERT);
756 *slot = mem_elt;
757 return mem_elt;
760 /* Walk rtx X and replace all occurrences of REG and MEM subexpressions
761 with VALUE expressions. This way, it becomes independent of changes
762 to registers and memory.
763 X isn't actually modified; if modifications are needed, new rtl is
764 allocated. However, the return value can share rtl with X. */
767 cselib_subst_to_values (x)
768 rtx x;
770 enum rtx_code code = GET_CODE (x);
771 const char *fmt = GET_RTX_FORMAT (code);
772 cselib_val *e;
773 struct elt_list *l;
774 rtx copy = x;
775 int i;
777 switch (code)
779 case REG:
780 for (l = REG_VALUES (REGNO (x)); l; l = l->next)
781 if (GET_MODE (l->elt->u.val_rtx) == GET_MODE (x))
782 return l->elt->u.val_rtx;
784 abort ();
786 case MEM:
787 e = cselib_lookup_mem (x, 0);
788 if (! e)
790 /* This happens for autoincrements. Assign a value that doesn't
791 match any other. */
792 e = new_cselib_val (++next_unknown_value, GET_MODE (x));
794 return e->u.val_rtx;
796 /* CONST_DOUBLEs must be special-cased here so that we won't try to
797 look up the CONST_DOUBLE_MEM inside. */
798 case CONST_DOUBLE:
799 case CONST_INT:
800 return x;
802 case POST_INC:
803 case PRE_INC:
804 case POST_DEC:
805 case PRE_DEC:
806 case POST_MODIFY:
807 case PRE_MODIFY:
808 e = new_cselib_val (++next_unknown_value, GET_MODE (x));
809 return e->u.val_rtx;
811 default:
812 break;
815 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
817 if (fmt[i] == 'e')
819 rtx t = cselib_subst_to_values (XEXP (x, i));
821 if (t != XEXP (x, i) && x == copy)
822 copy = shallow_copy_rtx (x);
824 XEXP (copy, i) = t;
826 else if (fmt[i] == 'E')
828 int j, k;
830 for (j = 0; j < XVECLEN (x, i); j++)
832 rtx t = cselib_subst_to_values (XVECEXP (x, i, j));
834 if (t != XVECEXP (x, i, j) && XVEC (x, i) == XVEC (copy, i))
836 if (x == copy)
837 copy = shallow_copy_rtx (x);
839 XVEC (copy, i) = rtvec_alloc (XVECLEN (x, i));
840 for (k = 0; k < j; k++)
841 XVECEXP (copy, i, k) = XVECEXP (x, i, k);
844 XVECEXP (copy, i, j) = t;
849 return copy;
852 /* Look up the rtl expression X in our tables and return the value it has.
853 If CREATE is zero, we return NULL if we don't know the value. Otherwise,
854 we create a new one if possible, using mode MODE if X doesn't have a mode
855 (i.e. because it's a constant). */
857 cselib_val *
858 cselib_lookup (x, mode, create)
859 rtx x;
860 enum machine_mode mode;
861 int create;
863 void **slot;
864 cselib_val *e;
865 unsigned int hashval;
867 if (GET_MODE (x) != VOIDmode)
868 mode = GET_MODE (x);
870 if (GET_CODE (x) == VALUE)
871 return CSELIB_VAL_PTR (x);
873 if (GET_CODE (x) == REG)
875 struct elt_list *l;
876 unsigned int i = REGNO (x);
878 for (l = REG_VALUES (i); l; l = l->next)
879 if (mode == GET_MODE (l->elt->u.val_rtx))
880 return l->elt;
882 if (! create)
883 return 0;
885 e = new_cselib_val (++next_unknown_value, GET_MODE (x));
886 e->locs = new_elt_loc_list (e->locs, x);
887 if (REG_VALUES (i) == 0)
888 VARRAY_PUSH_UINT (used_regs, i);
889 REG_VALUES (i) = new_elt_list (REG_VALUES (i), e);
890 slot = htab_find_slot_with_hash (hash_table, x, e->value, INSERT);
891 *slot = e;
892 return e;
895 if (GET_CODE (x) == MEM)
896 return cselib_lookup_mem (x, create);
898 hashval = hash_rtx (x, mode, create);
899 /* Can't even create if hashing is not possible. */
900 if (! hashval)
901 return 0;
903 slot = htab_find_slot_with_hash (hash_table, wrap_constant (mode, x),
904 hashval, create ? INSERT : NO_INSERT);
905 if (slot == 0)
906 return 0;
908 e = (cselib_val *) *slot;
909 if (e)
910 return e;
912 e = new_cselib_val (hashval, mode);
914 /* We have to fill the slot before calling cselib_subst_to_values:
915 the hash table is inconsistent until we do so, and
916 cselib_subst_to_values will need to do lookups. */
917 *slot = (void *) e;
918 e->locs = new_elt_loc_list (e->locs, cselib_subst_to_values (x));
919 return e;
922 /* Invalidate any entries in reg_values that overlap REGNO. This is called
923 if REGNO is changing. MODE is the mode of the assignment to REGNO, which
924 is used to determine how many hard registers are being changed. If MODE
925 is VOIDmode, then only REGNO is being changed; this is used when
926 invalidating call clobbered registers across a call. */
928 static void
929 cselib_invalidate_regno (regno, mode)
930 unsigned int regno;
931 enum machine_mode mode;
933 unsigned int endregno;
934 unsigned int i;
936 /* If we see pseudos after reload, something is _wrong_. */
937 if (reload_completed && regno >= FIRST_PSEUDO_REGISTER
938 && reg_renumber[regno] >= 0)
939 abort ();
941 /* Determine the range of registers that must be invalidated. For
942 pseudos, only REGNO is affected. For hard regs, we must take MODE
943 into account, and we must also invalidate lower register numbers
944 if they contain values that overlap REGNO. */
945 endregno = regno + 1;
946 if (regno < FIRST_PSEUDO_REGISTER && mode != VOIDmode)
947 endregno = regno + HARD_REGNO_NREGS (regno, mode);
949 for (i = 0; i < endregno; i++)
951 struct elt_list **l = &REG_VALUES (i);
953 /* Go through all known values for this reg; if it overlaps the range
954 we're invalidating, remove the value. */
955 while (*l)
957 cselib_val *v = (*l)->elt;
958 struct elt_loc_list **p;
959 unsigned int this_last = i;
961 if (i < FIRST_PSEUDO_REGISTER)
962 this_last += HARD_REGNO_NREGS (i, GET_MODE (v->u.val_rtx)) - 1;
964 if (this_last < regno)
966 l = &(*l)->next;
967 continue;
970 /* We have an overlap. */
971 unchain_one_elt_list (l);
973 /* Now, we clear the mapping from value to reg. It must exist, so
974 this code will crash intentionally if it doesn't. */
975 for (p = &v->locs; ; p = &(*p)->next)
977 rtx x = (*p)->loc;
979 if (GET_CODE (x) == REG && REGNO (x) == i)
981 unchain_one_elt_loc_list (p);
982 break;
985 if (v->locs == 0)
986 n_useless_values++;
991 /* The memory at address MEM_BASE is being changed.
992 Return whether this change will invalidate VAL. */
994 static int
995 cselib_mem_conflict_p (mem_base, val)
996 rtx mem_base;
997 rtx val;
999 enum rtx_code code;
1000 const char *fmt;
1001 int i, j;
1003 code = GET_CODE (val);
1004 switch (code)
1006 /* Get rid of a few simple cases quickly. */
1007 case REG:
1008 case PC:
1009 case CC0:
1010 case SCRATCH:
1011 case CONST:
1012 case CONST_INT:
1013 case CONST_DOUBLE:
1014 case SYMBOL_REF:
1015 case LABEL_REF:
1016 return 0;
1018 case MEM:
1019 if (GET_MODE (mem_base) == BLKmode
1020 || GET_MODE (val) == BLKmode
1021 || anti_dependence (val, mem_base))
1022 return 1;
1024 /* The address may contain nested MEMs. */
1025 break;
1027 default:
1028 break;
1031 fmt = GET_RTX_FORMAT (code);
1032 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1034 if (fmt[i] == 'e')
1036 if (cselib_mem_conflict_p (mem_base, XEXP (val, i)))
1037 return 1;
1039 else if (fmt[i] == 'E')
1040 for (j = 0; j < XVECLEN (val, i); j++)
1041 if (cselib_mem_conflict_p (mem_base, XVECEXP (val, i, j)))
1042 return 1;
1045 return 0;
1048 /* For the value found in SLOT, walk its locations to determine if any overlap
1049 INFO (which is a MEM rtx). */
1051 static int
1052 cselib_invalidate_mem_1 (slot, info)
1053 void **slot;
1054 void *info;
1056 cselib_val *v = (cselib_val *) *slot;
1057 rtx mem_rtx = (rtx) info;
1058 struct elt_loc_list **p = &v->locs;
1059 int had_locs = v->locs != 0;
1061 while (*p)
1063 rtx x = (*p)->loc;
1064 cselib_val *addr;
1065 struct elt_list **mem_chain;
1067 /* MEMs may occur in locations only at the top level; below
1068 that every MEM or REG is substituted by its VALUE. */
1069 if (GET_CODE (x) != MEM
1070 || ! cselib_mem_conflict_p (mem_rtx, x))
1072 p = &(*p)->next;
1073 continue;
1076 /* This one overlaps. */
1077 /* We must have a mapping from this MEM's address to the
1078 value (E). Remove that, too. */
1079 addr = cselib_lookup (XEXP (x, 0), VOIDmode, 0);
1080 mem_chain = &addr->addr_list;
1081 for (;;)
1083 if ((*mem_chain)->elt == v)
1085 unchain_one_elt_list (mem_chain);
1086 break;
1089 mem_chain = &(*mem_chain)->next;
1092 unchain_one_elt_loc_list (p);
1095 if (had_locs && v->locs == 0)
1096 n_useless_values++;
1098 return 1;
1101 /* Invalidate any locations in the table which are changed because of a
1102 store to MEM_RTX. If this is called because of a non-const call
1103 instruction, MEM_RTX is (mem:BLK const0_rtx). */
1105 static void
1106 cselib_invalidate_mem (mem_rtx)
1107 rtx mem_rtx;
1109 htab_traverse (hash_table, cselib_invalidate_mem_1, mem_rtx);
1112 /* Invalidate DEST, which is being assigned to or clobbered. The second and
1113 the third parameter exist so that this function can be passed to
1114 note_stores; they are ignored. */
1116 static void
1117 cselib_invalidate_rtx (dest, ignore, data)
1118 rtx dest;
1119 rtx ignore ATTRIBUTE_UNUSED;
1120 void *data ATTRIBUTE_UNUSED;
1122 while (GET_CODE (dest) == STRICT_LOW_PART || GET_CODE (dest) == SIGN_EXTRACT
1123 || GET_CODE (dest) == ZERO_EXTRACT || GET_CODE (dest) == SUBREG)
1124 dest = XEXP (dest, 0);
1126 if (GET_CODE (dest) == REG)
1127 cselib_invalidate_regno (REGNO (dest), GET_MODE (dest));
1128 else if (GET_CODE (dest) == MEM)
1129 cselib_invalidate_mem (dest);
1131 /* Some machines don't define AUTO_INC_DEC, but they still use push
1132 instructions. We need to catch that case here in order to
1133 invalidate the stack pointer correctly. Note that invalidating
1134 the stack pointer is different from invalidating DEST. */
1135 if (push_operand (dest, GET_MODE (dest)))
1136 cselib_invalidate_rtx (stack_pointer_rtx, NULL_RTX, NULL);
1139 /* Record the result of a SET instruction. DEST is being set; the source
1140 contains the value described by SRC_ELT. If DEST is a MEM, DEST_ADDR_ELT
1141 describes its address. */
1143 static void
1144 cselib_record_set (dest, src_elt, dest_addr_elt)
1145 rtx dest;
1146 cselib_val *src_elt, *dest_addr_elt;
1148 int dreg = GET_CODE (dest) == REG ? (int) REGNO (dest) : -1;
1150 if (src_elt == 0 || side_effects_p (dest))
1151 return;
1153 if (dreg >= 0)
1155 if (REG_VALUES (dreg) == 0)
1156 VARRAY_PUSH_UINT (used_regs, dreg);
1158 REG_VALUES (dreg) = new_elt_list (REG_VALUES (dreg), src_elt);
1159 if (src_elt->locs == 0)
1160 n_useless_values--;
1161 src_elt->locs = new_elt_loc_list (src_elt->locs, dest);
1163 else if (GET_CODE (dest) == MEM && dest_addr_elt != 0)
1165 if (src_elt->locs == 0)
1166 n_useless_values--;
1167 add_mem_for_addr (dest_addr_elt, src_elt, dest);
1171 /* Describe a single set that is part of an insn. */
1172 struct set
1174 rtx src;
1175 rtx dest;
1176 cselib_val *src_elt;
1177 cselib_val *dest_addr_elt;
1180 /* There is no good way to determine how many elements there can be
1181 in a PARALLEL. Since it's fairly cheap, use a really large number. */
1182 #define MAX_SETS (FIRST_PSEUDO_REGISTER * 2)
1184 /* Record the effects of any sets in INSN. */
1185 static void
1186 cselib_record_sets (insn)
1187 rtx insn;
1189 int n_sets = 0;
1190 int i;
1191 struct set sets[MAX_SETS];
1192 rtx body = PATTERN (insn);
1193 rtx cond = 0;
1195 body = PATTERN (insn);
1196 if (GET_CODE (body) == COND_EXEC)
1198 cond = COND_EXEC_TEST (body);
1199 body = COND_EXEC_CODE (body);
1202 /* Find all sets. */
1203 if (GET_CODE (body) == SET)
1205 sets[0].src = SET_SRC (body);
1206 sets[0].dest = SET_DEST (body);
1207 n_sets = 1;
1209 else if (GET_CODE (body) == PARALLEL)
1211 /* Look through the PARALLEL and record the values being
1212 set, if possible. Also handle any CLOBBERs. */
1213 for (i = XVECLEN (body, 0) - 1; i >= 0; --i)
1215 rtx x = XVECEXP (body, 0, i);
1217 if (GET_CODE (x) == SET)
1219 sets[n_sets].src = SET_SRC (x);
1220 sets[n_sets].dest = SET_DEST (x);
1221 n_sets++;
1226 /* Look up the values that are read. Do this before invalidating the
1227 locations that are written. */
1228 for (i = 0; i < n_sets; i++)
1230 rtx dest = sets[i].dest;
1232 /* A STRICT_LOW_PART can be ignored; we'll record the equivalence for
1233 the low part after invalidating any knowledge about larger modes. */
1234 if (GET_CODE (sets[i].dest) == STRICT_LOW_PART)
1235 sets[i].dest = dest = XEXP (dest, 0);
1237 /* We don't know how to record anything but REG or MEM. */
1238 if (GET_CODE (dest) == REG || GET_CODE (dest) == MEM)
1240 rtx src = sets[i].src;
1241 if (cond)
1242 src = gen_rtx_IF_THEN_ELSE (GET_MODE (src), cond, src, dest);
1243 sets[i].src_elt = cselib_lookup (sets[i].src, GET_MODE (dest), 1);
1244 if (GET_CODE (dest) == MEM)
1245 sets[i].dest_addr_elt = cselib_lookup (XEXP (dest, 0), Pmode, 1);
1246 else
1247 sets[i].dest_addr_elt = 0;
1251 /* Invalidate all locations written by this insn. Note that the elts we
1252 looked up in the previous loop aren't affected, just some of their
1253 locations may go away. */
1254 note_stores (body, cselib_invalidate_rtx, NULL);
1256 /* Now enter the equivalences in our tables. */
1257 for (i = 0; i < n_sets; i++)
1259 rtx dest = sets[i].dest;
1260 if (GET_CODE (dest) == REG || GET_CODE (dest) == MEM)
1261 cselib_record_set (dest, sets[i].src_elt, sets[i].dest_addr_elt);
1265 /* Record the effects of INSN. */
1267 void
1268 cselib_process_insn (insn)
1269 rtx insn;
1271 int i;
1272 rtx x;
1274 cselib_current_insn = insn;
1276 /* Forget everything at a CODE_LABEL, a volatile asm, or a setjmp. */
1277 if (GET_CODE (insn) == CODE_LABEL
1278 || (GET_CODE (insn) == CALL_INSN
1279 && find_reg_note (insn, REG_SETJMP, NULL))
1280 || (GET_CODE (insn) == INSN
1281 && GET_CODE (PATTERN (insn)) == ASM_OPERANDS
1282 && MEM_VOLATILE_P (PATTERN (insn))))
1284 clear_table (0);
1285 return;
1288 if (! INSN_P (insn))
1290 cselib_current_insn = 0;
1291 return;
1294 /* If this is a call instruction, forget anything stored in a
1295 call clobbered register, or, if this is not a const call, in
1296 memory. */
1297 if (GET_CODE (insn) == CALL_INSN)
1299 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1300 if (call_used_regs[i])
1301 cselib_invalidate_regno (i, VOIDmode);
1303 if (! CONST_OR_PURE_CALL_P (insn))
1304 cselib_invalidate_mem (callmem);
1307 cselib_record_sets (insn);
1309 #ifdef AUTO_INC_DEC
1310 /* Clobber any registers which appear in REG_INC notes. We
1311 could keep track of the changes to their values, but it is
1312 unlikely to help. */
1313 for (x = REG_NOTES (insn); x; x = XEXP (x, 1))
1314 if (REG_NOTE_KIND (x) == REG_INC)
1315 cselib_invalidate_rtx (XEXP (x, 0), NULL_RTX, NULL);
1316 #endif
1318 /* Look for any CLOBBERs in CALL_INSN_FUNCTION_USAGE, but only
1319 after we have processed the insn. */
1320 if (GET_CODE (insn) == CALL_INSN)
1321 for (x = CALL_INSN_FUNCTION_USAGE (insn); x; x = XEXP (x, 1))
1322 if (GET_CODE (XEXP (x, 0)) == CLOBBER)
1323 cselib_invalidate_rtx (XEXP (XEXP (x, 0), 0), NULL_RTX, NULL);
1325 cselib_current_insn = 0;
1327 if (n_useless_values > MAX_USELESS_VALUES)
1328 remove_useless_values ();
1331 /* Make sure our varrays are big enough. Not called from any cselib routines;
1332 it must be called by the user if it allocated new registers. */
1334 void
1335 cselib_update_varray_sizes ()
1337 unsigned int nregs = max_reg_num ();
1339 if (nregs == cselib_nregs)
1340 return;
1342 cselib_nregs = nregs;
1343 VARRAY_GROW (reg_values, nregs);
1344 VARRAY_GROW (used_regs, nregs);
1347 /* Initialize cselib for one pass. The caller must also call
1348 init_alias_analysis. */
1350 void
1351 cselib_init ()
1353 /* These are only created once. */
1354 if (! callmem)
1356 gcc_obstack_init (&cselib_obstack);
1357 cselib_startobj = obstack_alloc (&cselib_obstack, 0);
1359 callmem = gen_rtx_MEM (BLKmode, const0_rtx);
1360 ggc_add_rtx_root (&callmem, 1);
1363 cselib_nregs = max_reg_num ();
1364 VARRAY_ELT_LIST_INIT (reg_values, cselib_nregs, "reg_values");
1365 VARRAY_UINT_INIT (used_regs, cselib_nregs, "used_regs");
1366 hash_table = htab_create (31, get_value_hash, entry_and_rtx_equal_p, NULL);
1367 clear_table (1);
1370 /* Called when the current user is done with cselib. */
1372 void
1373 cselib_finish ()
1375 clear_table (0);
1376 VARRAY_FREE (reg_values);
1377 VARRAY_FREE (used_regs);
1378 htab_delete (hash_table);