/* Common subexpression elimination for GNU compiler.
   Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
   1999, 2000, 2001, 2002, 2003 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 2, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING.  If not, write to the Free
Software Foundation, 59 Temple Place - Suite 330, Boston, MA
02111-1307, USA.  */

#include "config.h"
/* stdio.h must precede rtl.h for FFS.  */
#include "system.h"
#include "coretypes.h"
#include "tm.h"

#include "rtl.h"
#include "tm_p.h"
#include "regs.h"
#include "hard-reg-set.h"
#include "basic-block.h"
#include "flags.h"
#include "real.h"
#include "insn-config.h"
#include "recog.h"
#include "function.h"
#include "expr.h"
#include "toplev.h"
#include "output.h"
#include "ggc.h"
#include "timevar.h"
#include "except.h"
#include "target.h"
#include "params.h"

/* The basic idea of common subexpression elimination is to go
   through the code, keeping a record of expressions that would
   have the same value at the current scan point, and replacing
   expressions encountered with the cheapest equivalent expression.

   It is too complicated to keep track of the different possibilities
   when control paths merge in this code; so, at each label, we forget all
   that is known and start fresh.  This can be described as processing each
   extended basic block separately.  We have a separate pass to perform
   global CSE.
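
   For example, given

	(set (reg 100) (plus (reg 98) (reg 99)))
	(set (reg 101) (plus (reg 98) (reg 99)))

   the second PLUS is found in the hash table as equivalent to (reg 100),
   so the second insn can be rewritten as

	(set (reg 101) (reg 100))

   (the register numbers here are purely illustrative).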

   Note CSE can turn a conditional or computed jump into a nop or
   an unconditional jump.  When this occurs we arrange to run the jump
   optimizer after CSE to delete the unreachable code.

   We use two data structures to record the equivalent expressions:
   a hash table for most expressions, and a vector of "quantity
   numbers" to record equivalent (pseudo) registers.

   The use of the special data structure for registers is desirable
   because it is faster.  It is possible because register references
   contain a fairly small number, the register number, taken from
   a contiguously allocated series, and two register references are
   identical if they have the same number.  General expressions
   do not have any such thing, so the only way to retrieve the
   information recorded on an expression other than a register
   is to keep it in a hash table.

   Registers and "quantity numbers":

   At the start of each basic block, all of the (hardware and pseudo)
   registers used in the function are given distinct quantity
   numbers to indicate their contents.  During scan, when the code
   copies one register into another, we copy the quantity number.
   When a register is loaded in any other way, we allocate a new
   quantity number to describe the value generated by this operation.
   `reg_qty' records what quantity a register is currently thought
   of as containing.

   All real quantity numbers are greater than or equal to `max_reg'.
   If register N has not been assigned a quantity, reg_qty[N] will equal N.

   Quantity numbers below `max_reg' do not exist and none of the `qty_table'
   entries should be referenced with an index below `max_reg'.
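
   To illustrate, suppose `max_reg' is 100 and (reg 42) is loaded from
   memory: a fresh quantity, say 100, is allocated and reg_qty[42] becomes
   100.  A later copy (set (reg 43) (reg 42)) simply sets reg_qty[43] to
   100 as well, recording that both registers hold the same value (the
   numbers are purely illustrative).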

   We also maintain a bidirectional chain of registers for each
   quantity number.  The `qty_table' members `first_reg' and `last_reg',
   and `reg_eqv_table' members `next' and `prev' hold these chains.

   The first register in a chain is the one whose lifespan is least local.
   Among equals, it is the one that was seen first.
   We replace any equivalent register with that one.

   If two registers have the same quantity number, REG expressions with
   the qty_table `mode' must be in the hash table for both registers and
   must be in the same class.

   The converse is not true.  Since hard registers may be referenced in
   any mode, two REG expressions might be equivalent in the hash table
   but not have the same quantity number if the quantity of one of the
   registers does not have the same mode as those expressions.

   Constants and quantity numbers

   When a quantity has a known constant value, that value is stored
   in the appropriate qty_table `const_rtx'.  This is in addition to
   putting the constant in the hash table as is usual for non-regs.

   Whether a reg or a constant is preferred is determined by the configuration
   macro CONST_COSTS and will often depend on the constant value.  In any
   event, expressions containing constants can be simplified, by fold_rtx.

   When a quantity has a known nearly constant value (such as an address
   of a stack slot), that value is stored in the appropriate qty_table
   `const_rtx'.

   Integer constants don't have a machine mode.  However, cse
   determines the intended machine mode from the destination
   of the instruction that moves the constant.  The machine mode
   is recorded in the hash table along with the actual RTL
   constant expression so that different modes are kept separate.
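
   For example, after

	(set (reg:SI 70) (const_int 4))

   the (const_int 4), which itself has VOIDmode, is entered in the hash
   table as if it had SImode, and the same constant moved into a DImode
   register would get a separate entry (a sketch of the bookkeeping, not
   an exhaustive description).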

   Other expressions:

   To record known equivalences among expressions in general
   we use a hash table called `table'.  It has a fixed number of buckets
   that contain chains of `struct table_elt' elements for expressions.
   These chains connect the elements whose expressions have the same
   hash codes.

   Other chains through the same elements connect the elements which
   currently have equivalent values.

   Register references in an expression are canonicalized before hashing
   the expression.  This is done using `reg_qty' and qty_table `first_reg'.
   The hash code of a register reference is computed using the quantity
   number, not the register number.

   When the value of an expression changes, it is necessary to remove from the
   hash table not just that expression but all expressions whose values
   could be different as a result.

     1. If the value changing is in memory, except in special cases
     ANYTHING referring to memory could be changed.  That is because
     nobody knows where a pointer does not point.
     The function `invalidate_memory' removes what is necessary.

     The special cases are when the address is constant or is
     a constant plus a fixed register such as the frame pointer
     or a static chain pointer.  When such addresses are stored in,
     we can tell exactly which other such addresses must be invalidated
     due to overlap.  `invalidate' does this.
     All expressions that refer to non-constant
     memory addresses are also invalidated.  `invalidate_memory' does this.

     2. If the value changing is a register, all expressions
     containing references to that register, and only those,
     must be removed.

   Because searching the entire hash table for expressions that contain
   a register is very slow, we try to figure out when it isn't necessary.
   Precisely, this is necessary only when expressions have been
   entered in the hash table using this register, and then the value has
   changed, and then another expression wants to be added to refer to
   the register's new value.  This sequence of circumstances is rare
   within any one basic block.

   The vectors `reg_tick' and `reg_in_table' are used to detect this case.
   reg_tick[i] is incremented whenever a value is stored in register i.
   reg_in_table[i] holds -1 if no references to register i have been
   entered in the table; otherwise, it contains the value reg_tick[i] had
   when the references were entered.  If we want to enter a reference
   and reg_in_table[i] != reg_tick[i], we must scan and remove old references.
   Until we want to enter a new entry, the mere fact that the two vectors
   don't match makes the entries be ignored if anyone tries to match them.
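
   As a small illustration: if (plus (reg 65) (const_int 8)) is entered
   while reg_tick[65] == 2, then reg_in_table[65] becomes 2.  A later
   store into (reg 65) bumps reg_tick[65] to 3, and the stale entry is
   simply never matched; only when a new expression mentioning (reg 65)
   is about to be entered do we scan and remove the old references
   (again, the numbers are only illustrative).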

   Registers themselves are entered in the hash table as well as in
   the equivalent-register chains.  However, the vectors `reg_tick'
   and `reg_in_table' do not apply to expressions which are simple
   register references.  These expressions are removed from the table
   immediately when they become invalid, and this can be done even if
   we do not immediately search for all the expressions that refer to
   the register.

   A CLOBBER rtx in an instruction invalidates its operand for further
   reuse.  A CLOBBER or SET rtx whose operand is a MEM:BLK
   invalidates everything that resides in memory.

   Related expressions:

   Constant expressions that differ only by an additive integer
   are called related.  When a constant expression is put in
   the table, the related expression with no constant term
   is also entered.  These are made to point at each other
   so that it is possible to find out if there exists any
   register equivalent to an expression related to a given expression.  */
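
/* For instance, entering (const (plus (symbol_ref "x") (const_int 4)))
   also enters (symbol_ref "x"), and the two are linked through their
   `related_value' fields.  If some register is later known to hold
   (symbol_ref "x"), an access to the related constant can be rewritten
   as that register plus 4.  (A hypothetical example; see the
   `related_value' handling in `insert' and `use_related_value'.)  */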

/* One plus largest register number used in this function.  */

static int max_reg;

/* One plus largest instruction UID used in this function at time of
   cse_main call.  */

static int max_insn_uid;

/* Length of qty_table vector.  We know in advance we will not need
   a quantity number this big.  */

static int max_qty;

/* Next quantity number to be allocated.
   This is 1 + the largest number needed so far.  */

static int next_qty;

/* Per-qty information tracking.

   `first_reg' and `last_reg' track the head and tail of the
   chain of registers which currently contain this quantity.

   `mode' contains the machine mode of this quantity.

   `const_rtx' holds the rtx of the constant value of this
   quantity, if known.  A sum of the frame/arg pointer
   and a constant can also be entered here.  When this holds
   a known value, `const_insn' is the insn which stored the
   constant value.

   `comparison_{code,const,qty}' are used to track when a
   comparison between a quantity and some constant or register has
   been passed.  In such a case, we know the results of the comparison
   in case we see it again.  These members record a comparison that
   is known to be true.  `comparison_code' holds the rtx code of such
   a comparison, else it is set to UNKNOWN and the other two
   comparison members are undefined.  `comparison_const' holds
   the constant being compared against, or zero if the comparison
   is not against a constant.  `comparison_qty' holds the quantity
   being compared against when the result is known.  If the comparison
   is not with a register, `comparison_qty' is -1.  */

struct qty_table_elem
{
  rtx const_rtx;
  rtx const_insn;
  rtx comparison_const;
  int comparison_qty;
  unsigned int first_reg, last_reg;
  /* The sizes of these fields should match the sizes of the
     code and mode fields of struct rtx_def (see rtl.h).  */
  ENUM_BITFIELD(rtx_code) comparison_code : 16;
  ENUM_BITFIELD(machine_mode) mode : 8;
};

/* The table of all qtys, indexed by qty number.  */
static struct qty_table_elem *qty_table;

#ifdef HAVE_cc0
/* For machines that have a CC0, we do not record its value in the hash
   table since its use is guaranteed to be the insn immediately following
   its definition and any other insn is presumed to invalidate it.

   Instead, we store below the value last assigned to CC0.  If it should
   happen to be a constant, it is stored in preference to the actual
   assigned value.  In case it is a constant, we store the mode in which
   the constant should be interpreted.  */

static rtx prev_insn_cc0;
static enum machine_mode prev_insn_cc0_mode;

/* Previous actual insn.  0 if at first insn of basic block.  */

static rtx prev_insn;
#endif

/* Insn being scanned.  */

static rtx this_insn;

/* Index by register number, gives the number of the next (or
   previous) register in the chain of registers sharing the same
   value.

   Or -1 if this register is at the end of the chain.

   If reg_qty[N] == N, reg_eqv_table[N].next is undefined.  */

/* Per-register equivalence chain.  */
struct reg_eqv_elem
{
  int next, prev;
};

/* The table of all register equivalence chains.  */
static struct reg_eqv_elem *reg_eqv_table;

struct cse_reg_info
{
  /* Next in hash chain.  */
  struct cse_reg_info *hash_next;

  /* The next cse_reg_info structure in the free or used list.  */
  struct cse_reg_info *next;

  /* Search key */
  unsigned int regno;

  /* The quantity number of the register's current contents.  */
  int reg_qty;

  /* The number of times the register has been altered in the current
     basic block.  */
  int reg_tick;

  /* The REG_TICK value at which rtx's containing this register are
     valid in the hash table.  If this does not equal the current
     reg_tick value, such expressions existing in the hash table are
     invalid.  */
  int reg_in_table;

  /* The SUBREG that was set when REG_TICK was last incremented.  Set
     to -1 if the last store was to the whole register, not a subreg.  */
  unsigned int subreg_ticked;
};

/* A free list of cse_reg_info entries.  */
static struct cse_reg_info *cse_reg_info_free_list;

/* A used list of cse_reg_info entries.  */
static struct cse_reg_info *cse_reg_info_used_list;
static struct cse_reg_info *cse_reg_info_used_list_end;

/* A mapping from registers to cse_reg_info data structures.  */
#define REGHASH_SHIFT 7
#define REGHASH_SIZE (1 << REGHASH_SHIFT)
#define REGHASH_MASK (REGHASH_SIZE - 1)
static struct cse_reg_info *reg_hash[REGHASH_SIZE];

#define REGHASH_FN(REGNO) \
	(((REGNO) ^ ((REGNO) >> REGHASH_SHIFT)) & REGHASH_MASK)

/* The last lookup we did into the cse_reg_info_tree.  This allows us
   to cache repeated lookups.  */
static unsigned int cached_regno;
static struct cse_reg_info *cached_cse_reg_info;

/* A HARD_REG_SET containing all the hard registers for which there is
   currently a REG expression in the hash table.  Note the difference
   from the above variables, which indicate if the REG is mentioned in some
   expression in the table.  */

static HARD_REG_SET hard_regs_in_table;

/* CUID of insn that starts the basic block currently being cse-processed.  */

static int cse_basic_block_start;

/* CUID of insn that ends the basic block currently being cse-processed.  */

static int cse_basic_block_end;

/* Vector mapping INSN_UIDs to cuids.
   The cuids are like uids but always increase monotonically.
   We use them to see whether a reg is used outside a given basic block.  */

static int *uid_cuid;

/* Highest UID in UID_CUID.  */
static int max_uid;

/* Get the cuid of an insn.  */

#define INSN_CUID(INSN) (uid_cuid[INSN_UID (INSN)])

/* Nonzero if this pass has made changes, and therefore it's
   worthwhile to run the garbage collector.  */

static int cse_altered;

/* Nonzero if cse has altered conditional jump insns
   in such a way that jump optimization should be redone.  */

static int cse_jumps_altered;

/* Nonzero if we have put a LABEL_REF into the hash table for an INSN
   without a REG_LABEL; in that case we have to rerun jump after CSE
   to put in the note.  */
static int recorded_label_ref;

/* canon_hash stores 1 in do_not_record
   if it notices a reference to CC0, PC, or some other volatile
   subexpression.  */

static int do_not_record;

#ifdef LOAD_EXTEND_OP

/* Scratch rtl used when looking for load-extended copy of a MEM.  */
static rtx memory_extend_rtx;
#endif

/* canon_hash stores 1 in hash_arg_in_memory
   if it notices a reference to memory within the expression being hashed.  */

static int hash_arg_in_memory;

/* The hash table contains buckets which are chains of `struct table_elt's,
   each recording one expression's information.
   That expression is in the `exp' field.

   The canon_exp field contains a canonical (from the point of view of
   alias analysis) version of the `exp' field.

   Those elements with the same hash code are chained in both directions
   through the `next_same_hash' and `prev_same_hash' fields.

   The elements of each set of expressions with equivalent values
   are on a two-way chain through the `next_same_value'
   and `prev_same_value' fields, and all point with
   the `first_same_value' field at the first element in
   that chain.  The chain is in order of increasing cost.
   Each element's cost value is in its `cost' field.

   The `in_memory' field is nonzero for elements that
   involve any reference to memory.  These elements are removed
   whenever a write is done to an unidentified location in memory.
   To be safe, we assume that a memory address is unidentified unless
   the address is either a symbol constant or a constant plus
   the frame pointer or argument pointer.

   The `related_value' field is used to connect related expressions
   (that differ by adding an integer).
   The related expressions are chained in a circular fashion.
   `related_value' is zero for expressions for which this
   chain is not useful.

   The `cost' field stores the cost of this element's expression.
   The `regcost' field stores the value returned by approx_reg_cost for
   this element's expression.

   The `is_const' flag is set if the element is a constant (including
   a fixed address).

   The `flag' field is used as a temporary during some search routines.

   The `mode' field is usually the same as GET_MODE (`exp'), but
   if `exp' is a CONST_INT and has no machine mode then the `mode'
   field is the mode it was being used as.  Each constant is
   recorded separately for each mode it is used with.  */

struct table_elt
{
  rtx exp;
  rtx canon_exp;
  struct table_elt *next_same_hash;
  struct table_elt *prev_same_hash;
  struct table_elt *next_same_value;
  struct table_elt *prev_same_value;
  struct table_elt *first_same_value;
  struct table_elt *related_value;
  int cost;
  int regcost;
  /* The size of this field should match the size
     of the mode field of struct rtx_def (see rtl.h).  */
  ENUM_BITFIELD(machine_mode) mode : 8;
  char in_memory;
  char is_const;
  char flag;
};

/* We don't want a lot of buckets, because we rarely have very many
   things stored in the hash table, and a lot of buckets slows
   down a lot of loops that happen frequently.  */
#define HASH_SHIFT 5
#define HASH_SIZE (1 << HASH_SHIFT)
#define HASH_MASK (HASH_SIZE - 1)

/* Compute hash code of X in mode M.  Special-case the case where X is a
   pseudo register (hard registers may require `do_not_record' to be set).  */

#define HASH(X, M) \
 ((GET_CODE (X) == REG && REGNO (X) >= FIRST_PSEUDO_REGISTER \
   ? (((unsigned) REG << 7) + (unsigned) REG_QTY (REGNO (X))) \
   : canon_hash (X, M)) & HASH_MASK)
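
/* For a pseudo register, the hash is thus derived from the register's
   current quantity number rather than its register number, so two pseudos
   that currently share a quantity hash identically.  A sketch of the
   common case:

	HASH ((reg:SI 65), SImode)
	  == (((unsigned) REG << 7) + REG_QTY (65)) & HASH_MASK

   Hard registers and non-REG expressions instead go through `canon_hash',
   which may set `do_not_record'.  */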

/* Determine whether register number N is considered a fixed register for the
   purpose of approximating register costs.
   It is desirable to replace other regs with fixed regs, to reduce need for
   non-fixed hard regs.
   A reg wins if it is either the frame pointer or designated as fixed.  */
#define FIXED_REGNO_P(N)  \
  ((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
   || fixed_regs[N] || global_regs[N])

/* Compute cost of X, as stored in the `cost' field of a table_elt.  Fixed
   hard registers and pointers into the frame are the cheapest with a cost
   of 0.  Next come pseudos with a cost of one and other hard registers with
   a cost of 2.  Aside from these special cases, call `rtx_cost'.  */

#define CHEAP_REGNO(N) \
  ((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
   || (N) == STACK_POINTER_REGNUM || (N) == ARG_POINTER_REGNUM \
   || ((N) >= FIRST_VIRTUAL_REGISTER && (N) <= LAST_VIRTUAL_REGISTER) \
   || ((N) < FIRST_PSEUDO_REGISTER \
       && FIXED_REGNO_P (N) && REGNO_REG_CLASS (N) != NO_REGS))

#define COST(X) (GET_CODE (X) == REG ? 0 : notreg_cost (X, SET))
#define COST_IN(X,OUTER) (GET_CODE (X) == REG ? 0 : notreg_cost (X, OUTER))

/* Get the info associated with register N.  */

#define GET_CSE_REG_INFO(N) \
  (((N) == cached_regno && cached_cse_reg_info) \
   ? cached_cse_reg_info : get_cse_reg_info ((N)))

/* Get the number of times this register has been updated in this
   basic block.  */

#define REG_TICK(N) ((GET_CSE_REG_INFO (N))->reg_tick)

/* Get the point at which REG was recorded in the table.  */

#define REG_IN_TABLE(N) ((GET_CSE_REG_INFO (N))->reg_in_table)

/* Get the SUBREG set at the last increment to REG_TICK (-1 if not a
   SUBREG).  */

#define SUBREG_TICKED(N) ((GET_CSE_REG_INFO (N))->subreg_ticked)

/* Get the quantity number for REG.  */

#define REG_QTY(N) ((GET_CSE_REG_INFO (N))->reg_qty)

/* Determine if the quantity number for register X represents a valid index
   into the qty_table.  */

#define REGNO_QTY_VALID_P(N) (REG_QTY (N) != (int) (N))
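
/* For example, a freshly seen pseudo starts with REG_QTY (N) == N, so
   REGNO_QTY_VALID_P (N) is false until `make_new_qty' or `make_regs_eqv'
   assigns it a real quantity (which is always >= max_reg).  */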

static struct table_elt *table[HASH_SIZE];

/* Chain of `struct table_elt's made so far for this function
   but currently removed from the table.  */

static struct table_elt *free_element_chain;

/* Number of `struct table_elt' structures made so far for this function.  */

static int n_elements_made;

/* Maximum value `n_elements_made' has had so far in this compilation
   for functions previously processed.  */

static int max_elements_made;

/* Surviving equivalence class when two equivalence classes are merged
   by recording the effects of a jump in the last insn.  Zero if the
   last insn was not a conditional jump.  */

static struct table_elt *last_jump_equiv_class;

/* Set to the cost of a constant pool reference if one was found for a
   symbolic constant.  If this was found, it means we should try to
   convert constants into constant pool entries if they don't fit in
   the insn.  */

static int constant_pool_entries_cost;

/* This data describes a block that will be processed by cse_basic_block.  */

struct cse_basic_block_data
{
  /* Lowest CUID value of insns in block.  */
  int low_cuid;
  /* Highest CUID value of insns in block.  */
  int high_cuid;
  /* Total number of SETs in block.  */
  int nsets;
  /* Last insn in the block.  */
  rtx last;
  /* Size of current branch path, if any.  */
  int path_size;
  /* Current branch path, indicating which branches will be taken.  */
  struct branch_path
    {
      /* The branch insn.  */
      rtx branch;
      /* Whether it should be taken or not.  AROUND is the same as taken
	 except that it is used when the destination label is not preceded
	 by a BARRIER.  */
      enum taken {TAKEN, NOT_TAKEN, AROUND} status;
    } *path;
};

static bool fixed_base_plus_p (rtx x);
static int notreg_cost (rtx, enum rtx_code);
static int approx_reg_cost_1 (rtx *, void *);
static int approx_reg_cost (rtx);
static int preferrable (int, int, int, int);
static void new_basic_block (void);
static void make_new_qty (unsigned int, enum machine_mode);
static void make_regs_eqv (unsigned int, unsigned int);
static void delete_reg_equiv (unsigned int);
static int mention_regs (rtx);
static int insert_regs (rtx, struct table_elt *, int);
static void remove_from_table (struct table_elt *, unsigned);
static struct table_elt *lookup (rtx, unsigned, enum machine_mode);
static struct table_elt *lookup_for_remove (rtx, unsigned, enum machine_mode);
static rtx lookup_as_function (rtx, enum rtx_code);
static struct table_elt *insert (rtx, struct table_elt *, unsigned,
				 enum machine_mode);
static void merge_equiv_classes (struct table_elt *, struct table_elt *);
static void invalidate (rtx, enum machine_mode);
static int cse_rtx_varies_p (rtx, int);
static void remove_invalid_refs (unsigned int);
static void remove_invalid_subreg_refs (unsigned int, unsigned int,
					enum machine_mode);
static void rehash_using_reg (rtx);
static void invalidate_memory (void);
static void invalidate_for_call (void);
static rtx use_related_value (rtx, struct table_elt *);
static unsigned canon_hash (rtx, enum machine_mode);
static unsigned canon_hash_string (const char *);
static unsigned safe_hash (rtx, enum machine_mode);
static int exp_equiv_p (rtx, rtx, int, int);
static rtx canon_reg (rtx, rtx);
static void find_best_addr (rtx, rtx *, enum machine_mode);
static enum rtx_code find_comparison_args (enum rtx_code, rtx *, rtx *,
					   enum machine_mode *,
					   enum machine_mode *);
static rtx fold_rtx (rtx, rtx);
static rtx equiv_constant (rtx);
static void record_jump_equiv (rtx, int);
static void record_jump_cond (enum rtx_code, enum machine_mode, rtx, rtx,
			      int);
static void cse_insn (rtx, rtx);
static int addr_affects_sp_p (rtx);
static void invalidate_from_clobbers (rtx);
static rtx cse_process_notes (rtx, rtx);
static void cse_around_loop (rtx);
static void invalidate_skipped_set (rtx, rtx, void *);
static void invalidate_skipped_block (rtx);
static void cse_check_loop_start (rtx, rtx, void *);
static void cse_set_around_loop (rtx, rtx, rtx);
static rtx cse_basic_block (rtx, rtx, struct branch_path *, int);
static void count_reg_usage (rtx, int *, rtx, int);
static int check_for_label_ref (rtx *, void *);
extern void dump_class (struct table_elt*);
static struct cse_reg_info * get_cse_reg_info (unsigned int);
static int check_dependence (rtx *, void *);

static void flush_hash_table (void);
static bool insn_live_p (rtx, int *);
static bool set_live_p (rtx, rtx, int *);
static bool dead_libcall_p (rtx, int *);

/* Nonzero if X has the form (PLUS frame-pointer integer).  We check for
   virtual regs here because the simplify_*_operation routines are called
   by integrate.c, which is called before virtual register instantiation.  */

static bool
fixed_base_plus_p (rtx x)
{
  switch (GET_CODE (x))
    {
    case REG:
      if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx)
	return true;
      if (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])
	return true;
      if (REGNO (x) >= FIRST_VIRTUAL_REGISTER
	  && REGNO (x) <= LAST_VIRTUAL_REGISTER)
	return true;
      return false;

    case PLUS:
      if (GET_CODE (XEXP (x, 1)) != CONST_INT)
	return false;
      return fixed_base_plus_p (XEXP (x, 0));

    case ADDRESSOF:
      return true;

    default:
      return false;
    }
}

/* Dump the expressions in the equivalence class indicated by CLASSP.
   This function is used only for debugging.  */
void
dump_class (struct table_elt *classp)
{
  struct table_elt *elt;

  fprintf (stderr, "Equivalence chain for ");
  print_rtl (stderr, classp->exp);
  fprintf (stderr, ": \n");

  for (elt = classp->first_same_value; elt; elt = elt->next_same_value)
    {
      print_rtl (stderr, elt->exp);
      fprintf (stderr, "\n");
    }
}

/* Subroutine of approx_reg_cost; called through for_each_rtx.  */

static int
approx_reg_cost_1 (rtx *xp, void *data)
{
  rtx x = *xp;
  int *cost_p = data;

  if (x && GET_CODE (x) == REG)
    {
      unsigned int regno = REGNO (x);

      if (! CHEAP_REGNO (regno))
	{
	  if (regno < FIRST_PSEUDO_REGISTER)
	    {
	      if (SMALL_REGISTER_CLASSES)
		return 1;
	      *cost_p += 2;
	    }
	  else
	    *cost_p += 1;
	}
    }

  return 0;
}

/* Return an estimate of the cost of the registers used in an rtx.
   This is mostly the number of different REG expressions in the rtx;
   however for some exceptions like fixed registers we use a cost of
   0.  If any other hard register reference occurs, return MAX_COST.  */

static int
approx_reg_cost (rtx x)
{
  int cost = 0;

  if (for_each_rtx (&x, approx_reg_cost_1, (void *) &cost))
    return MAX_COST;

  return cost;
}

/* Return a negative value if an rtx A, whose costs are given by COST_A
   and REGCOST_A, is more desirable than an rtx B.
   Return a positive value if A is less desirable, or 0 if the two are
   equally good.  */
static int
preferrable (int cost_a, int regcost_a, int cost_b, int regcost_b)
{
  /* First, get rid of cases involving expressions that are entirely
     unwanted.  */
  if (cost_a != cost_b)
    {
      if (cost_a == MAX_COST)
	return 1;
      if (cost_b == MAX_COST)
	return -1;
    }

  /* Avoid extending lifetimes of hardregs.  */
  if (regcost_a != regcost_b)
    {
      if (regcost_a == MAX_COST)
	return 1;
      if (regcost_b == MAX_COST)
	return -1;
    }

  /* Normal operation costs take precedence.  */
  if (cost_a != cost_b)
    return cost_a - cost_b;
  /* Only if these are identical consider effects on register pressure.  */
  if (regcost_a != regcost_b)
    return regcost_a - regcost_b;
  return 0;
}
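
/* For instance, preferrable (MAX_COST, 0, 2, 5) is positive (A is entirely
   unwanted), while preferrable (2, 5, 2, 3) falls through to the register
   pressure comparison and is positive as well, so B would be preferred in
   both cases (illustrative values only).  */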

/* Internal function, to compute cost when X is not a register; called
   from COST macro to keep it simple.  */

static int
notreg_cost (rtx x, enum rtx_code outer)
{
  return ((GET_CODE (x) == SUBREG
	   && GET_CODE (SUBREG_REG (x)) == REG
	   && GET_MODE_CLASS (GET_MODE (x)) == MODE_INT
	   && GET_MODE_CLASS (GET_MODE (SUBREG_REG (x))) == MODE_INT
	   && (GET_MODE_SIZE (GET_MODE (x))
	       < GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
	   && subreg_lowpart_p (x)
	   && TRULY_NOOP_TRUNCATION (GET_MODE_BITSIZE (GET_MODE (x)),
				     GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x)))))
	  ? 0
	  : rtx_cost (x, outer) * 2);
}

/* Return an estimate of the cost of computing rtx X.
   One use is in cse, to decide which expression to keep in the hash table.
   Another is in rtl generation, to pick the cheapest way to multiply.
   Other uses like the latter are expected in the future.  */

int
rtx_cost (rtx x, enum rtx_code outer_code ATTRIBUTE_UNUSED)
{
  int i, j;
  enum rtx_code code;
  const char *fmt;
  int total;

  if (x == 0)
    return 0;

  /* Compute the default costs of certain things.
     Note that targetm.rtx_costs can override the defaults.  */

  code = GET_CODE (x);
  switch (code)
    {
    case MULT:
      total = COSTS_N_INSNS (5);
      break;
    case DIV:
    case UDIV:
    case MOD:
    case UMOD:
      total = COSTS_N_INSNS (7);
      break;
    case USE:
      /* Used in loop.c and combine.c as a marker.  */
      total = 0;
      break;
    default:
      total = COSTS_N_INSNS (1);
    }

  switch (code)
    {
    case REG:
      return 0;

    case SUBREG:
      /* If we can't tie these modes, make this expensive.  The larger
	 the mode, the more expensive it is.  */
      if (! MODES_TIEABLE_P (GET_MODE (x), GET_MODE (SUBREG_REG (x))))
	return COSTS_N_INSNS (2
			      + GET_MODE_SIZE (GET_MODE (x)) / UNITS_PER_WORD);
      break;

    default:
      if ((*targetm.rtx_costs) (x, code, outer_code, &total))
	return total;
      break;
    }

  /* Sum the costs of the sub-rtx's, plus cost of this operation,
     which is already in total.  */

  fmt = GET_RTX_FORMAT (code);
  for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
    if (fmt[i] == 'e')
      total += rtx_cost (XEXP (x, i), code);
    else if (fmt[i] == 'E')
      for (j = 0; j < XVECLEN (x, i); j++)
	total += rtx_cost (XVECEXP (x, i, j), code);

  return total;
}
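
/* As an example of the recursion, rtx_cost ((plus:SI (reg:SI 65)
   (const_int 4)), SET) starts from the default COSTS_N_INSNS (1) for the
   PLUS and adds the costs of the two operands, unless the target's
   rtx_costs hook supplies a cost of its own (a sketch; the actual numbers
   are entirely target-dependent).  */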

/* Return cost of address expression X.
   Expect that X is a properly formed address reference.  */

int
address_cost (rtx x, enum machine_mode mode)
{
  /* The address_cost target hook does not deal with ADDRESSOF nodes.  But,
     during CSE, such nodes are present.  Using an ADDRESSOF node which
     refers to the address of a REG is a good thing because we can then
     turn (MEM (ADDRESSOF (REG))) into just plain REG.  */

  if (GET_CODE (x) == ADDRESSOF && REG_P (XEXP ((x), 0)))
    return -1;

  /* We may be asked for cost of various unusual addresses, such as operands
     of push instruction.  It is not worthwhile to complicate writing
     of the target hook by such cases.  */

  if (!memory_address_p (mode, x))
    return 1000;

  return (*targetm.address_cost) (x);
}

/* If the target doesn't override, compute the cost as with arithmetic.  */

int
default_address_cost (rtx x)
{
  return rtx_cost (x, MEM);
}

static struct cse_reg_info *
get_cse_reg_info (unsigned int regno)
{
  struct cse_reg_info **hash_head = &reg_hash[REGHASH_FN (regno)];
  struct cse_reg_info *p;

  for (p = *hash_head; p != NULL; p = p->hash_next)
    if (p->regno == regno)
      break;

  if (p == NULL)
    {
      /* Get a new cse_reg_info structure.  */
      if (cse_reg_info_free_list)
	{
	  p = cse_reg_info_free_list;
	  cse_reg_info_free_list = p->next;
	}
      else
	p = (struct cse_reg_info *) xmalloc (sizeof (struct cse_reg_info));

      /* Insert into hash table.  */
      p->hash_next = *hash_head;
      *hash_head = p;

      /* Initialize it.  */
      p->reg_tick = 1;
      p->reg_in_table = -1;
      p->subreg_ticked = -1;
      p->reg_qty = regno;
      p->regno = regno;
      p->next = cse_reg_info_used_list;
      cse_reg_info_used_list = p;
      if (!cse_reg_info_used_list_end)
	cse_reg_info_used_list_end = p;
    }

  /* Cache this lookup; we tend to be looking up information about the
     same register several times in a row.  */
  cached_regno = regno;
  cached_cse_reg_info = p;

  return p;
}

/* Clear the hash table and initialize each register with its own quantity,
   for a new basic block.  */

static void
new_basic_block (void)
{
  int i;

  next_qty = max_reg;

  /* Clear out hash table state for this pass.  */

  memset ((char *) reg_hash, 0, sizeof reg_hash);

  if (cse_reg_info_used_list)
    {
      cse_reg_info_used_list_end->next = cse_reg_info_free_list;
      cse_reg_info_free_list = cse_reg_info_used_list;
      cse_reg_info_used_list = cse_reg_info_used_list_end = 0;
    }
  cached_cse_reg_info = 0;

  CLEAR_HARD_REG_SET (hard_regs_in_table);

  /* The per-quantity values used to be initialized here, but it is
     much faster to initialize each as it is made in `make_new_qty'.  */

  for (i = 0; i < HASH_SIZE; i++)
    {
      struct table_elt *first;

      first = table[i];
      if (first != NULL)
	{
	  struct table_elt *last = first;

	  table[i] = NULL;

	  while (last->next_same_hash != NULL)
	    last = last->next_same_hash;

	  /* Now relink this entire hash chain into
	     the free element list.  */
	  last->next_same_hash = free_element_chain;
	  free_element_chain = first;
	}
    }

#ifdef HAVE_cc0
  prev_insn = 0;
  prev_insn_cc0 = 0;
#endif
}

/* Say that register REG contains a quantity in mode MODE not in any
   register before and initialize that quantity.  */

static void
make_new_qty (unsigned int reg, enum machine_mode mode)
{
  int q;
  struct qty_table_elem *ent;
  struct reg_eqv_elem *eqv;

  if (next_qty >= max_qty)
    abort ();

  q = REG_QTY (reg) = next_qty++;
  ent = &qty_table[q];
  ent->first_reg = reg;
  ent->last_reg = reg;
  ent->mode = mode;
  ent->const_rtx = ent->const_insn = NULL_RTX;
  ent->comparison_code = UNKNOWN;

  eqv = &reg_eqv_table[reg];
  eqv->next = eqv->prev = -1;
}

/* Make reg NEW equivalent to reg OLD.
   OLD is not changing; NEW is.  */

static void
make_regs_eqv (unsigned int new, unsigned int old)
{
  unsigned int lastr, firstr;
  int q = REG_QTY (old);
  struct qty_table_elem *ent;

  ent = &qty_table[q];

  /* Nothing should become eqv until it has a "non-invalid" qty number.  */
  if (! REGNO_QTY_VALID_P (old))
    abort ();

  REG_QTY (new) = q;
  firstr = ent->first_reg;
  lastr = ent->last_reg;

  /* Prefer fixed hard registers to anything.  Prefer pseudo regs to other
     hard regs.  Among pseudos, if NEW will live longer than any other reg
     of the same qty, and that is beyond the current basic block,
     make it the new canonical replacement for this qty.  */
  if (! (firstr < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (firstr))
      /* Certain fixed registers might be of the class NO_REGS.  This means
	 that not only can they not be allocated by the compiler, but
	 they cannot be used in substitutions or canonicalizations
	 either.  */
      && (new >= FIRST_PSEUDO_REGISTER || REGNO_REG_CLASS (new) != NO_REGS)
      && ((new < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (new))
	  || (new >= FIRST_PSEUDO_REGISTER
	      && (firstr < FIRST_PSEUDO_REGISTER
		  || ((uid_cuid[REGNO_LAST_UID (new)] > cse_basic_block_end
		       || (uid_cuid[REGNO_FIRST_UID (new)]
			   < cse_basic_block_start))
		      && (uid_cuid[REGNO_LAST_UID (new)]
			  > uid_cuid[REGNO_LAST_UID (firstr)]))))))
    {
      reg_eqv_table[firstr].prev = new;
      reg_eqv_table[new].next = firstr;
      reg_eqv_table[new].prev = -1;
      ent->first_reg = new;
    }
  else
    {
      /* If NEW is a hard reg (known to be non-fixed), insert at end.
	 Otherwise, insert before any non-fixed hard regs that are at the
	 end.  Registers of class NO_REGS cannot be used as an
	 equivalent for anything.  */
      while (lastr < FIRST_PSEUDO_REGISTER && reg_eqv_table[lastr].prev >= 0
	     && (REGNO_REG_CLASS (lastr) == NO_REGS || ! FIXED_REGNO_P (lastr))
	     && new >= FIRST_PSEUDO_REGISTER)
	lastr = reg_eqv_table[lastr].prev;
      reg_eqv_table[new].next = reg_eqv_table[lastr].next;
      if (reg_eqv_table[lastr].next >= 0)
	reg_eqv_table[reg_eqv_table[lastr].next].prev = new;
      else
	qty_table[q].last_reg = new;
      reg_eqv_table[lastr].next = new;
      reg_eqv_table[new].prev = lastr;
    }
}
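
/* So, for a quantity whose chain currently holds just the pseudo 66,
   making the fixed frame pointer equivalent to it would link the chain as

	first_reg -> frame pointer <-> (reg 66) <- last_reg

   since fixed hard registers are preferred as the canonical element
   (an illustrative layout, not produced by any particular insn).  */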

/* Remove REG from its equivalence class.  */

static void
delete_reg_equiv (unsigned int reg)
{
  struct qty_table_elem *ent;
  int q = REG_QTY (reg);
  int p, n;

  /* If invalid, do nothing.  */
  if (q == (int) reg)
    return;

  ent = &qty_table[q];

  p = reg_eqv_table[reg].prev;
  n = reg_eqv_table[reg].next;

  if (n != -1)
    reg_eqv_table[n].prev = p;
  else
    ent->last_reg = p;
  if (p != -1)
    reg_eqv_table[p].next = n;
  else
    ent->first_reg = n;

  REG_QTY (reg) = reg;
}

/* Remove any invalid expressions from the hash table
   that refer to any of the registers contained in expression X.

   Make sure that newly inserted references to those registers
   as subexpressions will be considered valid.

   mention_regs is not called when a register itself
   is being stored in the table.

   Return 1 if we have done something that may have changed the hash code
   of X.  */

static int
mention_regs (rtx x)
{
  enum rtx_code code;
  int i, j;
  const char *fmt;
  int changed = 0;

  if (x == 0)
    return 0;

  code = GET_CODE (x);
  if (code == REG)
    {
      unsigned int regno = REGNO (x);
      unsigned int endregno
	= regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
		   : HARD_REGNO_NREGS (regno, GET_MODE (x)));
      unsigned int i;

      for (i = regno; i < endregno; i++)
	{
	  if (REG_IN_TABLE (i) >= 0 && REG_IN_TABLE (i) != REG_TICK (i))
	    remove_invalid_refs (i);

	  REG_IN_TABLE (i) = REG_TICK (i);
	  SUBREG_TICKED (i) = -1;
	}

      return 0;
    }

  /* If this is a SUBREG, we don't want to discard other SUBREGs of the same
     pseudo if they don't use overlapping words.  We handle only pseudos
     here for simplicity.  */
  if (code == SUBREG && GET_CODE (SUBREG_REG (x)) == REG
      && REGNO (SUBREG_REG (x)) >= FIRST_PSEUDO_REGISTER)
    {
      unsigned int i = REGNO (SUBREG_REG (x));

      if (REG_IN_TABLE (i) >= 0 && REG_IN_TABLE (i) != REG_TICK (i))
	{
	  /* If REG_IN_TABLE (i) differs from REG_TICK (i) by one, and
	     the last store to this register really stored into this
	     subreg, then remove the memory of this subreg.
	     Otherwise, remove any memory of the entire register and
	     all its subregs from the table.  */
	  if (REG_TICK (i) - REG_IN_TABLE (i) > 1
	      || SUBREG_TICKED (i) != REGNO (SUBREG_REG (x)))
	    remove_invalid_refs (i);
	  else
	    remove_invalid_subreg_refs (i, SUBREG_BYTE (x), GET_MODE (x));
	}

      REG_IN_TABLE (i) = REG_TICK (i);
      SUBREG_TICKED (i) = REGNO (SUBREG_REG (x));
      return 0;
    }

  /* If X is a comparison or a COMPARE and either operand is a register
     that does not have a quantity, give it one.  This is so that a later
     call to record_jump_equiv won't cause X to be assigned a different
     hash code and not found in the table after that call.

     It is not necessary to do this here, since rehash_using_reg can
     fix up the table later, but doing this here eliminates the need to
     call that expensive function in the most common case where the only
     use of the register is in the comparison.  */

  if (code == COMPARE || GET_RTX_CLASS (code) == '<')
    {
      if (GET_CODE (XEXP (x, 0)) == REG
	  && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 0))))
	if (insert_regs (XEXP (x, 0), NULL, 0))
	  {
	    rehash_using_reg (XEXP (x, 0));
	    changed = 1;
	  }

      if (GET_CODE (XEXP (x, 1)) == REG
	  && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 1))))
	if (insert_regs (XEXP (x, 1), NULL, 0))
	  {
	    rehash_using_reg (XEXP (x, 1));
	    changed = 1;
	  }
    }

  fmt = GET_RTX_FORMAT (code);
  for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
    if (fmt[i] == 'e')
      changed |= mention_regs (XEXP (x, i));
    else if (fmt[i] == 'E')
      for (j = 0; j < XVECLEN (x, i); j++)
	changed |= mention_regs (XVECEXP (x, i, j));

  return changed;
}

/* Update the register quantities for inserting X into the hash table
   with a value equivalent to CLASSP.
   (If the class does not contain a REG, it is irrelevant.)
   If MODIFIED is nonzero, X is a destination; it is being modified.
   Note that delete_reg_equiv should be called on a register
   before insert_regs is done on that register with MODIFIED != 0.

   Nonzero value means that elements of reg_qty have changed
   so X's hash code may be different.  */

static int
insert_regs (rtx x, struct table_elt *classp, int modified)
{
  if (GET_CODE (x) == REG)
    {
      unsigned int regno = REGNO (x);
      int qty_valid;

      /* If REGNO is in the equivalence table already but is of the
	 wrong mode for that equivalence, don't do anything here.  */

      qty_valid = REGNO_QTY_VALID_P (regno);
      if (qty_valid)
	{
	  struct qty_table_elem *ent = &qty_table[REG_QTY (regno)];

	  if (ent->mode != GET_MODE (x))
	    return 0;
	}

      if (modified || ! qty_valid)
	{
	  if (classp)
	    for (classp = classp->first_same_value;
		 classp != 0;
		 classp = classp->next_same_value)
	      if (GET_CODE (classp->exp) == REG
		  && GET_MODE (classp->exp) == GET_MODE (x))
		{
		  make_regs_eqv (regno, REGNO (classp->exp));
		  return 1;
		}

	  /* Mention_regs for a SUBREG checks if REG_TICK is exactly one larger
	     than REG_IN_TABLE to find out if there was only a single preceding
	     invalidation - for the SUBREG - or another one, which would be
	     for the full register.  However, if we find here that REG_TICK
	     indicates that the register is invalid, it means that it has
	     been invalidated in a separate operation.  The SUBREG might be used
	     now (then this is a recursive call), or we might use the full REG
	     now and a SUBREG of it later.  So bump up REG_TICK so that
	     mention_regs will do the right thing.  */
	  if (! modified
	      && REG_IN_TABLE (regno) >= 0
	      && REG_TICK (regno) == REG_IN_TABLE (regno) + 1)
	    REG_TICK (regno)++;
	  make_new_qty (regno, GET_MODE (x));
	  return 1;
	}

      return 0;
    }

  /* If X is a SUBREG, we will likely be inserting the inner register in the
     table.  If that register doesn't have an assigned quantity number at
     this point but does later, the insertion that we will be doing now will
     not be accessible because its hash code will have changed.  So assign
     a quantity number now.  */

  else if (GET_CODE (x) == SUBREG && GET_CODE (SUBREG_REG (x)) == REG
	   && ! REGNO_QTY_VALID_P (REGNO (SUBREG_REG (x))))
    {
      insert_regs (SUBREG_REG (x), NULL, 0);
      mention_regs (x);
      return 1;
    }
  else
    return mention_regs (x);
}

/* Look in or update the hash table.  */

/* Remove table element ELT from use in the table.
   HASH is its hash code, made using the HASH macro.
   It's an argument because often that is known in advance
   and we save much time not recomputing it.  */

static void
remove_from_table (struct table_elt *elt, unsigned int hash)
{
  if (elt == 0)
    return;

  /* Mark this element as removed.  See cse_insn.  */
  elt->first_same_value = 0;

  /* Remove the table element from its equivalence class.  */

  {
    struct table_elt *prev = elt->prev_same_value;
    struct table_elt *next = elt->next_same_value;

    if (next)
      next->prev_same_value = prev;

    if (prev)
      prev->next_same_value = next;
    else
      {
	struct table_elt *newfirst = next;
	while (next)
	  {
	    next->first_same_value = newfirst;
	    next = next->next_same_value;
	  }
      }
  }

  /* Remove the table element from its hash bucket.  */

  {
    struct table_elt *prev = elt->prev_same_hash;
    struct table_elt *next = elt->next_same_hash;

    if (next)
      next->prev_same_hash = prev;

    if (prev)
      prev->next_same_hash = next;
    else if (table[hash] == elt)
      table[hash] = next;
    else
      {
	/* This entry is not in the proper hash bucket.  This can happen
	   when two classes were merged by `merge_equiv_classes'.  Search
	   for the hash bucket that it heads.  This happens only very
	   rarely, so the cost is acceptable.  */
	for (hash = 0; hash < HASH_SIZE; hash++)
	  if (table[hash] == elt)
	    table[hash] = next;
      }
  }

  /* Remove the table element from its related-value circular chain.  */

  if (elt->related_value != 0 && elt->related_value != elt)
    {
      struct table_elt *p = elt->related_value;

      while (p->related_value != elt)
	p = p->related_value;
      p->related_value = elt->related_value;
      if (p->related_value == p)
	p->related_value = 0;
    }

  /* Now add it to the free element chain.  */
  elt->next_same_hash = free_element_chain;
  free_element_chain = elt;
}

/* Look up X in the hash table and return its table element,
   or 0 if X is not in the table.

   MODE is the machine-mode of X, or if X is an integer constant
   with VOIDmode then MODE is the mode with which X will be used.

   Here we are satisfied to find an expression whose tree structure
   looks like X.  */

static struct table_elt *
lookup (rtx x, unsigned int hash, enum machine_mode mode)
{
  struct table_elt *p;

  for (p = table[hash]; p; p = p->next_same_hash)
    if (mode == p->mode && ((x == p->exp && GET_CODE (x) == REG)
			    || exp_equiv_p (x, p->exp, GET_CODE (x) != REG, 0)))
      return p;

  return 0;
}

/* Like `lookup' but don't care whether the table element uses invalid regs.
   Also ignore discrepancies in the machine mode of a register.  */

static struct table_elt *
lookup_for_remove (rtx x, unsigned int hash, enum machine_mode mode)
{
  struct table_elt *p;

  if (GET_CODE (x) == REG)
    {
      unsigned int regno = REGNO (x);

      /* Don't check the machine mode when comparing registers;
	 invalidating (REG:SI 0) also invalidates (REG:DF 0).  */
      for (p = table[hash]; p; p = p->next_same_hash)
	if (GET_CODE (p->exp) == REG
	    && REGNO (p->exp) == regno)
	  return p;
    }
  else
    {
      for (p = table[hash]; p; p = p->next_same_hash)
	if (mode == p->mode && (x == p->exp || exp_equiv_p (x, p->exp, 0, 0)))
	  return p;
    }

  return 0;
}

/* Look for an expression equivalent to X and with code CODE.
   If one is found, return that expression.  */

static rtx
lookup_as_function (rtx x, enum rtx_code code)
{
  struct table_elt *p
    = lookup (x, safe_hash (x, VOIDmode) & HASH_MASK, GET_MODE (x));

  /* If we are looking for a CONST_INT, the mode doesn't really matter, as
     long as we are narrowing.  So if we looked in vain for a mode narrower
     than word_mode before, look for word_mode now.  */
  if (p == 0 && code == CONST_INT
      && GET_MODE_SIZE (GET_MODE (x)) < GET_MODE_SIZE (word_mode))
    {
      x = copy_rtx (x);
      PUT_MODE (x, word_mode);
      p = lookup (x, safe_hash (x, VOIDmode) & HASH_MASK, word_mode);
    }

  if (p == 0)
    return 0;

  for (p = p->first_same_value; p; p = p->next_same_value)
    if (GET_CODE (p->exp) == code
	/* Make sure this is a valid entry in the table.  */
	&& exp_equiv_p (p->exp, p->exp, 1, 0))
      return p->exp;

  return 0;
}

/* Insert X in the hash table, assuming HASH is its hash code
   and CLASSP is an element of the class it should go in
   (or 0 if a new class should be made).
   It is inserted at the proper position to keep the class in
   the order cheapest first.

   MODE is the machine-mode of X, or if X is an integer constant
   with VOIDmode then MODE is the mode with which X will be used.

   For elements of equal cheapness, the most recent one
   goes in front, except that the first element in the list
   remains first unless a cheaper element is added.  The order of
   pseudo-registers does not matter, as canon_reg will be called to
   find the cheapest when a register is retrieved from the table.

   The in_memory field in the hash table element is set to 0.
   The caller must set it nonzero if appropriate.

   You should call insert_regs (X, CLASSP, MODIFY) before calling here,
   and if insert_regs returns a nonzero value
   you must then recompute its hash code before calling here.

   If necessary, update table showing constant values of quantities.  */

#define CHEAPER(X, Y) \
 (preferrable ((X)->cost, (X)->regcost, (Y)->cost, (Y)->regcost) < 0)

static struct table_elt *
insert (rtx x, struct table_elt *classp, unsigned int hash, enum machine_mode mode)
{
  struct table_elt *elt;

  /* If X is a register and we haven't made a quantity for it,
     something is wrong.  */
  if (GET_CODE (x) == REG && ! REGNO_QTY_VALID_P (REGNO (x)))
    abort ();

  /* If X is a hard register, show it is being put in the table.  */
  if (GET_CODE (x) == REG && REGNO (x) < FIRST_PSEUDO_REGISTER)
    {
      unsigned int regno = REGNO (x);
      unsigned int endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
      unsigned int i;

      for (i = regno; i < endregno; i++)
	SET_HARD_REG_BIT (hard_regs_in_table, i);
    }

  /* Put an element for X into the right hash bucket.  */

  elt = free_element_chain;
  if (elt)
    free_element_chain = elt->next_same_hash;
  else
    {
      n_elements_made++;
      elt = (struct table_elt *) xmalloc (sizeof (struct table_elt));
    }

  elt->exp = x;
  elt->canon_exp = NULL_RTX;
  elt->cost = COST (x);
  elt->regcost = approx_reg_cost (x);
  elt->next_same_value = 0;
  elt->prev_same_value = 0;
  elt->next_same_hash = table[hash];
  elt->prev_same_hash = 0;
  elt->related_value = 0;
  elt->in_memory = 0;
  elt->mode = mode;
  elt->is_const = (CONSTANT_P (x)
		   /* GNU C++ takes advantage of this for `this'
		      (and other const values).  */
		   || (GET_CODE (x) == REG
		       && RTX_UNCHANGING_P (x)
		       && REGNO (x) >= FIRST_PSEUDO_REGISTER)
		   || fixed_base_plus_p (x));

  if (table[hash])
    table[hash]->prev_same_hash = elt;
  table[hash] = elt;

  /* Put it into the proper value-class.  */
  if (classp)
    {
      classp = classp->first_same_value;
      if (CHEAPER (elt, classp))
	/* Insert at the head of the class.  */
	{
	  struct table_elt *p;
	  elt->next_same_value = classp;
	  classp->prev_same_value = elt;
	  elt->first_same_value = elt;

	  for (p = classp; p; p = p->next_same_value)
	    p->first_same_value = elt;
	}
      else
	{
	  /* Insert not at head of the class.  */
	  /* Put it after the last element cheaper than X.  */
	  struct table_elt *p, *next;

	  for (p = classp; (next = p->next_same_value) && CHEAPER (next, elt);
	       p = next);

	  /* Put it after P and before NEXT.  */
	  elt->next_same_value = next;
	  if (next)
	    next->prev_same_value = elt;

	  elt->prev_same_value = p;
	  p->next_same_value = elt;
	  elt->first_same_value = classp;
	}
    }
  else
    elt->first_same_value = elt;

  /* If this is a constant being set equivalent to a register or a register
     being set equivalent to a constant, note the constant equivalence.

     If this is a constant, it cannot be equivalent to a different constant,
     and a constant is the only thing that can be cheaper than a register.  So
     we know the register is the head of the class (before the constant was
     inserted).

     If this is a register that is not already known equivalent to a
     constant, we must check the entire class.

     If this is a register that is already known equivalent to a constant,
     update the qtys `const_insn' to show that `this_insn' is the latest
     insn making that quantity equivalent to the constant.  */

  if (elt->is_const && classp && GET_CODE (classp->exp) == REG
      && GET_CODE (x) != REG)
    {
      int exp_q = REG_QTY (REGNO (classp->exp));
      struct qty_table_elem *exp_ent = &qty_table[exp_q];

      exp_ent->const_rtx = gen_lowpart_if_possible (exp_ent->mode, x);
      exp_ent->const_insn = this_insn;
    }

  else if (GET_CODE (x) == REG
	   && classp
	   && ! qty_table[REG_QTY (REGNO (x))].const_rtx
	   && ! elt->is_const)
    {
      struct table_elt *p;

      for (p = classp; p != 0; p = p->next_same_value)
	{
	  if (p->is_const && GET_CODE (p->exp) != REG)
	    {
	      int x_q = REG_QTY (REGNO (x));
	      struct qty_table_elem *x_ent = &qty_table[x_q];

	      x_ent->const_rtx
		= gen_lowpart_if_possible (GET_MODE (x), p->exp);
	      x_ent->const_insn = this_insn;
	      break;
	    }
	}
    }

  else if (GET_CODE (x) == REG
	   && qty_table[REG_QTY (REGNO (x))].const_rtx
	   && GET_MODE (x) == qty_table[REG_QTY (REGNO (x))].mode)
    qty_table[REG_QTY (REGNO (x))].const_insn = this_insn;

  /* If this is a constant with symbolic value,
     and it has a term with an explicit integer value,
     link it up with related expressions.  */
  if (GET_CODE (x) == CONST)
    {
      rtx subexp = get_related_value (x);
      unsigned subhash;
      struct table_elt *subelt, *subelt_prev;

      if (subexp != 0)
	{
	  /* Get the integer-free subexpression in the hash table.  */
	  subhash = safe_hash (subexp, mode) & HASH_MASK;
	  subelt = lookup (subexp, subhash, mode);
	  if (subelt == 0)
	    subelt = insert (subexp, NULL, subhash, mode);
	  /* Initialize SUBELT's circular chain if it has none.  */
	  if (subelt->related_value == 0)
	    subelt->related_value = subelt;
	  /* Find the element in the circular chain that precedes SUBELT.  */
	  subelt_prev = subelt;
	  while (subelt_prev->related_value != subelt)
	    subelt_prev = subelt_prev->related_value;
	  /* Put new ELT into SUBELT's circular chain just before SUBELT.
	     This way the element that follows SUBELT is the oldest one.  */
	  elt->related_value = subelt_prev->related_value;
	  subelt_prev->related_value = elt;
	}
    }

  return elt;
}

/* Given two equivalence classes, CLASS1 and CLASS2, put all the entries from
   CLASS2 into CLASS1.  This is done when we have reached an insn which makes
   the two classes equivalent.

   CLASS1 will be the surviving class; CLASS2 should not be used after this
   call.

   Any invalid entries in CLASS2 will not be copied.  */

static void
merge_equiv_classes (struct table_elt *class1, struct table_elt *class2)
{
  struct table_elt *elt, *next, *new;

  /* Ensure we start with the head of the classes.  */
  class1 = class1->first_same_value;
  class2 = class2->first_same_value;

  /* If they were already equal, forget it.  */
  if (class1 == class2)
    return;

  for (elt = class2; elt; elt = next)
    {
      unsigned int hash;
      rtx exp = elt->exp;
      enum machine_mode mode = elt->mode;

      next = elt->next_same_value;

      /* Remove old entry, make a new one in CLASS1's class.
	 Don't do this for invalid entries as we cannot find their
	 hash code (it also isn't necessary).  */
      if (GET_CODE (exp) == REG || exp_equiv_p (exp, exp, 1, 0))
	{
	  hash_arg_in_memory = 0;
	  hash = HASH (exp, mode);

	  if (GET_CODE (exp) == REG)
	    delete_reg_equiv (REGNO (exp));

	  remove_from_table (elt, hash);

	  if (insert_regs (exp, class1, 0))
	    {
	      rehash_using_reg (exp);
	      hash = HASH (exp, mode);
	    }
	  new = insert (exp, class1, hash, mode);
	  new->in_memory = hash_arg_in_memory;
	}
    }
}

/* Flush the entire hash table.  */

static void
flush_hash_table (void)
{
  int i;
  struct table_elt *p;

  for (i = 0; i < HASH_SIZE; i++)
    for (p = table[i]; p; p = table[i])
      {
	/* Note that invalidate can remove elements
	   after P in the current hash chain.  */
	if (GET_CODE (p->exp) == REG)
	  invalidate (p->exp, p->mode);
	else
	  remove_from_table (p, i);
      }
}
1765 /* Function called for each rtx to check whether a true dependence exists. */
1766 struct check_dependence_data
1768 enum machine_mode mode;
1769 rtx exp;
1772 static int
1773 check_dependence (rtx *x, void *data)
1775 struct check_dependence_data *d = (struct check_dependence_data *) data;
1776 if (*x && GET_CODE (*x) == MEM)
1777 return true_dependence (d->exp, d->mode, *x, cse_rtx_varies_p);
1778 else
1779 return 0;
1782 /* Remove from the hash table, or mark as invalid, all expressions whose
1783 values could be altered by storing in X. X is a register, a subreg, or
1784 a memory reference with nonvarying address (because, when a memory
1785 reference with a varying address is stored in, all memory references are
1786 removed by invalidate_memory so specific invalidation is superfluous).
1787 FULL_MODE, if not VOIDmode, indicates that this much should be
1788 invalidated instead of just the amount indicated by the mode of X. This
1789 is only used for bitfield stores into memory.
1791 A nonvarying address may be just a register or just a symbol reference,
1792 or it may be either of those plus a numeric offset. */
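/* Schematic examples of nonvarying addresses (register number and
   symbol invented):

     (reg 65)
     (symbol_ref "table")
     (plus (reg 65) (const_int 12))
     (plus (symbol_ref "table") (const_int 12))  */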
1794 static void
1795 invalidate (rtx x, enum machine_mode full_mode)
1797 int i;
1798 struct table_elt *p;
1800 switch (GET_CODE (x))
1802 case REG:
1804 /* If X is a register, dependencies on its contents are recorded
1805 through the qty number mechanism. Just change the qty number of
1806 the register, mark it as invalid for expressions that refer to it,
1807 and remove it itself. */
1808 unsigned int regno = REGNO (x);
1809 unsigned int hash = HASH (x, GET_MODE (x));
1811 /* Remove REGNO from any quantity list it might be on and indicate
1812 that its value might have changed. If it is a pseudo, remove its
1813 entry from the hash table.
1815 For a hard register, we do the first two actions above for any
1816 additional hard registers corresponding to X. Then, if any of these
1817 registers are in the table, we must remove any REG entries that
1818 overlap these registers. */
1820 delete_reg_equiv (regno);
1821 REG_TICK (regno)++;
1822 SUBREG_TICKED (regno) = -1;
1824 if (regno >= FIRST_PSEUDO_REGISTER)
1826 /* Because a register can be referenced in more than one mode,
1827 we might have to remove more than one table entry. */
1828 struct table_elt *elt;
1830 while ((elt = lookup_for_remove (x, hash, GET_MODE (x))))
1831 remove_from_table (elt, hash);
1833 else
1835 HOST_WIDE_INT in_table
1836 = TEST_HARD_REG_BIT (hard_regs_in_table, regno);
1837 unsigned int endregno
1838 = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
1839 unsigned int tregno, tendregno, rn;
1840 struct table_elt *p, *next;
1842 CLEAR_HARD_REG_BIT (hard_regs_in_table, regno);
1844 for (rn = regno + 1; rn < endregno; rn++)
1846 in_table |= TEST_HARD_REG_BIT (hard_regs_in_table, rn);
1847 CLEAR_HARD_REG_BIT (hard_regs_in_table, rn);
1848 delete_reg_equiv (rn);
1849 REG_TICK (rn)++;
1850 SUBREG_TICKED (rn) = -1;
1853 if (in_table)
1854 for (hash = 0; hash < HASH_SIZE; hash++)
1855 for (p = table[hash]; p; p = next)
1857 next = p->next_same_hash;
1859 if (GET_CODE (p->exp) != REG
1860 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
1861 continue;
1863 tregno = REGNO (p->exp);
1864 tendregno
1865 = tregno + HARD_REGNO_NREGS (tregno, GET_MODE (p->exp));
1866 if (tendregno > regno && tregno < endregno)
1867 remove_from_table (p, hash);
1871 return;
1873 case SUBREG:
1874 invalidate (SUBREG_REG (x), VOIDmode);
1875 return;
1877 case PARALLEL:
1878 for (i = XVECLEN (x, 0) - 1; i >= 0; --i)
1879 invalidate (XVECEXP (x, 0, i), VOIDmode);
1880 return;
1882 case EXPR_LIST:
1883 /* This is part of a disjoint return value; extract the location in
1884 question ignoring the offset. */
1885 invalidate (XEXP (x, 0), VOIDmode);
1886 return;
1888 case MEM:
1889 /* Calculate the canonical version of X here so that
1890 true_dependence doesn't generate new RTL for X on each call. */
1891 x = canon_rtx (x);
1893 /* Remove all hash table elements that refer to overlapping pieces of
1894 memory. */
1895 if (full_mode == VOIDmode)
1896 full_mode = GET_MODE (x);
1898 for (i = 0; i < HASH_SIZE; i++)
1900 struct table_elt *next;
1902 for (p = table[i]; p; p = next)
1904 next = p->next_same_hash;
1905 if (p->in_memory)
1907 struct check_dependence_data d;
1909 /* Just canonicalize the expression once;
1910 otherwise each time we call invalidate
1911 true_dependence will canonicalize the
1912 expression again. */
1913 if (!p->canon_exp)
1914 p->canon_exp = canon_rtx (p->exp);
1915 d.exp = x;
1916 d.mode = full_mode;
1917 if (for_each_rtx (&p->canon_exp, check_dependence, &d))
1918 remove_from_table (p, i);
1922 return;
1924 default:
1925 abort ();
1929 /* Remove all expressions that refer to register REGNO,
1930 since they are already invalid, and we are about to
1931 mark that register valid again and don't want the old
1932 expressions to reappear as valid. */
1934 static void
1935 remove_invalid_refs (unsigned int regno)
1937 unsigned int i;
1938 struct table_elt *p, *next;
1940 for (i = 0; i < HASH_SIZE; i++)
1941 for (p = table[i]; p; p = next)
1943 next = p->next_same_hash;
1944 if (GET_CODE (p->exp) != REG
1945 && refers_to_regno_p (regno, regno + 1, p->exp, (rtx *) 0))
1946 remove_from_table (p, i);
1950 /* Likewise for a subreg with subreg_reg REGNO, subreg_byte OFFSET,
1951 and mode MODE. */
1952 static void
1953 remove_invalid_subreg_refs (unsigned int regno, unsigned int offset,
1954 enum machine_mode mode)
1956 unsigned int i;
1957 struct table_elt *p, *next;
1958 unsigned int end = offset + (GET_MODE_SIZE (mode) - 1);
1960 for (i = 0; i < HASH_SIZE; i++)
1961 for (p = table[i]; p; p = next)
1963 rtx exp = p->exp;
1964 next = p->next_same_hash;
1966 if (GET_CODE (exp) != REG
1967 && (GET_CODE (exp) != SUBREG
1968 || GET_CODE (SUBREG_REG (exp)) != REG
1969 || REGNO (SUBREG_REG (exp)) != regno
1970 || (((SUBREG_BYTE (exp)
1971 + (GET_MODE_SIZE (GET_MODE (exp)) - 1)) >= offset)
1972 && SUBREG_BYTE (exp) <= end))
1973 && refers_to_regno_p (regno, regno + 1, p->exp, (rtx *) 0))
1974 remove_from_table (p, i);
1978 /* Recompute the hash codes of any valid entries in the hash table that
1979 reference X, if X is a register, or SUBREG_REG (X) if X is a SUBREG.
1981 This is called when we make a jump equivalence. */
1983 static void
1984 rehash_using_reg (rtx x)
1986 unsigned int i;
1987 struct table_elt *p, *next;
1988 unsigned hash;
1990 if (GET_CODE (x) == SUBREG)
1991 x = SUBREG_REG (x);
1993 /* If X is not a register or if the register is known not to be in any
1994 valid entries in the table, we have no work to do. */
1996 if (GET_CODE (x) != REG
1997 || REG_IN_TABLE (REGNO (x)) < 0
1998 || REG_IN_TABLE (REGNO (x)) != REG_TICK (REGNO (x)))
1999 return;
2001 /* Scan all hash chains looking for valid entries that mention X.
2002 If we find one and it is in the wrong hash chain, move it. We can skip
2003 objects that are registers, since they are handled specially. */
2005 for (i = 0; i < HASH_SIZE; i++)
2006 for (p = table[i]; p; p = next)
2008 next = p->next_same_hash;
2009 if (GET_CODE (p->exp) != REG && reg_mentioned_p (x, p->exp)
2010 && exp_equiv_p (p->exp, p->exp, 1, 0)
2011 && i != (hash = safe_hash (p->exp, p->mode) & HASH_MASK))
2013 if (p->next_same_hash)
2014 p->next_same_hash->prev_same_hash = p->prev_same_hash;
2016 if (p->prev_same_hash)
2017 p->prev_same_hash->next_same_hash = p->next_same_hash;
2018 else
2019 table[i] = p->next_same_hash;
2021 p->next_same_hash = table[hash];
2022 p->prev_same_hash = 0;
2023 if (table[hash])
2024 table[hash]->prev_same_hash = p;
2025 table[hash] = p;
2030 /* Remove from the hash table any expression that is a call-clobbered
2031 register. Also update their TICK values. */
2033 static void
2034 invalidate_for_call (void)
2036 unsigned int regno, endregno;
2037 unsigned int i;
2038 unsigned hash;
2039 struct table_elt *p, *next;
2040 int in_table = 0;
2042 /* Go through all the hard registers. For each that is clobbered in
2043 a CALL_INSN, remove the register from quantity chains and update
2044 reg_tick if defined. Also see if any of these registers is currently
2045 in the table. */
2047 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
2048 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, regno))
2050 delete_reg_equiv (regno);
2051 if (REG_TICK (regno) >= 0)
2053 REG_TICK (regno)++;
2054 SUBREG_TICKED (regno) = -1;
2057 in_table |= (TEST_HARD_REG_BIT (hard_regs_in_table, regno) != 0);
2060 /* In the case where we have no call-clobbered hard registers in the
2061 table, we are done. Otherwise, scan the table and remove any
2062 entry that overlaps a call-clobbered register. */
2064 if (in_table)
2065 for (hash = 0; hash < HASH_SIZE; hash++)
2066 for (p = table[hash]; p; p = next)
2068 next = p->next_same_hash;
2070 if (GET_CODE (p->exp) != REG
2071 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
2072 continue;
2074 regno = REGNO (p->exp);
2075 endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (p->exp));
2077 for (i = regno; i < endregno; i++)
2078 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i))
2080 remove_from_table (p, hash);
2081 break;
2086 /* Given an expression X of type CONST,
2087 and ELT which is its table entry (or 0 if it
2088 is not in the hash table),
2089 return an alternate expression for X as a register plus integer.
2090 If none can be found, return 0. */
2092 static rtx
2093 use_related_value (rtx x, struct table_elt *elt)
2095 struct table_elt *relt = 0;
2096 struct table_elt *p, *q;
2097 HOST_WIDE_INT offset;
2099 /* First, is there anything related known?
2100 If we have a table element, we can tell from that.
2101 Otherwise, we must look it up. */
2103 if (elt != 0 && elt->related_value != 0)
2104 relt = elt;
2105 else if (elt == 0 && GET_CODE (x) == CONST)
2107 rtx subexp = get_related_value (x);
2108 if (subexp != 0)
2109 relt = lookup (subexp,
2110 safe_hash (subexp, GET_MODE (subexp)) & HASH_MASK,
2111 GET_MODE (subexp));
2114 if (relt == 0)
2115 return 0;
2117 /* Search all related table entries for one that has an
2118 equivalent register. */
2120 p = relt;
2121 while (1)
2123 /* This loop is strange in that it is executed in two different cases.
2124 The first is when X is already in the table. Then it is searching
2125 the RELATED_VALUE list of X's class (RELT). The second case is when
2126 X is not in the table. Then RELT points to a class for the related
2127 value.
2129 Ensure that, whatever case we are in, we ignore classes that have
2130 the same value as X. */
2132 if (rtx_equal_p (x, p->exp))
2133 q = 0;
2134 else
2135 for (q = p->first_same_value; q; q = q->next_same_value)
2136 if (GET_CODE (q->exp) == REG)
2137 break;
2139 if (q)
2140 break;
2142 p = p->related_value;
2144 /* We went all the way around, so there is nothing to be found.
2145 Alternatively, perhaps RELT was in the table for some other reason
2146 and it has no related values recorded. */
2147 if (p == relt || p == 0)
2148 break;
2151 if (q == 0)
2152 return 0;
2154 offset = (get_integer_term (x) - get_integer_term (p->exp));
2155 /* Note: OFFSET may be 0 if P->exp and X are related by commutativity. */
2156 return plus_constant (q->exp, offset);
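/* A hypothetical use: if X is
   (const (plus (symbol_ref "base") (const_int 8))) and the table
   records that (symbol_ref "base") is in (reg 65), the value returned
   is (plus (reg 65) (const_int 8)), often a cheaper address.  */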
2159 /* Hash a string. Just add its bytes up. */
2160 static inline unsigned
2161 canon_hash_string (const char *ps)
2163 unsigned hash = 0;
2164 const unsigned char *p = (const unsigned char *) ps;
2166 if (p)
2167 while (*p)
2168 hash += *p++;
2170 return hash;
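/* E.g. canon_hash_string ("ap") is 'a' + 'p' = 97 + 112 = 209.  A weak
   hash, but cheap; collisions only cost a longer chain walk.  */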
2173 /* Hash an rtx. We are careful to make sure the value is never negative.
2174 Equivalent registers hash identically.
2175 MODE is used in hashing for CONST_INTs only;
2176 otherwise the mode of X is used.
2178 Store 1 in do_not_record if any subexpression is volatile.
2180 Store 1 in hash_arg_in_memory if X contains a MEM rtx
2181 which does not have the RTX_UNCHANGING_P bit set.
2183 Note that cse_insn knows that the hash code of a MEM expression
2184 is just (int) MEM plus the hash code of the address. */
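/* Schematically, ignoring the final masking done by the HASH macro,
   a MEM of a register (register number invented) hashes as

     canon_hash ((mem (reg 65)), mode)
       == (unsigned) MEM + ((unsigned) REG << 7) + REG_QTY (65)

   so MEMs of equivalent registers fall into the same bucket.  */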
2186 static unsigned
2187 canon_hash (rtx x, enum machine_mode mode)
2189 int i, j;
2190 unsigned hash = 0;
2191 enum rtx_code code;
2192 const char *fmt;
2194 /* repeat is used to turn tail-recursion into iteration. */
2195 repeat:
2196 if (x == 0)
2197 return hash;
2199 code = GET_CODE (x);
2200 switch (code)
2202 case REG:
2204 unsigned int regno = REGNO (x);
2205 bool record;
2207 /* On some machines, we can't record any non-fixed hard register,
2208 because extending its life will cause reload problems. We
2209 consider ap, fp, sp, gp to be fixed for this purpose.
2211 We also consider CCmode registers to be fixed for this purpose;
2212 failure to do so leads to failure to simplify 0<100 type of
2213 conditionals.
2215 On all machines, we can't record any global registers.
2216 Nor should we record any register that is in a small
2217 class, as defined by CLASS_LIKELY_SPILLED_P. */
2219 if (regno >= FIRST_PSEUDO_REGISTER)
2220 record = true;
2221 else if (x == frame_pointer_rtx
2222 || x == hard_frame_pointer_rtx
2223 || x == arg_pointer_rtx
2224 || x == stack_pointer_rtx
2225 || x == pic_offset_table_rtx)
2226 record = true;
2227 else if (global_regs[regno])
2228 record = false;
2229 else if (fixed_regs[regno])
2230 record = true;
2231 else if (GET_MODE_CLASS (GET_MODE (x)) == MODE_CC)
2232 record = true;
2233 else if (SMALL_REGISTER_CLASSES)
2234 record = false;
2235 else if (CLASS_LIKELY_SPILLED_P (REGNO_REG_CLASS (regno)))
2236 record = false;
2237 else
2238 record = true;
2240 if (!record)
2242 do_not_record = 1;
2243 return 0;
2246 hash += ((unsigned) REG << 7) + (unsigned) REG_QTY (regno);
2247 return hash;
2250 /* We handle SUBREG of a REG specially because the underlying
2251 reg changes its hash value with every value change; we don't
2252 want to have to forget unrelated subregs when one subreg changes. */
2253 case SUBREG:
2255 if (GET_CODE (SUBREG_REG (x)) == REG)
2257 hash += (((unsigned) SUBREG << 7)
2258 + REGNO (SUBREG_REG (x))
2259 + (SUBREG_BYTE (x) / UNITS_PER_WORD));
2260 return hash;
2262 break;
2265 case CONST_INT:
2267 unsigned HOST_WIDE_INT tem = INTVAL (x);
2268 hash += ((unsigned) CONST_INT << 7) + (unsigned) mode + tem;
2269 return hash;
2272 case CONST_DOUBLE:
2273 /* This is like the general case, except that it only counts
2274 the integers representing the constant. */
2275 hash += (unsigned) code + (unsigned) GET_MODE (x);
2276 if (GET_MODE (x) != VOIDmode)
2277 hash += real_hash (CONST_DOUBLE_REAL_VALUE (x));
2278 else
2279 hash += ((unsigned) CONST_DOUBLE_LOW (x)
2280 + (unsigned) CONST_DOUBLE_HIGH (x));
2281 return hash;
2283 case CONST_VECTOR:
2285 int units;
2286 rtx elt;
2288 units = CONST_VECTOR_NUNITS (x);
2290 for (i = 0; i < units; ++i)
2292 elt = CONST_VECTOR_ELT (x, i);
2293 hash += canon_hash (elt, GET_MODE (elt));
2296 return hash;
2299 /* Assume there is only one rtx object for any given label. */
2300 case LABEL_REF:
2301 hash += ((unsigned) LABEL_REF << 7) + (unsigned long) XEXP (x, 0);
2302 return hash;
2304 case SYMBOL_REF:
2305 hash += ((unsigned) SYMBOL_REF << 7) + (unsigned long) XSTR (x, 0);
2306 return hash;
2308 case MEM:
2309 /* We don't record if marked volatile or if BLKmode since we don't
2310 know the size of the move. */
2311 if (MEM_VOLATILE_P (x) || GET_MODE (x) == BLKmode)
2313 do_not_record = 1;
2314 return 0;
2316 if (! RTX_UNCHANGING_P (x) || fixed_base_plus_p (XEXP (x, 0)))
2317 hash_arg_in_memory = 1;
2319 /* Now that we have already found this special case,
2320 might as well speed it up as much as possible. */
2321 hash += (unsigned) MEM;
2322 x = XEXP (x, 0);
2323 goto repeat;
2325 case USE:
2326 /* A USE that mentions non-volatile memory needs special
2327 handling since the MEM may be BLKmode which normally
2328 prevents an entry from being made. Pure calls are
2329 marked by a USE which mentions BLKmode memory. */
2330 if (GET_CODE (XEXP (x, 0)) == MEM
2331 && ! MEM_VOLATILE_P (XEXP (x, 0)))
2333 hash += (unsigned) USE;
2334 x = XEXP (x, 0);
2336 if (! RTX_UNCHANGING_P (x) || fixed_base_plus_p (XEXP (x, 0)))
2337 hash_arg_in_memory = 1;
2339 /* Now that we have already found this special case,
2340 might as well speed it up as much as possible. */
2341 hash += (unsigned) MEM;
2342 x = XEXP (x, 0);
2343 goto repeat;
2345 break;
2347 case PRE_DEC:
2348 case PRE_INC:
2349 case POST_DEC:
2350 case POST_INC:
2351 case PRE_MODIFY:
2352 case POST_MODIFY:
2353 case PC:
2354 case CC0:
2355 case CALL:
2356 case UNSPEC_VOLATILE:
2357 do_not_record = 1;
2358 return 0;
2360 case ASM_OPERANDS:
2361 if (MEM_VOLATILE_P (x))
2363 do_not_record = 1;
2364 return 0;
2366 else
2368 /* We don't want to take the filename and line into account. */
2369 hash += (unsigned) code + (unsigned) GET_MODE (x)
2370 + canon_hash_string (ASM_OPERANDS_TEMPLATE (x))
2371 + canon_hash_string (ASM_OPERANDS_OUTPUT_CONSTRAINT (x))
2372 + (unsigned) ASM_OPERANDS_OUTPUT_IDX (x);
2374 if (ASM_OPERANDS_INPUT_LENGTH (x))
2376 for (i = 1; i < ASM_OPERANDS_INPUT_LENGTH (x); i++)
2378 hash += (canon_hash (ASM_OPERANDS_INPUT (x, i),
2379 GET_MODE (ASM_OPERANDS_INPUT (x, i)))
2380 + canon_hash_string (ASM_OPERANDS_INPUT_CONSTRAINT
2381 (x, i)));
2384 hash += canon_hash_string (ASM_OPERANDS_INPUT_CONSTRAINT (x, 0));
2385 x = ASM_OPERANDS_INPUT (x, 0);
2386 mode = GET_MODE (x);
2387 goto repeat;
2390 return hash;
2392 break;
2394 default:
2395 break;
2398 i = GET_RTX_LENGTH (code) - 1;
2399 hash += (unsigned) code + (unsigned) GET_MODE (x);
2400 fmt = GET_RTX_FORMAT (code);
2401 for (; i >= 0; i--)
2403 if (fmt[i] == 'e')
2405 rtx tem = XEXP (x, i);
2407 /* If we are about to do the last recursive call
2408 needed at this level, change it into iteration.
2409 This function is called enough to be worth it. */
2410 if (i == 0)
2412 x = tem;
2413 goto repeat;
2415 hash += canon_hash (tem, 0);
2417 else if (fmt[i] == 'E')
2418 for (j = 0; j < XVECLEN (x, i); j++)
2419 hash += canon_hash (XVECEXP (x, i, j), 0);
2420 else if (fmt[i] == 's')
2421 hash += canon_hash_string (XSTR (x, i));
2422 else if (fmt[i] == 'i')
2424 unsigned tem = XINT (x, i);
2425 hash += tem;
2427 else if (fmt[i] == '0' || fmt[i] == 't')
2428 /* Unused. */
2430 else
2431 abort ();
2433 return hash;
2436 /* Like canon_hash but with no side effects. */
2438 static unsigned
2439 safe_hash (rtx x, enum machine_mode mode)
2441 int save_do_not_record = do_not_record;
2442 int save_hash_arg_in_memory = hash_arg_in_memory;
2443 unsigned hash = canon_hash (x, mode);
2444 hash_arg_in_memory = save_hash_arg_in_memory;
2445 do_not_record = save_do_not_record;
2446 return hash;
2449 /* Return 1 iff X and Y would canonicalize into the same thing,
2450 without actually constructing the canonicalization of either one.
2451 If VALIDATE is nonzero,
2452 we assume X is an expression being processed from the rtl
2453 and Y was found in the hash table. We check register refs
2454 in Y for being marked as valid.
2456 If EQUAL_VALUES is nonzero, we allow a register to match a constant value
2457 that is known to be in the register. Ordinarily, we don't allow them
2458 to match, because letting them match would cause unpredictable results
2459 in all the places that search a hash table chain for an equivalent
2460 for a given value. A possible equivalent that has different structure
2461 has its hash code computed from different data. Whether the hash code
2462 is the same as that of the given value is pure luck. */
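/* E.g. with EQUAL_VALUES nonzero, (reg 70) (an invented register)
   whose quantity is known to hold (const_int 4) is treated as
   equivalent to (const_int 4) itself.  */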
2464 static int
2465 exp_equiv_p (rtx x, rtx y, int validate, int equal_values)
2467 int i, j;
2468 enum rtx_code code;
2469 const char *fmt;
2471 /* Note: it is incorrect to assume an expression is equivalent to itself
2472 if VALIDATE is nonzero. */
2473 if (x == y && !validate)
2474 return 1;
2475 if (x == 0 || y == 0)
2476 return x == y;
2478 code = GET_CODE (x);
2479 if (code != GET_CODE (y))
2481 if (!equal_values)
2482 return 0;
2484 /* If X is a constant and Y is a register or vice versa, they may be
2485 equivalent. We only have to validate if Y is a register. */
2486 if (CONSTANT_P (x) && GET_CODE (y) == REG
2487 && REGNO_QTY_VALID_P (REGNO (y)))
2489 int y_q = REG_QTY (REGNO (y));
2490 struct qty_table_elem *y_ent = &qty_table[y_q];
2492 if (GET_MODE (y) == y_ent->mode
2493 && rtx_equal_p (x, y_ent->const_rtx)
2494 && (! validate || REG_IN_TABLE (REGNO (y)) == REG_TICK (REGNO (y))))
2495 return 1;
2498 if (CONSTANT_P (y) && code == REG
2499 && REGNO_QTY_VALID_P (REGNO (x)))
2501 int x_q = REG_QTY (REGNO (x));
2502 struct qty_table_elem *x_ent = &qty_table[x_q];
2504 if (GET_MODE (x) == x_ent->mode
2505 && rtx_equal_p (y, x_ent->const_rtx))
2506 return 1;
2509 return 0;
2512 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent. */
2513 if (GET_MODE (x) != GET_MODE (y))
2514 return 0;
2516 switch (code)
2518 case PC:
2519 case CC0:
2520 case CONST_INT:
2521 return x == y;
2523 case LABEL_REF:
2524 return XEXP (x, 0) == XEXP (y, 0);
2526 case SYMBOL_REF:
2527 return XSTR (x, 0) == XSTR (y, 0);
2529 case REG:
2531 unsigned int regno = REGNO (y);
2532 unsigned int endregno
2533 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
2534 : HARD_REGNO_NREGS (regno, GET_MODE (y)));
2535 unsigned int i;
2537 /* If the quantities are not the same, the expressions are not
2538 equivalent. If they are the same and we are not to validate, they
2539 are equivalent. Otherwise, ensure all regs are up-to-date. */
2541 if (REG_QTY (REGNO (x)) != REG_QTY (regno))
2542 return 0;
2544 if (! validate)
2545 return 1;
2547 for (i = regno; i < endregno; i++)
2548 if (REG_IN_TABLE (i) != REG_TICK (i))
2549 return 0;
2551 return 1;
2554 /* For commutative operations, check both orders. */
2555 case PLUS:
2556 case MULT:
2557 case AND:
2558 case IOR:
2559 case XOR:
2560 case NE:
2561 case EQ:
2562 return ((exp_equiv_p (XEXP (x, 0), XEXP (y, 0), validate, equal_values)
2563 && exp_equiv_p (XEXP (x, 1), XEXP (y, 1),
2564 validate, equal_values))
2565 || (exp_equiv_p (XEXP (x, 0), XEXP (y, 1),
2566 validate, equal_values)
2567 && exp_equiv_p (XEXP (x, 1), XEXP (y, 0),
2568 validate, equal_values)));
2570 case ASM_OPERANDS:
2571 /* We don't use the generic code below because we want to
2572 disregard filename and line numbers. */
2574 /* A volatile asm isn't equivalent to any other. */
2575 if (MEM_VOLATILE_P (x) || MEM_VOLATILE_P (y))
2576 return 0;
2578 if (GET_MODE (x) != GET_MODE (y)
2579 || strcmp (ASM_OPERANDS_TEMPLATE (x), ASM_OPERANDS_TEMPLATE (y))
2580 || strcmp (ASM_OPERANDS_OUTPUT_CONSTRAINT (x),
2581 ASM_OPERANDS_OUTPUT_CONSTRAINT (y))
2582 || ASM_OPERANDS_OUTPUT_IDX (x) != ASM_OPERANDS_OUTPUT_IDX (y)
2583 || ASM_OPERANDS_INPUT_LENGTH (x) != ASM_OPERANDS_INPUT_LENGTH (y))
2584 return 0;
2586 if (ASM_OPERANDS_INPUT_LENGTH (x))
2588 for (i = ASM_OPERANDS_INPUT_LENGTH (x) - 1; i >= 0; i--)
2589 if (! exp_equiv_p (ASM_OPERANDS_INPUT (x, i),
2590 ASM_OPERANDS_INPUT (y, i),
2591 validate, equal_values)
2592 || strcmp (ASM_OPERANDS_INPUT_CONSTRAINT (x, i),
2593 ASM_OPERANDS_INPUT_CONSTRAINT (y, i)))
2594 return 0;
2597 return 1;
2599 default:
2600 break;
2603 /* Compare the elements. If any pair of corresponding elements
2604 fails to match, return 0 for the whole thing. */
2606 fmt = GET_RTX_FORMAT (code);
2607 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2609 switch (fmt[i])
2611 case 'e':
2612 if (! exp_equiv_p (XEXP (x, i), XEXP (y, i), validate, equal_values))
2613 return 0;
2614 break;
2616 case 'E':
2617 if (XVECLEN (x, i) != XVECLEN (y, i))
2618 return 0;
2619 for (j = 0; j < XVECLEN (x, i); j++)
2620 if (! exp_equiv_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
2621 validate, equal_values))
2622 return 0;
2623 break;
2625 case 's':
2626 if (strcmp (XSTR (x, i), XSTR (y, i)))
2627 return 0;
2628 break;
2630 case 'i':
2631 if (XINT (x, i) != XINT (y, i))
2632 return 0;
2633 break;
2635 case 'w':
2636 if (XWINT (x, i) != XWINT (y, i))
2637 return 0;
2638 break;
2640 case '0':
2641 case 't':
2642 break;
2644 default:
2645 abort ();
2649 return 1;
2652 /* Return 1 if X has a value that can vary even between two
2653 executions of the program. 0 means X can be compared reliably
2654 against certain constants or near-constants. */
2656 static int
2657 cse_rtx_varies_p (rtx x, int from_alias)
2659 /* We need not check for X and the equivalence class being of the same
2660 mode because if X is equivalent to a constant in some mode, it
2661 doesn't vary in any mode. */
2663 if (GET_CODE (x) == REG
2664 && REGNO_QTY_VALID_P (REGNO (x)))
2666 int x_q = REG_QTY (REGNO (x));
2667 struct qty_table_elem *x_ent = &qty_table[x_q];
2669 if (GET_MODE (x) == x_ent->mode
2670 && x_ent->const_rtx != NULL_RTX)
2671 return 0;
2674 if (GET_CODE (x) == PLUS
2675 && GET_CODE (XEXP (x, 1)) == CONST_INT
2676 && GET_CODE (XEXP (x, 0)) == REG
2677 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 0))))
2679 int x0_q = REG_QTY (REGNO (XEXP (x, 0)));
2680 struct qty_table_elem *x0_ent = &qty_table[x0_q];
2682 if ((GET_MODE (XEXP (x, 0)) == x0_ent->mode)
2683 && x0_ent->const_rtx != NULL_RTX)
2684 return 0;
2687 /* This can happen as the result of virtual register instantiation, if
2688 the initial constant is too large to be a valid address. This gives
2689 us a three-instruction sequence: load a large offset into a register,
2690 load fp minus a constant into a register, then a MEM which is the
2691 sum of the two `constant' registers. */
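/* Schematically (registers and offsets invented):

     (set (reg 66) (const_int 65536))
     (set (reg 67) (plus (reg fp) (const_int -20)))
     ... (mem (plus (reg 66) (reg 67))) ...  */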
2692 if (GET_CODE (x) == PLUS
2693 && GET_CODE (XEXP (x, 0)) == REG
2694 && GET_CODE (XEXP (x, 1)) == REG
2695 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 0)))
2696 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 1))))
2698 int x0_q = REG_QTY (REGNO (XEXP (x, 0)));
2699 int x1_q = REG_QTY (REGNO (XEXP (x, 1)));
2700 struct qty_table_elem *x0_ent = &qty_table[x0_q];
2701 struct qty_table_elem *x1_ent = &qty_table[x1_q];
2703 if ((GET_MODE (XEXP (x, 0)) == x0_ent->mode)
2704 && x0_ent->const_rtx != NULL_RTX
2705 && (GET_MODE (XEXP (x, 1)) == x1_ent->mode)
2706 && x1_ent->const_rtx != NULL_RTX)
2707 return 0;
2710 return rtx_varies_p (x, from_alias);
2713 /* Canonicalize an expression:
2714 replace each register reference inside it
2715 with the "oldest" equivalent register.
2717 If INSN is nonzero and we are replacing a pseudo with a hard register
2718 or vice versa, validate_change is used to ensure that INSN remains valid
2719 after we make our substitution. The calls are made with IN_GROUP nonzero
2720 so apply_change_group must be called upon the outermost return from this
2721 function (unless INSN is zero). The result of apply_change_group can
2722 generally be discarded since the changes we are making are optional. */
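/* For instance (invented registers), if (reg 65) is the oldest
   register equivalent to (reg 70), canon_reg rewrites
   (plus (reg 70) (const_int 4)) as (plus (reg 65) (const_int 4)).  */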
2724 static rtx
2725 canon_reg (rtx x, rtx insn)
2727 int i;
2728 enum rtx_code code;
2729 const char *fmt;
2731 if (x == 0)
2732 return x;
2734 code = GET_CODE (x);
2735 switch (code)
2737 case PC:
2738 case CC0:
2739 case CONST:
2740 case CONST_INT:
2741 case CONST_DOUBLE:
2742 case CONST_VECTOR:
2743 case SYMBOL_REF:
2744 case LABEL_REF:
2745 case ADDR_VEC:
2746 case ADDR_DIFF_VEC:
2747 return x;
2749 case REG:
2751 int first;
2752 int q;
2753 struct qty_table_elem *ent;
2755 /* Never replace a hard reg, because hard regs can appear
2756 in more than one machine mode, and we must preserve the mode
2757 of each occurrence. Also, some hard regs appear in
2758 MEMs that are shared and mustn't be altered. Don't try to
2759 replace any reg that maps to a reg of class NO_REGS. */
2760 if (REGNO (x) < FIRST_PSEUDO_REGISTER
2761 || ! REGNO_QTY_VALID_P (REGNO (x)))
2762 return x;
2764 q = REG_QTY (REGNO (x));
2765 ent = &qty_table[q];
2766 first = ent->first_reg;
2767 return (first >= FIRST_PSEUDO_REGISTER ? regno_reg_rtx[first]
2768 : REGNO_REG_CLASS (first) == NO_REGS ? x
2769 : gen_rtx_REG (ent->mode, first));
2772 default:
2773 break;
2776 fmt = GET_RTX_FORMAT (code);
2777 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2779 int j;
2781 if (fmt[i] == 'e')
2783 rtx new = canon_reg (XEXP (x, i), insn);
2784 int insn_code;
2786 /* If replacing pseudo with hard reg or vice versa, ensure the
2787 insn remains valid. Likewise if the insn has MATCH_DUPs. */
2788 if (insn != 0 && new != 0
2789 && GET_CODE (new) == REG && GET_CODE (XEXP (x, i)) == REG
2790 && (((REGNO (new) < FIRST_PSEUDO_REGISTER)
2791 != (REGNO (XEXP (x, i)) < FIRST_PSEUDO_REGISTER))
2792 || (insn_code = recog_memoized (insn)) < 0
2793 || insn_data[insn_code].n_dups > 0))
2794 validate_change (insn, &XEXP (x, i), new, 1);
2795 else
2796 XEXP (x, i) = new;
2798 else if (fmt[i] == 'E')
2799 for (j = 0; j < XVECLEN (x, i); j++)
2800 XVECEXP (x, i, j) = canon_reg (XVECEXP (x, i, j), insn);
2803 return x;
2806 /* LOC is a location within INSN that is an operand address (the contents of
2807 a MEM). Find the best equivalent address to use that is valid for this
2808 insn.
2810 On most CISC machines, complicated address modes are costly, and rtx_cost
2811 is a good approximation for that cost. However, most RISC machines have
2812 only a few (usually only one) memory reference formats. If an address is
2813 valid at all, it is often just as cheap as any other address. Hence, for
2814 RISC machines, we use `address_cost' to compare the costs of various
2815 addresses. For two addresses of equal cost, choose the one with the
2816 highest `rtx_cost' value as that has the potential of eliminating the
2817 most insns. For equal costs, we choose the first in the equivalence
2818 class. Note that we ignore the fact that pseudo registers are cheaper than
2819 hard registers here because we would also prefer the pseudo registers. */
2821 static void
2822 find_best_addr (rtx insn, rtx *loc, enum machine_mode mode)
2824 struct table_elt *elt;
2825 rtx addr = *loc;
2826 struct table_elt *p;
2827 int found_better = 1;
2828 int save_do_not_record = do_not_record;
2829 int save_hash_arg_in_memory = hash_arg_in_memory;
2830 int addr_volatile;
2831 int regno;
2832 unsigned hash;
2834 /* Do not try to replace constant addresses or addresses of local and
2835 argument slots. These MEM expressions are made only once and inserted
2836 in many instructions, as well as being used to control symbol table
2837 output. It is not safe to clobber them.
2839 There are some uncommon cases where the address is already in a register
2840 for some reason, but we cannot take advantage of that because we have
2841 no easy way to unshare the MEM. In addition, looking up all stack
2842 addresses is costly. */
2843 if ((GET_CODE (addr) == PLUS
2844 && GET_CODE (XEXP (addr, 0)) == REG
2845 && GET_CODE (XEXP (addr, 1)) == CONST_INT
2846 && (regno = REGNO (XEXP (addr, 0)),
2847 regno == FRAME_POINTER_REGNUM || regno == HARD_FRAME_POINTER_REGNUM
2848 || regno == ARG_POINTER_REGNUM))
2849 || (GET_CODE (addr) == REG
2850 && (regno = REGNO (addr), regno == FRAME_POINTER_REGNUM
2851 || regno == HARD_FRAME_POINTER_REGNUM
2852 || regno == ARG_POINTER_REGNUM))
2853 || GET_CODE (addr) == ADDRESSOF
2854 || CONSTANT_ADDRESS_P (addr))
2855 return;
2857 /* If this address is not simply a register, try to fold it. This will
2858 sometimes simplify the expression. Many simplifications
2859 will not be valid, but some, usually applying the associative rule, will
2860 be valid and produce better code. */
2861 if (GET_CODE (addr) != REG)
2863 rtx folded = fold_rtx (copy_rtx (addr), NULL_RTX);
2864 int addr_folded_cost = address_cost (folded, mode);
2865 int addr_cost = address_cost (addr, mode);
2867 if ((addr_folded_cost < addr_cost
2868 || (addr_folded_cost == addr_cost
2869 /* ??? The rtx_cost comparison is left over from an older
2870 version of this code. It is probably no longer helpful. */
2871 && (rtx_cost (folded, MEM) > rtx_cost (addr, MEM)
2872 || approx_reg_cost (folded) < approx_reg_cost (addr))))
2873 && validate_change (insn, loc, folded, 0))
2874 addr = folded;
2877 /* If this address is not in the hash table, we can't look for equivalences
2878 of the whole address. Also, ignore if volatile. */
2880 do_not_record = 0;
2881 hash = HASH (addr, Pmode);
2882 addr_volatile = do_not_record;
2883 do_not_record = save_do_not_record;
2884 hash_arg_in_memory = save_hash_arg_in_memory;
2886 if (addr_volatile)
2887 return;
2889 elt = lookup (addr, hash, Pmode);
2891 if (elt)
2893 /* We need to find the best (under the criteria documented above) entry
2894 in the class that is valid. We use the `flag' field to indicate
2895 choices that were invalid and iterate until we can't find a better
2896 one that hasn't already been tried. */
2898 for (p = elt->first_same_value; p; p = p->next_same_value)
2899 p->flag = 0;
2901 while (found_better)
2903 int best_addr_cost = address_cost (*loc, mode);
2904 int best_rtx_cost = (elt->cost + 1) >> 1;
2905 int exp_cost;
2906 struct table_elt *best_elt = elt;
2908 found_better = 0;
2909 for (p = elt->first_same_value; p; p = p->next_same_value)
2910 if (! p->flag)
2912 if ((GET_CODE (p->exp) == REG
2913 || exp_equiv_p (p->exp, p->exp, 1, 0))
2914 && ((exp_cost = address_cost (p->exp, mode)) < best_addr_cost
2915 || (exp_cost == best_addr_cost
2916 && ((p->cost + 1) >> 1) > best_rtx_cost)))
2918 found_better = 1;
2919 best_addr_cost = exp_cost;
2920 best_rtx_cost = (p->cost + 1) >> 1;
2921 best_elt = p;
2925 if (found_better)
2927 if (validate_change (insn, loc,
2928 canon_reg (copy_rtx (best_elt->exp),
2929 NULL_RTX), 0))
2930 return;
2931 else
2932 best_elt->flag = 1;
2937 /* If the address is a binary operation with the first operand a register
2938 and the second a constant, do the same as above, but looking for
2939 equivalences of the register. Then try to simplify before checking for
2940 the best address to use. This catches a few cases: First is when we
2941 have REG+const and the register is another REG+const. We can often merge
2942 the constants and eliminate one insn and one register. It may also be
2943 that a machine has a cheap REG+REG+const. Finally, this improves the
2944 code on the Alpha for unaligned byte stores. */
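/* A sketch of the first case (registers invented): if (reg 70) is
   equivalent to (plus (reg 65) (const_int 4)), then

     (plus (reg 70) (const_int 8))

   simplifies to (plus (reg 65) (const_int 12)), saving an insn and a
   register.  */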
2946 if (flag_expensive_optimizations
2947 && (GET_RTX_CLASS (GET_CODE (*loc)) == '2'
2948 || GET_RTX_CLASS (GET_CODE (*loc)) == 'c')
2949 && GET_CODE (XEXP (*loc, 0)) == REG)
2951 rtx op1 = XEXP (*loc, 1);
2953 do_not_record = 0;
2954 hash = HASH (XEXP (*loc, 0), Pmode);
2955 do_not_record = save_do_not_record;
2956 hash_arg_in_memory = save_hash_arg_in_memory;
2958 elt = lookup (XEXP (*loc, 0), hash, Pmode);
2959 if (elt == 0)
2960 return;
2962 /* We need to find the best (under the criteria documented above) entry
2963 in the class that is valid. We use the `flag' field to indicate
2964 choices that were invalid and iterate until we can't find a better
2965 one that hasn't already been tried. */
2967 for (p = elt->first_same_value; p; p = p->next_same_value)
2968 p->flag = 0;
2970 while (found_better)
2972 int best_addr_cost = address_cost (*loc, mode);
2973 int best_rtx_cost = (COST (*loc) + 1) >> 1;
2974 struct table_elt *best_elt = elt;
2975 rtx best_rtx = *loc;
2976 int count;
2978 /* In the worst case this is an O(n^2) algorithm, so limit our search
2979 to the first 32 elements on the list. This avoids trouble
2980 compiling code with very long basic blocks that can easily
2981 call simplify_gen_binary so many times that we run out of
2982 memory. */
2984 found_better = 0;
2985 for (p = elt->first_same_value, count = 0;
2986 p && count < 32;
2987 p = p->next_same_value, count++)
2988 if (! p->flag
2989 && (GET_CODE (p->exp) == REG
2990 || exp_equiv_p (p->exp, p->exp, 1, 0)))
2992 rtx new = simplify_gen_binary (GET_CODE (*loc), Pmode,
2993 p->exp, op1);
2994 int new_cost;
2995 new_cost = address_cost (new, mode);
2997 if (new_cost < best_addr_cost
2998 || (new_cost == best_addr_cost
2999 && (COST (new) + 1) >> 1 > best_rtx_cost))
3001 found_better = 1;
3002 best_addr_cost = new_cost;
3003 best_rtx_cost = (COST (new) + 1) >> 1;
3004 best_elt = p;
3005 best_rtx = new;
3009 if (found_better)
3011 if (validate_change (insn, loc,
3012 canon_reg (copy_rtx (best_rtx),
3013 NULL_RTX), 0))
3014 return;
3015 else
3016 best_elt->flag = 1;
3022 /* Given an operation (CODE, *PARG1, *PARG2), where code is a comparison
3023 operation (EQ, NE, GT, etc.), follow it back through the hash table and
3024 find what values are being compared.
3026 *PARG1 and *PARG2 are updated to contain the rtx representing the values
3027 actually being compared. For example, if *PARG1 was (cc0) and *PARG2
3028 was (const_int 0), *PARG1 and *PARG2 will be set to the objects that were
3029 compared to produce cc0.
3031 The return value is the comparison operator and is either the code of
3032 A or the code corresponding to the inverse of the comparison. */
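/* A schematic example (registers invented): if CODE is NE, *PARG1 is
   a register known to be equal to (lt (reg 65) (reg 66)), and *PARG2
   is (const_int 0), we return LT with *PARG1 = (reg 65) and
   *PARG2 = (reg 66).  */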
3034 static enum rtx_code
3035 find_comparison_args (enum rtx_code code, rtx *parg1, rtx *parg2,
3036 enum machine_mode *pmode1, enum machine_mode *pmode2)
3038 rtx arg1, arg2;
3040 arg1 = *parg1, arg2 = *parg2;
3042 /* If ARG2 is const0_rtx, see what ARG1 is equivalent to. */
3044 while (arg2 == CONST0_RTX (GET_MODE (arg1)))
3046 /* Set nonzero when we find something of interest. */
3047 rtx x = 0;
3048 int reverse_code = 0;
3049 struct table_elt *p = 0;
3051 /* If arg1 is a COMPARE, extract the comparison arguments from it.
3052 On machines with CC0, this is the only case that can occur, since
3053 fold_rtx will return the COMPARE or item being compared with zero
3054 when given CC0. */
3056 if (GET_CODE (arg1) == COMPARE && arg2 == const0_rtx)
3057 x = arg1;
3059 /* If ARG1 is a comparison operator and CODE is testing for
3060 STORE_FLAG_VALUE, get the inner arguments. */
3062 else if (GET_RTX_CLASS (GET_CODE (arg1)) == '<')
3064 #ifdef FLOAT_STORE_FLAG_VALUE
3065 REAL_VALUE_TYPE fsfv;
3066 #endif
3068 if (code == NE
3069 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
3070 && code == LT && STORE_FLAG_VALUE == -1)
3071 #ifdef FLOAT_STORE_FLAG_VALUE
3072 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
3073 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3074 REAL_VALUE_NEGATIVE (fsfv)))
3075 #endif
3077 x = arg1;
3078 else if (code == EQ
3079 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
3080 && code == GE && STORE_FLAG_VALUE == -1)
3081 #ifdef FLOAT_STORE_FLAG_VALUE
3082 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
3083 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3084 REAL_VALUE_NEGATIVE (fsfv)))
3085 #endif
3087 x = arg1, reverse_code = 1;
3090 /* ??? We could also check for
3092 (ne (and (eq (...) (const_int 1))) (const_int 0))
3094 and related forms, but let's wait until we see them occurring. */
3096 if (x == 0)
3097 /* Look up ARG1 in the hash table and see if it has an equivalence
3098 that lets us see what is being compared. */
3099 p = lookup (arg1, safe_hash (arg1, GET_MODE (arg1)) & HASH_MASK,
3100 GET_MODE (arg1));
3101 if (p)
3103 p = p->first_same_value;
3105 /* If what we compare is already known to be constant, that is as
3106 good as it gets.
3107 We need to break the loop in this case, because otherwise we
3108 can have an infinite loop when looking at a reg that is known
3109 to be a constant which is the same as a comparison of a reg
3110 against zero which appears later in the insn stream, which in
3111 turn is constant and the same as the comparison of the first reg
3112 against zero... */
3113 if (p->is_const)
3114 break;
3117 for (; p; p = p->next_same_value)
3119 enum machine_mode inner_mode = GET_MODE (p->exp);
3120 #ifdef FLOAT_STORE_FLAG_VALUE
3121 REAL_VALUE_TYPE fsfv;
3122 #endif
3124 /* If the entry isn't valid, skip it. */
3125 if (! exp_equiv_p (p->exp, p->exp, 1, 0))
3126 continue;
3128 if (GET_CODE (p->exp) == COMPARE
3129 /* Another possibility is that this machine has a compare insn
3130 that includes the comparison code. In that case, ARG1 would
3131 be equivalent to a comparison operation that would set ARG1 to
3132 either STORE_FLAG_VALUE or zero. If this is an NE operation,
3133 ORIG_CODE is the actual comparison being done; if it is an EQ,
3134 we must reverse ORIG_CODE. On machines with a negative value
3135 for STORE_FLAG_VALUE, also look at LT and GE operations. */
3136 || ((code == NE
3137 || (code == LT
3138 && GET_MODE_CLASS (inner_mode) == MODE_INT
3139 && (GET_MODE_BITSIZE (inner_mode)
3140 <= HOST_BITS_PER_WIDE_INT)
3141 && (STORE_FLAG_VALUE
3142 & ((HOST_WIDE_INT) 1
3143 << (GET_MODE_BITSIZE (inner_mode) - 1))))
3144 #ifdef FLOAT_STORE_FLAG_VALUE
3145 || (code == LT
3146 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
3147 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3148 REAL_VALUE_NEGATIVE (fsfv)))
3149 #endif
3151 && GET_RTX_CLASS (GET_CODE (p->exp)) == '<'))
3153 x = p->exp;
3154 break;
3156 else if ((code == EQ
3157 || (code == GE
3158 && GET_MODE_CLASS (inner_mode) == MODE_INT
3159 && (GET_MODE_BITSIZE (inner_mode)
3160 <= HOST_BITS_PER_WIDE_INT)
3161 && (STORE_FLAG_VALUE
3162 & ((HOST_WIDE_INT) 1
3163 << (GET_MODE_BITSIZE (inner_mode) - 1))))
3164 #ifdef FLOAT_STORE_FLAG_VALUE
3165 || (code == GE
3166 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
3167 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3168 REAL_VALUE_NEGATIVE (fsfv)))
3169 #endif
3171 && GET_RTX_CLASS (GET_CODE (p->exp)) == '<')
3173 reverse_code = 1;
3174 x = p->exp;
3175 break;
3178 /* If this is a non-trapping address, e.g. fp + constant, the
3179 equivalent is a better operand since it may let us predict
3180 the value of the comparison. */
3181 else if (!rtx_addr_can_trap_p (p->exp))
3183 arg1 = p->exp;
3184 continue;
3188 /* If we didn't find a useful equivalence for ARG1, we are done.
3189 Otherwise, set up for the next iteration. */
3190 if (x == 0)
3191 break;
3193 /* If we need to reverse the comparison, make sure it is
3194 possible -- we can't necessarily infer the value of GE from LT
3195 with floating-point operands. */
3196 if (reverse_code)
3198 enum rtx_code reversed = reversed_comparison_code (x, NULL_RTX);
3199 if (reversed == UNKNOWN)
3200 break;
3201 else
3202 code = reversed;
3204 else if (GET_RTX_CLASS (GET_CODE (x)) == '<')
3205 code = GET_CODE (x);
3206 arg1 = XEXP (x, 0), arg2 = XEXP (x, 1);
3209 /* Return our results. Return the modes from before fold_rtx
3210 because fold_rtx might produce const_int, and then it's too late. */
3211 *pmode1 = GET_MODE (arg1), *pmode2 = GET_MODE (arg2);
3212 *parg1 = fold_rtx (arg1, 0), *parg2 = fold_rtx (arg2, 0);
3214 return code;
3217 /* If X is a nontrivial arithmetic operation on an argument
3218 for which a constant value can be determined, return
3219 the result of operating on that value, as a constant.
3220 Otherwise, return X, possibly with one or more operands
3221 modified by recursive calls to this function.
3223 If X is a register whose contents are known, we do NOT
3224 return those contents here. equiv_constant is called to
3225 perform that task.
3227 INSN is the insn that we may be modifying. If it is 0, make a copy
3228 of X before modifying it. */
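/* A minimal illustration (operands invented): folding
   (plus (reg 70) (reg 71)) where the registers have known constant
   equivalents (const_int 2) and (const_int 3) yields (const_int 5)
   via simplify_binary_operation below.  */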
3230 static rtx
3231 fold_rtx (rtx x, rtx insn)
3233 enum rtx_code code;
3234 enum machine_mode mode;
3235 const char *fmt;
3236 int i;
3237 rtx new = 0;
3238 int copied = 0;
3239 int must_swap = 0;
3241 /* Folded equivalents of first two operands of X. */
3242 rtx folded_arg0;
3243 rtx folded_arg1;
3245 /* Constant equivalents of first three operands of X;
3246 0 when no such equivalent is known. */
3247 rtx const_arg0;
3248 rtx const_arg1;
3249 rtx const_arg2;
3251 /* The mode of the first operand of X. We need this for sign and zero
3252 extends. */
3253 enum machine_mode mode_arg0;
3255 if (x == 0)
3256 return x;
3258 mode = GET_MODE (x);
3259 code = GET_CODE (x);
3260 switch (code)
3262 case CONST:
3263 case CONST_INT:
3264 case CONST_DOUBLE:
3265 case CONST_VECTOR:
3266 case SYMBOL_REF:
3267 case LABEL_REF:
3268 case REG:
3269 /* No use simplifying an EXPR_LIST
3270 since they are used only for lists of args
3271 in a function call's REG_EQUAL note. */
3272 case EXPR_LIST:
3273 /* Changing anything inside an ADDRESSOF is incorrect; we don't
3274 want to (e.g.,) make (addressof (const_int 0)) just because
3275 the location is known to be zero. */
3276 case ADDRESSOF:
3277 return x;
3279 #ifdef HAVE_cc0
3280 case CC0:
3281 return prev_insn_cc0;
3282 #endif
3284 case PC:
3285 /* If the next insn is a CODE_LABEL followed by a jump table,
3286 PC's value is a LABEL_REF pointing to that label. That
3287 lets us fold switch statements on the VAX. */
3289 rtx next;
3290 if (insn && tablejump_p (insn, &next, NULL))
3291 return gen_rtx_LABEL_REF (Pmode, next);
3293 break;
3295 case SUBREG:
3296 /* See if we previously assigned a constant value to this SUBREG. */
3297 if ((new = lookup_as_function (x, CONST_INT)) != 0
3298 || (new = lookup_as_function (x, CONST_DOUBLE)) != 0)
3299 return new;
3301 /* If this is a paradoxical SUBREG, we have no idea what value the
3302 extra bits would have. However, if the operand is equivalent
3303 to a SUBREG whose operand is the same as our mode, and all the
3304 modes are within a word, we can just use the inner operand
3305 because these SUBREGs just say how to treat the register.
3307 Similarly if we find an integer constant. */
3309 if (GET_MODE_SIZE (mode) > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
3311 enum machine_mode imode = GET_MODE (SUBREG_REG (x));
3312 struct table_elt *elt;
3314 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD
3315 && GET_MODE_SIZE (imode) <= UNITS_PER_WORD
3316 && (elt = lookup (SUBREG_REG (x), HASH (SUBREG_REG (x), imode),
3317 imode)) != 0)
3318 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
3320 if (CONSTANT_P (elt->exp)
3321 && GET_MODE (elt->exp) == VOIDmode)
3322 return elt->exp;
3324 if (GET_CODE (elt->exp) == SUBREG
3325 && GET_MODE (SUBREG_REG (elt->exp)) == mode
3326 && exp_equiv_p (elt->exp, elt->exp, 1, 0))
3327 return copy_rtx (SUBREG_REG (elt->exp));
3330 return x;
3333 /* Fold SUBREG_REG. If it changed, see if we can simplify the SUBREG.
3334 We might be able to if the SUBREG is extracting a single word in an
3335 integral mode or extracting the low part. */
3337 folded_arg0 = fold_rtx (SUBREG_REG (x), insn);
3338 const_arg0 = equiv_constant (folded_arg0);
3339 if (const_arg0)
3340 folded_arg0 = const_arg0;
3342 if (folded_arg0 != SUBREG_REG (x))
3344 new = simplify_subreg (mode, folded_arg0,
3345 GET_MODE (SUBREG_REG (x)), SUBREG_BYTE (x));
3346 if (new)
3347 return new;
3350 /* If this is a narrowing SUBREG and our operand is a REG, see if
3351 we can find an equivalence for REG that is an arithmetic operation
3352 in a wider mode where both operands are paradoxical SUBREGs
3353 from objects of our result mode. In that case, we couldn't report
3354 an equivalent value for that operation, since we don't know what the
3355 extra bits will be. But we can find an equivalence for this SUBREG
3356 by folding that operation in the narrow mode. This allows us to
3357 fold arithmetic in narrow modes when the machine only supports
3358 word-sized arithmetic.
3360 Also look for a case where we have a SUBREG whose operand is the
3361 same as our result. If both modes are smaller than a word, we
3362 are simply interpreting a register in different modes and we
3363 can use the inner value. */
3365 if (GET_CODE (folded_arg0) == REG
3366 && GET_MODE_SIZE (mode) < GET_MODE_SIZE (GET_MODE (folded_arg0))
3367 && subreg_lowpart_p (x))
3369 struct table_elt *elt;
3371 /* We can use HASH here since we know that canon_hash won't be
3372 called. */
3373 elt = lookup (folded_arg0,
3374 HASH (folded_arg0, GET_MODE (folded_arg0)),
3375 GET_MODE (folded_arg0));
3377 if (elt)
3378 elt = elt->first_same_value;
3380 for (; elt; elt = elt->next_same_value)
3382 enum rtx_code eltcode = GET_CODE (elt->exp);
3384 /* Just check for unary and binary operations. */
3385 if (GET_RTX_CLASS (GET_CODE (elt->exp)) == '1'
3386 && GET_CODE (elt->exp) != SIGN_EXTEND
3387 && GET_CODE (elt->exp) != ZERO_EXTEND
3388 && GET_CODE (XEXP (elt->exp, 0)) == SUBREG
3389 && GET_MODE (SUBREG_REG (XEXP (elt->exp, 0))) == mode
3390 && (GET_MODE_CLASS (mode)
3391 == GET_MODE_CLASS (GET_MODE (XEXP (elt->exp, 0)))))
3393 rtx op0 = SUBREG_REG (XEXP (elt->exp, 0));
3395 if (GET_CODE (op0) != REG && ! CONSTANT_P (op0))
3396 op0 = fold_rtx (op0, NULL_RTX);
3398 op0 = equiv_constant (op0);
3399 if (op0)
3400 new = simplify_unary_operation (GET_CODE (elt->exp), mode,
3401 op0, mode);
3403 else if ((GET_RTX_CLASS (GET_CODE (elt->exp)) == '2'
3404 || GET_RTX_CLASS (GET_CODE (elt->exp)) == 'c')
3405 && eltcode != DIV && eltcode != MOD
3406 && eltcode != UDIV && eltcode != UMOD
3407 && eltcode != ASHIFTRT && eltcode != LSHIFTRT
3408 && eltcode != ROTATE && eltcode != ROTATERT
3409 && ((GET_CODE (XEXP (elt->exp, 0)) == SUBREG
3410 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 0)))
3411 == mode))
3412 || CONSTANT_P (XEXP (elt->exp, 0)))
3413 && ((GET_CODE (XEXP (elt->exp, 1)) == SUBREG
3414 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 1)))
3415 == mode))
3416 || CONSTANT_P (XEXP (elt->exp, 1))))
3418 rtx op0 = gen_lowpart_common (mode, XEXP (elt->exp, 0));
3419 rtx op1 = gen_lowpart_common (mode, XEXP (elt->exp, 1));
3421 if (op0 && GET_CODE (op0) != REG && ! CONSTANT_P (op0))
3422 op0 = fold_rtx (op0, NULL_RTX);
3424 if (op0)
3425 op0 = equiv_constant (op0);
3427 if (op1 && GET_CODE (op1) != REG && ! CONSTANT_P (op1))
3428 op1 = fold_rtx (op1, NULL_RTX);
3430 if (op1)
3431 op1 = equiv_constant (op1);
3433 /* If we are looking for the low SImode part of
3434 (ashift:DI c (const_int 32)), it doesn't work
3435 to compute that in SImode, because a 32-bit shift
3436 in SImode is unpredictable. We know the value is 0. */
3437 if (op0 && op1
3438 && GET_CODE (elt->exp) == ASHIFT
3439 && GET_CODE (op1) == CONST_INT
3440 && INTVAL (op1) >= GET_MODE_BITSIZE (mode))
3442 if (INTVAL (op1) < GET_MODE_BITSIZE (GET_MODE (elt->exp)))
3444 /* If the count fits in the inner mode's width,
3445 but exceeds the outer mode's width,
3446 the value will get truncated to 0
3447 by the subreg. */
3448 new = const0_rtx;
3449 else
3450 /* If the count exceeds even the inner mode's width,
3451 don't fold this expression. */
3452 new = 0;
3454 else if (op0 && op1)
3455 new = simplify_binary_operation (GET_CODE (elt->exp), mode,
3456 op0, op1);
3459 else if (GET_CODE (elt->exp) == SUBREG
3460 && GET_MODE (SUBREG_REG (elt->exp)) == mode
3461 && (GET_MODE_SIZE (GET_MODE (folded_arg0))
3462 <= UNITS_PER_WORD)
3463 && exp_equiv_p (elt->exp, elt->exp, 1, 0))
3464 new = copy_rtx (SUBREG_REG (elt->exp));
3466 if (new)
3467 return new;
3471 return x;
3473 case NOT:
3474 case NEG:
3475 /* If we have (NOT Y), see if Y is known to be (NOT Z).
3476 If so, (NOT Y) simplifies to Z. Similarly for NEG. */
3477 new = lookup_as_function (XEXP (x, 0), code);
3478 if (new)
3479 return fold_rtx (copy_rtx (XEXP (new, 0)), insn);
3480 break;
3482 case MEM:
3483 /* If we are not actually processing an insn, don't try to find the
3484 best address. Not only don't we care, but we could modify the
3485 MEM in an invalid way since we have no insn to validate against. */
3486 if (insn != 0)
3487 find_best_addr (insn, &XEXP (x, 0), GET_MODE (x));
3490 /* Even if we don't fold in the insn itself,
3491 we can safely do so here, in hopes of getting a constant. */
3492 rtx addr = fold_rtx (XEXP (x, 0), NULL_RTX);
3493 rtx base = 0;
3494 HOST_WIDE_INT offset = 0;
3496 if (GET_CODE (addr) == REG
3497 && REGNO_QTY_VALID_P (REGNO (addr)))
3499 int addr_q = REG_QTY (REGNO (addr));
3500 struct qty_table_elem *addr_ent = &qty_table[addr_q];
3502 if (GET_MODE (addr) == addr_ent->mode
3503 && addr_ent->const_rtx != NULL_RTX)
3504 addr = addr_ent->const_rtx;
3507 /* If address is constant, split it into a base and integer offset. */
3508 if (GET_CODE (addr) == SYMBOL_REF || GET_CODE (addr) == LABEL_REF)
3509 base = addr;
3510 else if (GET_CODE (addr) == CONST && GET_CODE (XEXP (addr, 0)) == PLUS
3511 && GET_CODE (XEXP (XEXP (addr, 0), 1)) == CONST_INT)
3513 base = XEXP (XEXP (addr, 0), 0);
3514 offset = INTVAL (XEXP (XEXP (addr, 0), 1));
3516 else if (GET_CODE (addr) == LO_SUM
3517 && GET_CODE (XEXP (addr, 1)) == SYMBOL_REF)
3518 base = XEXP (addr, 1);
3519 else if (GET_CODE (addr) == ADDRESSOF)
3520 return change_address (x, VOIDmode, addr);
3522 /* If this is a constant pool reference, we can fold it into its
3523 constant to allow better value tracking. */
3524 if (base && GET_CODE (base) == SYMBOL_REF
3525 && CONSTANT_POOL_ADDRESS_P (base))
3527 rtx constant = get_pool_constant (base);
3528 enum machine_mode const_mode = get_pool_mode (base);
3529 rtx new;
3531 if (CONSTANT_P (constant) && GET_CODE (constant) != CONST_INT)
3532 constant_pool_entries_cost = COST (constant);
3534 /* If we are loading the full constant, we have an equivalence. */
3535 if (offset == 0 && mode == const_mode)
3536 return constant;
3538 /* If this actually isn't a constant (weird!), we can't do
3539 anything. Otherwise, handle the two most common cases:
3540 extracting a word from a multi-word constant, and extracting
3541 the low-order bits. Other cases don't seem common enough to
3542 worry about. */
3543 if (! CONSTANT_P (constant))
3544 return x;
3546 if (GET_MODE_CLASS (mode) == MODE_INT
3547 && GET_MODE_SIZE (mode) == UNITS_PER_WORD
3548 && offset % UNITS_PER_WORD == 0
3549 && (new = operand_subword (constant,
3550 offset / UNITS_PER_WORD,
3551 0, const_mode)) != 0)
3552 return new;
3554 if (((BYTES_BIG_ENDIAN
3555 && offset == GET_MODE_SIZE (GET_MODE (constant)) - 1)
3556 || (! BYTES_BIG_ENDIAN && offset == 0))
3557 && (new = gen_lowpart_if_possible (mode, constant)) != 0)
3558 return new;
3561 /* If this is a reference to a label at a known position in a jump
3562 table, we also know its value. */
3563 if (base && GET_CODE (base) == LABEL_REF)
3565 rtx label = XEXP (base, 0);
3566 rtx table_insn = NEXT_INSN (label);
3568 if (table_insn && GET_CODE (table_insn) == JUMP_INSN
3569 && GET_CODE (PATTERN (table_insn)) == ADDR_VEC)
3571 rtx table = PATTERN (table_insn);
3573 if (offset >= 0
3574 && (offset / GET_MODE_SIZE (GET_MODE (table))
3575 < XVECLEN (table, 0)))
3576 return XVECEXP (table, 0,
3577 offset / GET_MODE_SIZE (GET_MODE (table)));
3579 if (table_insn && GET_CODE (table_insn) == JUMP_INSN
3580 && GET_CODE (PATTERN (table_insn)) == ADDR_DIFF_VEC)
3582 rtx table = PATTERN (table_insn);
3584 if (offset >= 0
3585 && (offset / GET_MODE_SIZE (GET_MODE (table))
3586 < XVECLEN (table, 1)))
3588 offset /= GET_MODE_SIZE (GET_MODE (table));
3589 new = gen_rtx_MINUS (Pmode, XVECEXP (table, 1, offset),
3590 XEXP (table, 0));
3592 if (GET_MODE (table) != Pmode)
3593 new = gen_rtx_TRUNCATE (GET_MODE (table), new);
3595 /* Indicate this is a constant. This isn't a
3596 valid form of CONST, but it will only be used
3597 to fold the next insns and then discarded, so
3598 it should be safe.
3600 Note this expression must be explicitly discarded,
3601 by cse_insn, else it may end up in a REG_EQUAL note
3602 and "escape" to cause problems elsewhere. */
3603 return gen_rtx_CONST (GET_MODE (new), new);
3608 return x;
3611 #ifdef NO_FUNCTION_CSE
3612 case CALL:
3613 if (CONSTANT_P (XEXP (XEXP (x, 0), 0)))
3614 return x;
3615 break;
3616 #endif
3618 case ASM_OPERANDS:
3619 for (i = ASM_OPERANDS_INPUT_LENGTH (x) - 1; i >= 0; i--)
3620 validate_change (insn, &ASM_OPERANDS_INPUT (x, i),
3621 fold_rtx (ASM_OPERANDS_INPUT (x, i), insn), 0);
3622 break;
3624 default:
3625 break;
3628 const_arg0 = 0;
3629 const_arg1 = 0;
3630 const_arg2 = 0;
3631 mode_arg0 = VOIDmode;
3633 /* Try folding our operands.
3634 Then see which ones have constant values known. */
3636 fmt = GET_RTX_FORMAT (code);
3637 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3638 if (fmt[i] == 'e')
3640 rtx arg = XEXP (x, i);
3641 rtx folded_arg = arg, const_arg = 0;
3642 enum machine_mode mode_arg = GET_MODE (arg);
3643 rtx cheap_arg, expensive_arg;
3644 rtx replacements[2];
3645 int j;
3646 int old_cost = COST_IN (XEXP (x, i), code);
3648 /* Most arguments are cheap, so handle them specially. */
3649 switch (GET_CODE (arg))
3651 case REG:
3652 /* This is the same as calling equiv_constant; it is duplicated
3653 here for speed. */
3654 if (REGNO_QTY_VALID_P (REGNO (arg)))
3656 int arg_q = REG_QTY (REGNO (arg));
3657 struct qty_table_elem *arg_ent = &qty_table[arg_q];
3659 if (arg_ent->const_rtx != NULL_RTX
3660 && GET_CODE (arg_ent->const_rtx) != REG
3661 && GET_CODE (arg_ent->const_rtx) != PLUS)
3662 const_arg
3663 = gen_lowpart_if_possible (GET_MODE (arg),
3664 arg_ent->const_rtx);
3666 break;
3668 case CONST:
3669 case CONST_INT:
3670 case SYMBOL_REF:
3671 case LABEL_REF:
3672 case CONST_DOUBLE:
3673 case CONST_VECTOR:
3674 const_arg = arg;
3675 break;
3677 #ifdef HAVE_cc0
3678 case CC0:
3679 folded_arg = prev_insn_cc0;
3680 mode_arg = prev_insn_cc0_mode;
3681 const_arg = equiv_constant (folded_arg);
3682 break;
3683 #endif
3685 default:
3686 folded_arg = fold_rtx (arg, insn);
3687 const_arg = equiv_constant (folded_arg);
3690 /* For the first three operands, see if the operand
3691 is constant or equivalent to a constant. */
3692 switch (i)
3694 case 0:
3695 folded_arg0 = folded_arg;
3696 const_arg0 = const_arg;
3697 mode_arg0 = mode_arg;
3698 break;
3699 case 1:
3700 folded_arg1 = folded_arg;
3701 const_arg1 = const_arg;
3702 break;
3703 case 2:
3704 const_arg2 = const_arg;
3705 break;
3708 /* Pick the least expensive of the folded argument and an
3709 equivalent constant argument. */
3710 if (const_arg == 0 || const_arg == folded_arg
3711 || COST_IN (const_arg, code) > COST_IN (folded_arg, code))
3712 cheap_arg = folded_arg, expensive_arg = const_arg;
3713 else
3714 cheap_arg = const_arg, expensive_arg = folded_arg;
3716 /* Try to replace the operand with the cheapest of the two
3717 possibilities. If it doesn't work and this is either of the first
3718 two operands of a commutative operation, try swapping them.
3719 If THAT fails, try the more expensive, provided it is cheaper
3720 than what is already there. */
3722 if (cheap_arg == XEXP (x, i))
3723 continue;
3725 if (insn == 0 && ! copied)
3727 x = copy_rtx (x);
3728 copied = 1;
3731 /* Order the replacements from cheapest to most expensive. */
3732 replacements[0] = cheap_arg;
3733 replacements[1] = expensive_arg;
3735 for (j = 0; j < 2 && replacements[j]; j++)
3737 int new_cost = COST_IN (replacements[j], code);
3739 /* Stop if what existed before was cheaper. Prefer constants
3740 in the case of a tie. */
3741 if (new_cost > old_cost
3742 || (new_cost == old_cost && CONSTANT_P (XEXP (x, i))))
3743 break;
3745 if (validate_change (insn, &XEXP (x, i), replacements[j], 0))
3746 break;
3748 if (code == NE || code == EQ || GET_RTX_CLASS (code) == 'c'
3749 || code == LTGT || code == UNEQ || code == ORDERED
3750 || code == UNORDERED)
3752 validate_change (insn, &XEXP (x, i), XEXP (x, 1 - i), 1);
3753 validate_change (insn, &XEXP (x, 1 - i), replacements[j], 1);
3755 if (apply_change_group ())
3757 /* Swap them back to be invalid so that this loop can
3758 continue and flag them to be swapped back later. */
3759 rtx tem;
3761 tem = XEXP (x, 0); XEXP (x, 0) = XEXP (x, 1);
3762 XEXP (x, 1) = tem;
3763 must_swap = 1;
3764 break;
3770 else
3772 if (fmt[i] == 'E')
3773 /* Don't try to fold inside of a vector of expressions.
3774 Doing nothing is harmless. */
3778 /* If a commutative operation, place a constant integer as the second
3779 operand unless the first operand is also a constant integer. Otherwise,
3780 place any constant second unless the first operand is also a constant. */
3782 if (code == EQ || code == NE || GET_RTX_CLASS (code) == 'c'
3783 || code == LTGT || code == UNEQ || code == ORDERED
3784 || code == UNORDERED)
3786 if (must_swap || (const_arg0
3787 && (const_arg1 == 0
3788 || (GET_CODE (const_arg0) == CONST_INT
3789 && GET_CODE (const_arg1) != CONST_INT))))
3791 rtx tem = XEXP (x, 0);
3793 if (insn == 0 && ! copied)
3795 x = copy_rtx (x);
3796 copied = 1;
3799 validate_change (insn, &XEXP (x, 0), XEXP (x, 1), 1);
3800 validate_change (insn, &XEXP (x, 1), tem, 1);
3801 if (apply_change_group ())
3803 tem = const_arg0, const_arg0 = const_arg1, const_arg1 = tem;
3804 tem = folded_arg0, folded_arg0 = folded_arg1, folded_arg1 = tem;
3809 /* If X is an arithmetic operation, see if we can simplify it. */
3811 switch (GET_RTX_CLASS (code))
3813 case '1':
3815 int is_const = 0;
3817 /* We can't simplify extension ops unless we know the
3818 original mode. */
3819 if ((code == ZERO_EXTEND || code == SIGN_EXTEND)
3820 && mode_arg0 == VOIDmode)
3821 break;
3823 /* If we had a CONST, strip it off and put it back later if we
3824 fold. */
3825 if (const_arg0 != 0 && GET_CODE (const_arg0) == CONST)
3826 is_const = 1, const_arg0 = XEXP (const_arg0, 0);
3828 new = simplify_unary_operation (code, mode,
3829 const_arg0 ? const_arg0 : folded_arg0,
3830 mode_arg0);
3831 if (new != 0 && is_const)
3832 new = gen_rtx_CONST (mode, new);
3834 break;
3836 case '<':
3837 /* See what items are actually being compared and set FOLDED_ARG[01]
3838 to those values and CODE to the actual comparison code. If any are
3839 constant, set CONST_ARG0 and CONST_ARG1 appropriately. We needn't
3840 do anything if both operands are already known to be constant. */
3842 if (const_arg0 == 0 || const_arg1 == 0)
3844 struct table_elt *p0, *p1;
3845 rtx true_rtx = const_true_rtx, false_rtx = const0_rtx;
3846 enum machine_mode mode_arg1;
3848 #ifdef FLOAT_STORE_FLAG_VALUE
3849 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
3851 true_rtx = (CONST_DOUBLE_FROM_REAL_VALUE
3852 (FLOAT_STORE_FLAG_VALUE (mode), mode));
3853 false_rtx = CONST0_RTX (mode);
3855 #endif
3857 code = find_comparison_args (code, &folded_arg0, &folded_arg1,
3858 &mode_arg0, &mode_arg1);
3859 const_arg0 = equiv_constant (folded_arg0);
3860 const_arg1 = equiv_constant (folded_arg1);
3862 /* If the mode is VOIDmode or a MODE_CC mode, we don't know
3863 what kinds of things are being compared, so we can't do
3864 anything with this comparison. */
3866 if (mode_arg0 == VOIDmode || GET_MODE_CLASS (mode_arg0) == MODE_CC)
3867 break;
3869 /* If we do not now have two constants being compared, see
3870 if we can nevertheless deduce some things about the
3871 comparison. */
3872 if (const_arg0 == 0 || const_arg1 == 0)
3874 /* Some addresses are known to be nonzero. We don't know
3875 their sign, but equality comparisons are known. */
3876 if (const_arg1 == const0_rtx
3877 && nonzero_address_p (folded_arg0))
3879 if (code == EQ)
3880 return false_rtx;
3881 else if (code == NE)
3882 return true_rtx;
3885 /* See if the two operands are the same. */
3887 if (folded_arg0 == folded_arg1
3888 || (GET_CODE (folded_arg0) == REG
3889 && GET_CODE (folded_arg1) == REG
3890 && (REG_QTY (REGNO (folded_arg0))
3891 == REG_QTY (REGNO (folded_arg1))))
3892 || ((p0 = lookup (folded_arg0,
3893 (safe_hash (folded_arg0, mode_arg0)
3894 & HASH_MASK), mode_arg0))
3895 && (p1 = lookup (folded_arg1,
3896 (safe_hash (folded_arg1, mode_arg0)
3897 & HASH_MASK), mode_arg0))
3898 && p0->first_same_value == p1->first_same_value))
3900 /* Sadly two equal NaNs are not equivalent. */
3901 if (!HONOR_NANS (mode_arg0))
3902 return ((code == EQ || code == LE || code == GE
3903 || code == LEU || code == GEU || code == UNEQ
3904 || code == UNLE || code == UNGE
3905 || code == ORDERED)
3906 ? true_rtx : false_rtx);
3908 /* Take care of the FP compares we can still resolve. */
3908 if (code == UNEQ || code == UNLE || code == UNGE)
3909 return true_rtx;
3910 if (code == LTGT || code == LT || code == GT)
3911 return false_rtx;
3914 /* If FOLDED_ARG0 is a register, see if the comparison we are
3915 doing now is either the same as we did before or the reverse
3916 (we only check the reverse if not floating-point). */
3917 else if (GET_CODE (folded_arg0) == REG)
3919 int qty = REG_QTY (REGNO (folded_arg0));
3921 if (REGNO_QTY_VALID_P (REGNO (folded_arg0)))
3923 struct qty_table_elem *ent = &qty_table[qty];
3925 if ((comparison_dominates_p (ent->comparison_code, code)
3926 || (! FLOAT_MODE_P (mode_arg0)
3927 && comparison_dominates_p (ent->comparison_code,
3928 reverse_condition (code))))
3929 && (rtx_equal_p (ent->comparison_const, folded_arg1)
3930 || (const_arg1
3931 && rtx_equal_p (ent->comparison_const,
3932 const_arg1))
3933 || (GET_CODE (folded_arg1) == REG
3934 && (REG_QTY (REGNO (folded_arg1)) == ent->comparison_qty))))
3935 return (comparison_dominates_p (ent->comparison_code, code)
3936 ? true_rtx : false_rtx);
3942 /* If we are comparing against zero, see if the first operand is
3943 equivalent to an IOR with a constant. If so, we may be able to
3944 determine the result of this comparison. */
3946 if (const_arg1 == const0_rtx)
3948 rtx y = lookup_as_function (folded_arg0, IOR);
3949 rtx inner_const;
3951 if (y != 0
3952 && (inner_const = equiv_constant (XEXP (y, 1))) != 0
3953 && GET_CODE (inner_const) == CONST_INT
3954 && INTVAL (inner_const) != 0)
3956 int sign_bitnum = GET_MODE_BITSIZE (mode_arg0) - 1;
3957 int has_sign = (HOST_BITS_PER_WIDE_INT >= sign_bitnum
3958 && (INTVAL (inner_const)
3959 & ((HOST_WIDE_INT) 1 << sign_bitnum)));
3960 rtx true_rtx = const_true_rtx, false_rtx = const0_rtx;
3962 #ifdef FLOAT_STORE_FLAG_VALUE
3963 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
3965 true_rtx = (CONST_DOUBLE_FROM_REAL_VALUE
3966 (FLOAT_STORE_FLAG_VALUE (mode), mode));
3967 false_rtx = CONST0_RTX (mode);
3969 #endif
3971 switch (code)
3973 case EQ:
3974 return false_rtx;
3975 case NE:
3976 return true_rtx;
3977 case LT: case LE:
3978 if (has_sign)
3979 return true_rtx;
3980 break;
3981 case GT: case GE:
3982 if (has_sign)
3983 return false_rtx;
3984 break;
3985 default:
3986 break;
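        /* Editorial note, not in the original source: if folded_arg0 is
           known equivalent to (ior:SI (reg X) (const_int 4)), it cannot be
           zero, so the switch above folds EQ against zero to false_rtx and
           NE to true_rtx; had the IOR'd constant included the sign bit,
           LT and LE would fold to true_rtx, GT and GE to false_rtx.  */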
3991 new = simplify_relational_operation (code,
3992 (mode_arg0 != VOIDmode
3993 ? mode_arg0
3994 : (GET_MODE (const_arg0
3995 ? const_arg0
3996 : folded_arg0)
3997 != VOIDmode)
3998 ? GET_MODE (const_arg0
3999 ? const_arg0
4000 : folded_arg0)
4001 : GET_MODE (const_arg1
4002 ? const_arg1
4003 : folded_arg1)),
4004 const_arg0 ? const_arg0 : folded_arg0,
4005 const_arg1 ? const_arg1 : folded_arg1);
4006 #ifdef FLOAT_STORE_FLAG_VALUE
4007 if (new != 0 && GET_MODE_CLASS (mode) == MODE_FLOAT)
4009 if (new == const0_rtx)
4010 new = CONST0_RTX (mode);
4011 else
4012 new = (CONST_DOUBLE_FROM_REAL_VALUE
4013 (FLOAT_STORE_FLAG_VALUE (mode), mode));
4015 #endif
4016 break;
4018 case '2':
4019 case 'c':
4020 switch (code)
4022 case PLUS:
4023 /* If the second operand is a LABEL_REF, see if the first is a MINUS
4024 with that LABEL_REF as its second operand. If so, the result is
4025 the first operand of that MINUS. This handles switches with an
4026 ADDR_DIFF_VEC table. */
4027 if (const_arg1 && GET_CODE (const_arg1) == LABEL_REF)
4029 rtx y
4030 = GET_CODE (folded_arg0) == MINUS ? folded_arg0
4031 : lookup_as_function (folded_arg0, MINUS);
4033 if (y != 0 && GET_CODE (XEXP (y, 1)) == LABEL_REF
4034 && XEXP (XEXP (y, 1), 0) == XEXP (const_arg1, 0))
4035 return XEXP (y, 0);
4037 /* Now try for a CONST of a MINUS like the above. */
4038 if ((y = (GET_CODE (folded_arg0) == CONST ? folded_arg0
4039 : lookup_as_function (folded_arg0, CONST))) != 0
4040 && GET_CODE (XEXP (y, 0)) == MINUS
4041 && GET_CODE (XEXP (XEXP (y, 0), 1)) == LABEL_REF
4042 && XEXP (XEXP (XEXP (y, 0), 1), 0) == XEXP (const_arg1, 0))
4043 return XEXP (XEXP (y, 0), 0);
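        /* Editorial example, not in the original source: folding
             (plus (minus (label_ref L5) (label_ref L2)) (label_ref L2))
           yields (label_ref L5), recovering the absolute target of an
           ADDR_DIFF_VEC entry once its base label is added back.  */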
4046 /* Likewise if the operands are in the other order. */
4047 if (const_arg0 && GET_CODE (const_arg0) == LABEL_REF)
4049 rtx y
4050 = GET_CODE (folded_arg1) == MINUS ? folded_arg1
4051 : lookup_as_function (folded_arg1, MINUS);
4053 if (y != 0 && GET_CODE (XEXP (y, 1)) == LABEL_REF
4054 && XEXP (XEXP (y, 1), 0) == XEXP (const_arg0, 0))
4055 return XEXP (y, 0);
4057 /* Now try for a CONST of a MINUS like the above. */
4058 if ((y = (GET_CODE (folded_arg1) == CONST ? folded_arg1
4059 : lookup_as_function (folded_arg1, CONST))) != 0
4060 && GET_CODE (XEXP (y, 0)) == MINUS
4061 && GET_CODE (XEXP (XEXP (y, 0), 1)) == LABEL_REF
4062 && XEXP (XEXP (XEXP (y, 0), 1), 0) == XEXP (const_arg0, 0))
4063 return XEXP (XEXP (y, 0), 0);
4066 /* If second operand is a register equivalent to a negative
4067 CONST_INT, see if we can find a register equivalent to the
4068 positive constant. Make a MINUS if so. Don't do this for
4069 a non-negative constant since we might then alternate between
4070 choosing positive and negative constants. Having the positive
4071 constant previously-used is the more common case. Be sure
4072 the resulting constant is non-negative; if const_arg1 were
4073 the smallest negative number this would overflow: depending
4074 on the mode, this would either just be the same value (and
4075 hence not save anything) or be incorrect. */
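        /* Editorial illustration, not in the original source: with
           const_arg1 = (const_int -4), if some register, say r7, is
           already known to hold (const_int 4), the PLUS below is rewritten
           as (minus folded_arg0 (reg r7)), reusing the existing positive
           constant.  */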
4076 if (const_arg1 != 0 && GET_CODE (const_arg1) == CONST_INT
4077 && INTVAL (const_arg1) < 0
4078 /* This used to test
4080 -INTVAL (const_arg1) >= 0
4082 But the Sun V5.0 compilers mis-compiled that test. So
4083 instead we test for the problematic value in a more direct
4084 manner and hope the Sun compilers get it correct. */
4085 && INTVAL (const_arg1) !=
4086 ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1))
4087 && GET_CODE (folded_arg1) == REG)
4089 rtx new_const = GEN_INT (-INTVAL (const_arg1));
4090 struct table_elt *p
4091 = lookup (new_const, safe_hash (new_const, mode) & HASH_MASK,
4092 mode);
4094 if (p)
4095 for (p = p->first_same_value; p; p = p->next_same_value)
4096 if (GET_CODE (p->exp) == REG)
4097 return simplify_gen_binary (MINUS, mode, folded_arg0,
4098 canon_reg (p->exp, NULL_RTX));
4100 goto from_plus;
4102 case MINUS:
4103 /* If we have (MINUS Y C), see if Y is known to be (PLUS Z C2).
4104 If so, produce (PLUS Z C2-C). */
4105 if (const_arg1 != 0 && GET_CODE (const_arg1) == CONST_INT)
4107 rtx y = lookup_as_function (XEXP (x, 0), PLUS);
4108 if (y && GET_CODE (XEXP (y, 1)) == CONST_INT)
4109 return fold_rtx (plus_constant (copy_rtx (y),
4110 -INTVAL (const_arg1)),
4111 NULL_RTX);
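        /* Editorial example, not in the original source: if XEXP (x, 0) is
           known to be (plus (reg Z) (const_int 12)) and const_arg1 is
           (const_int 4), the MINUS just handled refolds to
           (plus (reg Z) (const_int 8)).  */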
4114 /* Fall through. */
4116 from_plus:
4117 case SMIN: case SMAX: case UMIN: case UMAX:
4118 case IOR: case AND: case XOR:
4119 case MULT:
4120 case ASHIFT: case LSHIFTRT: case ASHIFTRT:
4121 /* If we have (<op> <reg> <const_int>) for an associative OP and REG
4122 is known to be of similar form, we may be able to replace the
4123 operation with a combined operation. This may eliminate the
4124 intermediate operation if every use is simplified in this way.
4125 Note that the similar optimization done by combine.c only works
4126 if the intermediate operation's result has only one reference. */
4128 if (GET_CODE (folded_arg0) == REG
4129 && const_arg1 && GET_CODE (const_arg1) == CONST_INT)
4131 int is_shift
4132 = (code == ASHIFT || code == ASHIFTRT || code == LSHIFTRT);
4133 rtx y = lookup_as_function (folded_arg0, code);
4134 rtx inner_const;
4135 enum rtx_code associate_code;
4136 rtx new_const;
4138 if (y == 0
4139 || 0 == (inner_const
4140 = equiv_constant (fold_rtx (XEXP (y, 1), 0)))
4141 || GET_CODE (inner_const) != CONST_INT
4142 /* If we have compiled a statement like
4143 "if (x == (x & mask1))", and now are looking at
4144 "x & mask2", we will have a case where the first operand
4145 of Y is the same as our first operand. Unless we detect
4146 this case, an infinite loop will result. */
4147 || XEXP (y, 0) == folded_arg0)
4148 break;
4150 /* Don't associate these operations if they are a PLUS with the
4151 same constant and it is a power of two. These might be doable
4152 with a pre- or post-increment. Similarly for two subtracts of
4153 identical powers of two with post decrement. */
4155 if (code == PLUS && const_arg1 == inner_const
4156 && ((HAVE_PRE_INCREMENT
4157 && exact_log2 (INTVAL (const_arg1)) >= 0)
4158 || (HAVE_POST_INCREMENT
4159 && exact_log2 (INTVAL (const_arg1)) >= 0)
4160 || (HAVE_PRE_DECREMENT
4161 && exact_log2 (- INTVAL (const_arg1)) >= 0)
4162 || (HAVE_POST_DECREMENT
4163 && exact_log2 (- INTVAL (const_arg1)) >= 0)))
4164 break;
4166 /* Compute the code used to compose the constants. For example,
4167 A-C1-C2 is A-(C1 + C2), so if CODE == MINUS, we want PLUS. */
4169 associate_code = (is_shift || code == MINUS ? PLUS : code);
4171 new_const = simplify_binary_operation (associate_code, mode,
4172 const_arg1, inner_const);
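        /* Editorial example, not in the original source: for
           (ashift (reg R) (const_int 3)) where R is known to be
           (ashift (reg Y) (const_int 2)), inner_const is 2, associate_code
           is PLUS, new_const becomes 5, and the pair collapses to
           (ashift (reg Y) (const_int 5)), subject to the size check
           below.  */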
4174 if (new_const == 0)
4175 break;
4177 /* If we are associating shift operations, don't let this
4178 produce a shift of the size of the object or larger.
4179 This could occur when we follow a sign-extend by a right
4180 shift on a machine that does a sign-extend as a pair
4181 of shifts. */
4183 if (is_shift && GET_CODE (new_const) == CONST_INT
4184 && INTVAL (new_const) >= GET_MODE_BITSIZE (mode))
4186 /* As an exception, we can turn an ASHIFTRT of this
4187 form into a shift of the number of bits - 1. */
4188 if (code == ASHIFTRT)
4189 new_const = GEN_INT (GET_MODE_BITSIZE (mode) - 1);
4190 else
4191 break;
4194 y = copy_rtx (XEXP (y, 0));
4196 /* If Y contains our first operand (the most common way this
4197 can happen is if Y is a MEM), we would go into an infinite
4198 loop if we tried to fold it. So don't in that case. */
4200 if (! reg_mentioned_p (folded_arg0, y))
4201 y = fold_rtx (y, insn);
4203 return simplify_gen_binary (code, mode, y, new_const);
4205 break;
4207 case DIV: case UDIV:
4208 /* ??? The associative optimization performed immediately above is
4209 also possible for DIV and UDIV using associate_code of MULT.
4210 However, we would need extra code to verify that the
4211 multiplication does not overflow, that is, there is no overflow
4212 in the calculation of new_const. */
4213 break;
4215 default:
4216 break;
4219 new = simplify_binary_operation (code, mode,
4220 const_arg0 ? const_arg0 : folded_arg0,
4221 const_arg1 ? const_arg1 : folded_arg1);
4222 break;
4224 case 'o':
4225 /* (lo_sum (high X) X) is simply X. */
4226 if (code == LO_SUM && const_arg0 != 0
4227 && GET_CODE (const_arg0) == HIGH
4228 && rtx_equal_p (XEXP (const_arg0, 0), const_arg1))
4229 return const_arg1;
4230 break;
4232 case '3':
4233 case 'b':
4234 new = simplify_ternary_operation (code, mode, mode_arg0,
4235 const_arg0 ? const_arg0 : folded_arg0,
4236 const_arg1 ? const_arg1 : folded_arg1,
4237 const_arg2 ? const_arg2 : XEXP (x, 2));
4238 break;
4240 case 'x':
4241 /* Eliminate CONSTANT_P_RTX if it is constant. */
4242 if (code == CONSTANT_P_RTX)
4244 if (const_arg0)
4245 return const1_rtx;
4246 if (optimize == 0 || !flag_gcse)
4247 return const0_rtx;
4249 break;
4252 return new ? new : x;
4255 /* Return a constant value currently equivalent to X.
4256 Return 0 if we don't know one. */
4258 static rtx
4259 equiv_constant (rtx x)
4261 if (GET_CODE (x) == REG
4262 && REGNO_QTY_VALID_P (REGNO (x)))
4264 int x_q = REG_QTY (REGNO (x));
4265 struct qty_table_elem *x_ent = &qty_table[x_q];
4267 if (x_ent->const_rtx)
4268 x = gen_lowpart_if_possible (GET_MODE (x), x_ent->const_rtx);
4271 if (x == 0 || CONSTANT_P (x))
4272 return x;
4274 /* If X is a MEM, try to fold it outside the context of any insn to see if
4275 it might be equivalent to a constant. That handles the case where it
4276 is a constant-pool reference. Then try to look it up in the hash table
4277 in case it is something whose value we have seen before. */
4279 if (GET_CODE (x) == MEM)
4281 struct table_elt *elt;
4283 x = fold_rtx (x, NULL_RTX);
4284 if (CONSTANT_P (x))
4285 return x;
4287 elt = lookup (x, safe_hash (x, GET_MODE (x)) & HASH_MASK, GET_MODE (x));
4288 if (elt == 0)
4289 return 0;
4291 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
4292 if (elt->is_const && CONSTANT_P (elt->exp))
4293 return elt->exp;
4296 return 0;
4299 /* Assuming that X is an rtx (e.g., MEM, REG or SUBREG) for a fixed-point
4300 number, return an rtx (MEM, SUBREG, or CONST_INT) that refers to the
4301 least-significant part of X.
4302 MODE specifies how big a part of X to return.
4304 If the requested operation cannot be done, 0 is returned.
4306 This is similar to gen_lowpart in emit-rtl.c. */
4308 rtx
4309 gen_lowpart_if_possible (enum machine_mode mode, rtx x)
4311 rtx result = gen_lowpart_common (mode, x);
4313 if (result)
4314 return result;
4315 else if (GET_CODE (x) == MEM)
4317 /* This is the only other case we handle. */
4318 int offset = 0;
4319 rtx new;
4321 if (WORDS_BIG_ENDIAN)
4322 offset = (MAX (GET_MODE_SIZE (GET_MODE (x)), UNITS_PER_WORD)
4323 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD));
4324 if (BYTES_BIG_ENDIAN)
4325 /* Adjust the address so that the address-after-the-data is
4326 unchanged. */
4327 offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (mode))
4328 - MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (x))));
4330 new = adjust_address_nv (x, mode, offset);
4331 if (! memory_address_p (mode, XEXP (new, 0)))
4332 return 0;
4334 return new;
4336 else
4337 return 0;
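   /* Editorial usage sketch, not in the original source: calling
      gen_lowpart_if_possible (QImode, m) on an SImode MEM m yields a
      QImode MEM of its low byte, with the address adjusted above for a
      big-endian layout, or 0 if the adjusted address is not valid for
      QImode.  */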
4340 /* Given INSN, a jump insn, TAKEN indicates if we are following the "taken"
4341 branch. It will be zero if not.
4343 In certain cases, this can cause us to add an equivalence. For example,
4344 if we are following the taken case of
4345 if (i == 2)
4346 we can add the fact that `i' and '2' are now equivalent.
4348 In any case, we can record that this comparison was passed. If the same
4349 comparison is seen later, we will know its value. */
4351 static void
4352 record_jump_equiv (rtx insn, int taken)
4354 int cond_known_true;
4355 rtx op0, op1;
4356 rtx set;
4357 enum machine_mode mode, mode0, mode1;
4358 int reversed_nonequality = 0;
4359 enum rtx_code code;
4361 /* Ensure this is the right kind of insn. */
4362 if (! any_condjump_p (insn))
4363 return;
4364 set = pc_set (insn);
4366 /* See if this jump condition is known true or false. */
4367 if (taken)
4368 cond_known_true = (XEXP (SET_SRC (set), 2) == pc_rtx);
4369 else
4370 cond_known_true = (XEXP (SET_SRC (set), 1) == pc_rtx);
4372 /* Get the type of comparison being done and the operands being compared.
4373 If we had to reverse a non-equality condition, record that fact so we
4374 know that it isn't valid for floating-point. */
4375 code = GET_CODE (XEXP (SET_SRC (set), 0));
4376 op0 = fold_rtx (XEXP (XEXP (SET_SRC (set), 0), 0), insn);
4377 op1 = fold_rtx (XEXP (XEXP (SET_SRC (set), 0), 1), insn);
4379 code = find_comparison_args (code, &op0, &op1, &mode0, &mode1);
4380 if (! cond_known_true)
4382 code = reversed_comparison_code_parts (code, op0, op1, insn);
4384 /* Don't remember if we can't find the inverse. */
4385 if (code == UNKNOWN)
4386 return;
4389 /* The mode is the mode of the non-constant. */
4390 mode = mode0;
4391 if (mode1 != VOIDmode)
4392 mode = mode1;
4394 record_jump_cond (code, mode, op0, op1, reversed_nonequality);
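   /* Editorial example, not in the original source: following the taken
      edge of
        (set (pc) (if_then_else (eq (reg:SI 5) (const_int 2))
                                (label_ref L) (pc)))
      calls record_jump_cond with EQ, making (reg:SI 5) and (const_int 2)
      equivalent, so later uses of reg 5 in this extended basic block can
      be folded to the constant 2.  */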
4397 /* We know that comparison CODE applied to OP0 and OP1 in MODE is true.
4398 REVERSED_NONEQUALITY is nonzero if CODE had to be swapped.
4399 Make any useful entries we can with that information. Called from
4400 above function and called recursively. */
4402 static void
4403 record_jump_cond (enum rtx_code code, enum machine_mode mode, rtx op0,
4404 rtx op1, int reversed_nonequality)
4406 unsigned op0_hash, op1_hash;
4407 int op0_in_memory, op1_in_memory;
4408 struct table_elt *op0_elt, *op1_elt;
4410 /* If OP0 and OP1 are known equal, and either is a paradoxical SUBREG,
4411 we know that they are also equal in the smaller mode (this is also
4412 true for all smaller modes whether or not there is a SUBREG, but
4413 is not worth testing for with no SUBREG). */
4415 /* Note that GET_MODE (op0) may not equal MODE. */
4416 if (code == EQ && GET_CODE (op0) == SUBREG
4417 && (GET_MODE_SIZE (GET_MODE (op0))
4418 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
4420 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
4421 rtx tem = gen_lowpart_if_possible (inner_mode, op1);
4423 record_jump_cond (code, mode, SUBREG_REG (op0),
4424 tem ? tem : gen_rtx_SUBREG (inner_mode, op1, 0),
4425 reversed_nonequality);
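      /* Editorial example, not in the original source: if
         (subreg:DI (reg:SI 4) 0) is known equal to (reg:DI 7), the
         recursive call above also records (reg:SI 4) as equal to the
         SImode lowpart of (reg:DI 7).  */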
4428 if (code == EQ && GET_CODE (op1) == SUBREG
4429 && (GET_MODE_SIZE (GET_MODE (op1))
4430 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
4432 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
4433 rtx tem = gen_lowpart_if_possible (inner_mode, op0);
4435 record_jump_cond (code, mode, SUBREG_REG (op1),
4436 tem ? tem : gen_rtx_SUBREG (inner_mode, op0, 0),
4437 reversed_nonequality);
4440 /* Similarly, if this is an NE comparison, and either is a SUBREG
4441 making a smaller mode, we know the whole thing is also NE. */
4443 /* Note that GET_MODE (op0) may not equal MODE;
4444 if we test MODE instead, we can get an infinite recursion
4445 alternating between two modes each wider than MODE. */
4447 if (code == NE && GET_CODE (op0) == SUBREG
4448 && subreg_lowpart_p (op0)
4449 && (GET_MODE_SIZE (GET_MODE (op0))
4450 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
4452 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
4453 rtx tem = gen_lowpart_if_possible (inner_mode, op1);
4455 record_jump_cond (code, mode, SUBREG_REG (op0),
4456 tem ? tem : gen_rtx_SUBREG (inner_mode, op1, 0),
4457 reversed_nonequality);
4460 if (code == NE && GET_CODE (op1) == SUBREG
4461 && subreg_lowpart_p (op1)
4462 && (GET_MODE_SIZE (GET_MODE (op1))
4463 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
4465 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
4466 rtx tem = gen_lowpart_if_possible (inner_mode, op0);
4468 record_jump_cond (code, mode, SUBREG_REG (op1),
4469 tem ? tem : gen_rtx_SUBREG (inner_mode, op0, 0),
4470 reversed_nonequality);
4473 /* Hash both operands. */
4475 do_not_record = 0;
4476 hash_arg_in_memory = 0;
4477 op0_hash = HASH (op0, mode);
4478 op0_in_memory = hash_arg_in_memory;
4480 if (do_not_record)
4481 return;
4483 do_not_record = 0;
4484 hash_arg_in_memory = 0;
4485 op1_hash = HASH (op1, mode);
4486 op1_in_memory = hash_arg_in_memory;
4488 if (do_not_record)
4489 return;
4491 /* Look up both operands. */
4492 op0_elt = lookup (op0, op0_hash, mode);
4493 op1_elt = lookup (op1, op1_hash, mode);
4495 /* If both operands are already equivalent or if they are not in the
4496 table but are identical, do nothing. */
4497 if ((op0_elt != 0 && op1_elt != 0
4498 && op0_elt->first_same_value == op1_elt->first_same_value)
4499 || op0 == op1 || rtx_equal_p (op0, op1))
4500 return;
4502 /* If we aren't setting two things equal all we can do is save this
4503 comparison. Similarly if this is floating-point. In the latter
4504 case, OP1 might be zero and both -0.0 and 0.0 are equal to it.
4505 If we record the equality, we might inadvertently delete code
4506 whose intent was to change -0 to +0. */
4508 if (code != EQ || FLOAT_MODE_P (GET_MODE (op0)))
4510 struct qty_table_elem *ent;
4511 int qty;
4513 /* If we reversed a floating-point comparison, if OP0 is not a
4514 register, or if OP1 is neither a register nor a constant, we can't
4515 do anything. */
4517 if (GET_CODE (op1) != REG)
4518 op1 = equiv_constant (op1);
4520 if ((reversed_nonequality && FLOAT_MODE_P (mode))
4521 || GET_CODE (op0) != REG || op1 == 0)
4522 return;
4524 /* Put OP0 in the hash table if it isn't already. This gives it a
4525 new quantity number. */
4526 if (op0_elt == 0)
4528 if (insert_regs (op0, NULL, 0))
4530 rehash_using_reg (op0);
4531 op0_hash = HASH (op0, mode);
4533 /* If OP0 is contained in OP1, this changes its hash code
4534 as well. Faster to rehash than to check, except
4535 for the simple case of a constant. */
4536 if (! CONSTANT_P (op1))
4537 op1_hash = HASH (op1, mode);
4540 op0_elt = insert (op0, NULL, op0_hash, mode);
4541 op0_elt->in_memory = op0_in_memory;
4544 qty = REG_QTY (REGNO (op0));
4545 ent = &qty_table[qty];
4547 ent->comparison_code = code;
4548 if (GET_CODE (op1) == REG)
4550 /* Look it up again--in case op0 and op1 are the same. */
4551 op1_elt = lookup (op1, op1_hash, mode);
4553 /* Put OP1 in the hash table so it gets a new quantity number. */
4554 if (op1_elt == 0)
4556 if (insert_regs (op1, NULL, 0))
4558 rehash_using_reg (op1);
4559 op1_hash = HASH (op1, mode);
4562 op1_elt = insert (op1, NULL, op1_hash, mode);
4563 op1_elt->in_memory = op1_in_memory;
4566 ent->comparison_const = NULL_RTX;
4567 ent->comparison_qty = REG_QTY (REGNO (op1));
4569 else
4571 ent->comparison_const = op1;
4572 ent->comparison_qty = -1;
4575 return;
4578 /* If either side is still missing an equivalence, make it now,
4579 then merge the equivalences. */
4581 if (op0_elt == 0)
4583 if (insert_regs (op0, NULL, 0))
4585 rehash_using_reg (op0);
4586 op0_hash = HASH (op0, mode);
4589 op0_elt = insert (op0, NULL, op0_hash, mode);
4590 op0_elt->in_memory = op0_in_memory;
4593 if (op1_elt == 0)
4595 if (insert_regs (op1, NULL, 0))
4597 rehash_using_reg (op1);
4598 op1_hash = HASH (op1, mode);
4601 op1_elt = insert (op1, NULL, op1_hash, mode);
4602 op1_elt->in_memory = op1_in_memory;
4605 merge_equiv_classes (op0_elt, op1_elt);
4606 last_jump_equiv_class = op0_elt;
4609 /* CSE processing for one instruction.
4610 First simplify sources and addresses of all assignments
4611 in the instruction, using previously-computed equivalent values.
4612 Then install the new sources and destinations in the table
4613 of available values.
4615 If LIBCALL_INSN is nonzero, don't record any equivalence made in
4616 the insn. It means that INSN is inside a libcall block. In this
4617 case LIBCALL_INSN is the corresponding insn with REG_LIBCALL. */
4619 /* Data on one SET contained in the instruction. */
4621 struct set
4623 /* The SET rtx itself. */
4624 rtx rtl;
4625 /* The SET_SRC of the rtx (the original value, if it is changing). */
4626 rtx src;
4627 /* The hash-table element for the SET_SRC of the SET. */
4628 struct table_elt *src_elt;
4629 /* Hash value for the SET_SRC. */
4630 unsigned src_hash;
4631 /* Hash value for the SET_DEST. */
4632 unsigned dest_hash;
4633 /* The SET_DEST, with SUBREG, etc., stripped. */
4634 rtx inner_dest;
4635 /* Nonzero if the SET_SRC is in memory. */
4636 char src_in_memory;
4637 /* Nonzero if the SET_SRC contains something
4638 whose value cannot be predicted and understood. */
4639 char src_volatile;
4640 /* Original machine mode, in case it becomes a CONST_INT.
4641 The size of this field should match the size of the mode
4642 field of struct rtx_def (see rtl.h). */
4643 ENUM_BITFIELD(machine_mode) mode : 8;
4644 /* A constant equivalent for SET_SRC, if any. */
4645 rtx src_const;
4646 /* Original SET_SRC value used for libcall notes. */
4647 rtx orig_src;
4648 /* Hash value of constant equivalent for SET_SRC. */
4649 unsigned src_const_hash;
4650 /* Table entry for constant equivalent for SET_SRC, if any. */
4651 struct table_elt *src_const_elt;
4654 static void
4655 cse_insn (rtx insn, rtx libcall_insn)
4657 rtx x = PATTERN (insn);
4658 int i;
4659 rtx tem;
4660 int n_sets = 0;
4662 #ifdef HAVE_cc0
4663 /* Records what this insn does to set CC0. */
4664 rtx this_insn_cc0 = 0;
4665 enum machine_mode this_insn_cc0_mode = VOIDmode;
4666 #endif
4668 rtx src_eqv = 0;
4669 struct table_elt *src_eqv_elt = 0;
4670 int src_eqv_volatile = 0;
4671 int src_eqv_in_memory = 0;
4672 unsigned src_eqv_hash = 0;
4674 struct set *sets = (struct set *) 0;
4676 this_insn = insn;
4678 /* Find all the SETs and CLOBBERs in this instruction.
4679 Record all the SETs in the array `sets' and count them.
4680 Also determine whether there is a CLOBBER that invalidates
4681 all memory references, or all references at varying addresses. */
4683 if (GET_CODE (insn) == CALL_INSN)
4685 for (tem = CALL_INSN_FUNCTION_USAGE (insn); tem; tem = XEXP (tem, 1))
4687 if (GET_CODE (XEXP (tem, 0)) == CLOBBER)
4688 invalidate (SET_DEST (XEXP (tem, 0)), VOIDmode);
4689 XEXP (tem, 0) = canon_reg (XEXP (tem, 0), insn);
4693 if (GET_CODE (x) == SET)
4695 sets = (struct set *) alloca (sizeof (struct set));
4696 sets[0].rtl = x;
4698 /* Ignore SETs that are unconditional jumps.
4699 They never need cse processing, so this does not hurt.
4700 The reason is not efficiency but rather
4701 so that we can test at the end for instructions
4702 that have been simplified to unconditional jumps
4703 and not be misled by unchanged instructions
4704 that were unconditional jumps to begin with. */
4705 if (SET_DEST (x) == pc_rtx
4706 && GET_CODE (SET_SRC (x)) == LABEL_REF)
4709 /* Don't count call-insns, (set (reg 0) (call ...)), as a set.
4710 The hard function value register is used only once, to copy to
4711 someplace else, so it isn't worth cse'ing (and on 80386 is unsafe)!
4712 Ensure we invalidate the destination register. On the 80386 no
4713 other code would invalidate it since it is a fixed_reg.
4714 We need not check the return of apply_change_group; see canon_reg. */
4716 else if (GET_CODE (SET_SRC (x)) == CALL)
4718 canon_reg (SET_SRC (x), insn);
4719 apply_change_group ();
4720 fold_rtx (SET_SRC (x), insn);
4721 invalidate (SET_DEST (x), VOIDmode);
4723 else
4724 n_sets = 1;
4726 else if (GET_CODE (x) == PARALLEL)
4728 int lim = XVECLEN (x, 0);
4730 sets = (struct set *) alloca (lim * sizeof (struct set));
4732 /* Find all regs explicitly clobbered in this insn,
4733 and ensure they are not replaced with any other regs
4734 elsewhere in this insn.
4735 When a reg that is clobbered is also used for input,
4736 we should presume that that is for a reason,
4737 and we should not substitute some other register
4738 which is not supposed to be clobbered.
4739 Therefore, this loop cannot be merged into the one below
4740 because a CALL may precede a CLOBBER and refer to the
4741 value clobbered. We must not let a canonicalization do
4742 anything in that case. */
4743 for (i = 0; i < lim; i++)
4745 rtx y = XVECEXP (x, 0, i);
4746 if (GET_CODE (y) == CLOBBER)
4748 rtx clobbered = XEXP (y, 0);
4750 if (GET_CODE (clobbered) == REG
4751 || GET_CODE (clobbered) == SUBREG)
4752 invalidate (clobbered, VOIDmode);
4753 else if (GET_CODE (clobbered) == STRICT_LOW_PART
4754 || GET_CODE (clobbered) == ZERO_EXTRACT)
4755 invalidate (XEXP (clobbered, 0), GET_MODE (clobbered));
4759 for (i = 0; i < lim; i++)
4761 rtx y = XVECEXP (x, 0, i);
4762 if (GET_CODE (y) == SET)
4764 /* As above, we ignore unconditional jumps and call-insns and
4765 ignore the result of apply_change_group. */
4766 if (GET_CODE (SET_SRC (y)) == CALL)
4768 canon_reg (SET_SRC (y), insn);
4769 apply_change_group ();
4770 fold_rtx (SET_SRC (y), insn);
4771 invalidate (SET_DEST (y), VOIDmode);
4773 else if (SET_DEST (y) == pc_rtx
4774 && GET_CODE (SET_SRC (y)) == LABEL_REF)
4776 else
4777 sets[n_sets++].rtl = y;
4779 else if (GET_CODE (y) == CLOBBER)
4781 /* If we clobber memory, canon the address.
4782 This does nothing when a register is clobbered
4783 because we have already invalidated the reg. */
4784 if (GET_CODE (XEXP (y, 0)) == MEM)
4785 canon_reg (XEXP (y, 0), NULL_RTX);
4787 else if (GET_CODE (y) == USE
4788 && ! (GET_CODE (XEXP (y, 0)) == REG
4789 && REGNO (XEXP (y, 0)) < FIRST_PSEUDO_REGISTER))
4790 canon_reg (y, NULL_RTX);
4791 else if (GET_CODE (y) == CALL)
4793 /* The result of apply_change_group can be ignored; see
4794 canon_reg. */
4795 canon_reg (y, insn);
4796 apply_change_group ();
4797 fold_rtx (y, insn);
4801 else if (GET_CODE (x) == CLOBBER)
4803 if (GET_CODE (XEXP (x, 0)) == MEM)
4804 canon_reg (XEXP (x, 0), NULL_RTX);
4807 /* Canonicalize a USE of a pseudo register or memory location. */
4808 else if (GET_CODE (x) == USE
4809 && ! (GET_CODE (XEXP (x, 0)) == REG
4810 && REGNO (XEXP (x, 0)) < FIRST_PSEUDO_REGISTER))
4811 canon_reg (XEXP (x, 0), NULL_RTX);
4812 else if (GET_CODE (x) == CALL)
4814 /* The result of apply_change_group can be ignored; see canon_reg. */
4815 canon_reg (x, insn);
4816 apply_change_group ();
4817 fold_rtx (x, insn);
4820 /* Store the equivalent value in SRC_EQV, if different, or if the DEST
4821 is a STRICT_LOW_PART. The latter condition is necessary because SRC_EQV
4822 is handled specially for this case, and if it isn't set, then there will
4823 be no equivalence for the destination. */
4824 if (n_sets == 1 && REG_NOTES (insn) != 0
4825 && (tem = find_reg_note (insn, REG_EQUAL, NULL_RTX)) != 0
4826 && (! rtx_equal_p (XEXP (tem, 0), SET_SRC (sets[0].rtl))
4827 || GET_CODE (SET_DEST (sets[0].rtl)) == STRICT_LOW_PART))
4829 src_eqv = fold_rtx (canon_reg (XEXP (tem, 0), NULL_RTX), insn);
4830 XEXP (tem, 0) = src_eqv;
4833 /* Canonicalize sources and addresses of destinations.
4834 We do this in a separate pass to avoid problems when a MATCH_DUP is
4835 present in the insn pattern. In that case, we want to ensure that
4836 we don't break the duplicate nature of the pattern. So we will replace
4837 both operands at the same time. Otherwise, we would fail to find an
4838 equivalent substitution in the loop calling validate_change below.
4840 We used to suppress canonicalization of DEST if it appears in SRC,
4841 but we don't do this any more. */
4843 for (i = 0; i < n_sets; i++)
4845 rtx dest = SET_DEST (sets[i].rtl);
4846 rtx src = SET_SRC (sets[i].rtl);
4847 rtx new = canon_reg (src, insn);
4848 int insn_code;
4850 sets[i].orig_src = src;
4851 if ((GET_CODE (new) == REG && GET_CODE (src) == REG
4852 && ((REGNO (new) < FIRST_PSEUDO_REGISTER)
4853 != (REGNO (src) < FIRST_PSEUDO_REGISTER)))
4854 || (insn_code = recog_memoized (insn)) < 0
4855 || insn_data[insn_code].n_dups > 0)
4856 validate_change (insn, &SET_SRC (sets[i].rtl), new, 1);
4857 else
4858 SET_SRC (sets[i].rtl) = new;
4860 if (GET_CODE (dest) == ZERO_EXTRACT || GET_CODE (dest) == SIGN_EXTRACT)
4862 validate_change (insn, &XEXP (dest, 1),
4863 canon_reg (XEXP (dest, 1), insn), 1);
4864 validate_change (insn, &XEXP (dest, 2),
4865 canon_reg (XEXP (dest, 2), insn), 1);
4868 while (GET_CODE (dest) == SUBREG || GET_CODE (dest) == STRICT_LOW_PART
4869 || GET_CODE (dest) == ZERO_EXTRACT
4870 || GET_CODE (dest) == SIGN_EXTRACT)
4871 dest = XEXP (dest, 0);
4873 if (GET_CODE (dest) == MEM)
4874 canon_reg (dest, insn);
4877 /* Now that we have done all the replacements, we can apply the change
4878 group and see if they all work. Note that this will cause some
4879 canonicalizations that would have worked individually not to be applied
4880 because some other canonicalization didn't work, but this should not
4881 occur often.
4883 The result of apply_change_group can be ignored; see canon_reg. */
4885 apply_change_group ();
4887 /* Set sets[i].src_elt to the class each source belongs to.
4888 Detect assignments from or to volatile things
4889 and set sets[i] to zero so they will be ignored
4890 in the rest of this function.
4892 Nothing in this loop changes the hash table or the register chains. */
4894 for (i = 0; i < n_sets; i++)
4896 rtx src, dest;
4897 rtx src_folded;
4898 struct table_elt *elt = 0, *p;
4899 enum machine_mode mode;
4900 rtx src_eqv_here;
4901 rtx src_const = 0;
4902 rtx src_related = 0;
4903 struct table_elt *src_const_elt = 0;
4904 int src_cost = MAX_COST;
4905 int src_eqv_cost = MAX_COST;
4906 int src_folded_cost = MAX_COST;
4907 int src_related_cost = MAX_COST;
4908 int src_elt_cost = MAX_COST;
4909 int src_regcost = MAX_COST;
4910 int src_eqv_regcost = MAX_COST;
4911 int src_folded_regcost = MAX_COST;
4912 int src_related_regcost = MAX_COST;
4913 int src_elt_regcost = MAX_COST;
4914 /* Set nonzero if we need to call force_const_mem on the
4915 contents of src_folded before using it. */
4916 int src_folded_force_flag = 0;
4918 dest = SET_DEST (sets[i].rtl);
4919 src = SET_SRC (sets[i].rtl);
4921 /* If SRC is a constant that has no machine mode,
4922 hash it with the destination's machine mode.
4923 This way we can keep different modes separate. */
4925 mode = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
4926 sets[i].mode = mode;
4928 if (src_eqv)
4930 enum machine_mode eqvmode = mode;
4931 if (GET_CODE (dest) == STRICT_LOW_PART)
4932 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
4933 do_not_record = 0;
4934 hash_arg_in_memory = 0;
4935 src_eqv_hash = HASH (src_eqv, eqvmode);
4937 /* Find the equivalence class for the equivalent expression. */
4939 if (!do_not_record)
4940 src_eqv_elt = lookup (src_eqv, src_eqv_hash, eqvmode);
4942 src_eqv_volatile = do_not_record;
4943 src_eqv_in_memory = hash_arg_in_memory;
4946 /* If this is a STRICT_LOW_PART assignment, src_eqv corresponds to the
4947 value of the INNER register, not the destination. So it is not
4948 a valid substitution for the source. But save it for later. */
4949 if (GET_CODE (dest) == STRICT_LOW_PART)
4950 src_eqv_here = 0;
4951 else
4952 src_eqv_here = src_eqv;
4954 /* Simplify any foldable subexpressions in SRC. Then get the fully-
4955 simplified result, which may not necessarily be valid. */
4956 src_folded = fold_rtx (src, insn);
4958 #if 0
4959 /* ??? This caused bad code to be generated for the m68k port with -O2.
4960 Suppose src is (CONST_INT -1), and that after truncation src_folded
4961 is (CONST_INT 3). Suppose src_folded is then used for src_const.
4962 At the end we will add src and src_const to the same equivalence
4963 class. We now have 3 and -1 in the same equivalence class. This
4964 causes later instructions to be mis-optimized. */
4965 /* If storing a constant in a bitfield, pre-truncate the constant
4966 so we will be able to record it later. */
4967 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT
4968 || GET_CODE (SET_DEST (sets[i].rtl)) == SIGN_EXTRACT)
4970 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
4972 if (GET_CODE (src) == CONST_INT
4973 && GET_CODE (width) == CONST_INT
4974 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
4975 && (INTVAL (src) & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
4976 src_folded
4977 = GEN_INT (INTVAL (src) & (((HOST_WIDE_INT) 1
4978 << INTVAL (width)) - 1));
4980 #endif
4982 /* Compute SRC's hash code, and also notice if it
4983 should not be recorded at all. In that case,
4984 prevent any further processing of this assignment. */
4985 do_not_record = 0;
4986 hash_arg_in_memory = 0;
4988 sets[i].src = src;
4989 sets[i].src_hash = HASH (src, mode);
4990 sets[i].src_volatile = do_not_record;
4991 sets[i].src_in_memory = hash_arg_in_memory;
4993 /* If SRC is a MEM, there is a REG_EQUIV note for SRC, and DEST is
4994 a pseudo, do not record SRC. Using SRC as a replacement for
4995 anything else will be incorrect in that situation. Note that
4996 this usually occurs only for stack slots, in which case all the
4997 RTL would be referring to SRC, so we don't lose any optimization
4998 opportunities by not having SRC in the hash table. */
5000 if (GET_CODE (src) == MEM
5001 && find_reg_note (insn, REG_EQUIV, NULL_RTX) != 0
5002 && GET_CODE (dest) == REG
5003 && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
5004 sets[i].src_volatile = 1;
5006 #if 0
5007 /* It is no longer clear why we used to do this, but it doesn't
5008 appear to still be needed. So let's try without it since this
5009 code hurts cse'ing widened ops. */
5010 /* If source is a perverse subreg (such as QI treated as an SI),
5011 treat it as volatile. It may do the work of an SI in one context
5012 where the extra bits are not being used, but cannot replace an SI
5013 in general. */
5014 if (GET_CODE (src) == SUBREG
5015 && (GET_MODE_SIZE (GET_MODE (src))
5016 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))))
5017 sets[i].src_volatile = 1;
5018 #endif
5020 /* Locate all possible equivalent forms for SRC. Try to replace
5021 SRC in the insn with each cheaper equivalent.
5023 We have the following types of equivalents: SRC itself, a folded
5024 version, a value given in a REG_EQUAL note, or a value related
5025 to a constant.
5027 Each of these equivalents may be part of an additional class
5028 of equivalents (if more than one is in the table, they must be in
5029 the same class; we check for this).
5031 If the source is volatile, we don't do any table lookups.
5033 We note any constant equivalent for possible later use in a
5034 REG_NOTE. */
5036 if (!sets[i].src_volatile)
5037 elt = lookup (src, sets[i].src_hash, mode);
5039 sets[i].src_elt = elt;
5041 if (elt && src_eqv_here && src_eqv_elt)
5043 if (elt->first_same_value != src_eqv_elt->first_same_value)
5045 /* The REG_EQUAL is indicating that two formerly distinct
5046 classes are now equivalent. So merge them. */
5047 merge_equiv_classes (elt, src_eqv_elt);
5048 src_eqv_hash = HASH (src_eqv, elt->mode);
5049 src_eqv_elt = lookup (src_eqv, src_eqv_hash, elt->mode);
5052 src_eqv_here = 0;
5055 else if (src_eqv_elt)
5056 elt = src_eqv_elt;
5058 /* Try to find a constant somewhere and record it in `src_const'.
5059 Record its table element, if any, in `src_const_elt'. Look in
5060 any known equivalences first. (If the constant is not in the
5061 table, also set `sets[i].src_const_hash'). */
5062 if (elt)
5063 for (p = elt->first_same_value; p; p = p->next_same_value)
5064 if (p->is_const)
5066 src_const = p->exp;
5067 src_const_elt = elt;
5068 break;
5071 if (src_const == 0
5072 && (CONSTANT_P (src_folded)
5073 /* Consider (minus (label_ref L1) (label_ref L2)) as
5074 "constant" here so we will record it. This allows us
5075 to fold switch statements when an ADDR_DIFF_VEC is used. */
5076 || (GET_CODE (src_folded) == MINUS
5077 && GET_CODE (XEXP (src_folded, 0)) == LABEL_REF
5078 && GET_CODE (XEXP (src_folded, 1)) == LABEL_REF)))
5079 src_const = src_folded, src_const_elt = elt;
5080 else if (src_const == 0 && src_eqv_here && CONSTANT_P (src_eqv_here))
5081 src_const = src_eqv_here, src_const_elt = src_eqv_elt;
5083 /* If we don't know if the constant is in the table, get its
5084 hash code and look it up. */
5085 if (src_const && src_const_elt == 0)
5087 sets[i].src_const_hash = HASH (src_const, mode);
5088 src_const_elt = lookup (src_const, sets[i].src_const_hash, mode);
5091 sets[i].src_const = src_const;
5092 sets[i].src_const_elt = src_const_elt;
5094 /* If the constant and our source are both in the table, mark them as
5095 equivalent. Otherwise, if a constant is in the table but the source
5096 isn't, set ELT to it. */
5097 if (src_const_elt && elt
5098 && src_const_elt->first_same_value != elt->first_same_value)
5099 merge_equiv_classes (elt, src_const_elt);
5100 else if (src_const_elt && elt == 0)
5101 elt = src_const_elt;
5103 /* See if there is a register linearly related to a constant
5104 equivalent of SRC. */
5105 if (src_const
5106 && (GET_CODE (src_const) == CONST
5107 || (src_const_elt && src_const_elt->related_value != 0)))
5109 src_related = use_related_value (src_const, src_const_elt);
5110 if (src_related)
5112 struct table_elt *src_related_elt
5113 = lookup (src_related, HASH (src_related, mode), mode);
5114 if (src_related_elt && elt)
5116 if (elt->first_same_value
5117 != src_related_elt->first_same_value)
5118 /* This can occur when we previously saw a CONST
5119 involving a SYMBOL_REF and then see the SYMBOL_REF
5120 twice. Merge the involved classes. */
5121 merge_equiv_classes (elt, src_related_elt);
5123 src_related = 0;
5124 src_related_elt = 0;
5126 else if (src_related_elt && elt == 0)
5127 elt = src_related_elt;
5131 /* See if we have a CONST_INT that is already in a register in a
5132 wider mode. */
5134 if (src_const && src_related == 0 && GET_CODE (src_const) == CONST_INT
5135 && GET_MODE_CLASS (mode) == MODE_INT
5136 && GET_MODE_BITSIZE (mode) < BITS_PER_WORD)
5138 enum machine_mode wider_mode;
5140 for (wider_mode = GET_MODE_WIDER_MODE (mode);
5141 GET_MODE_BITSIZE (wider_mode) <= BITS_PER_WORD
5142 && src_related == 0;
5143 wider_mode = GET_MODE_WIDER_MODE (wider_mode))
5145 struct table_elt *const_elt
5146 = lookup (src_const, HASH (src_const, wider_mode), wider_mode);
5148 if (const_elt == 0)
5149 continue;
5151 for (const_elt = const_elt->first_same_value;
5152 const_elt; const_elt = const_elt->next_same_value)
5153 if (GET_CODE (const_elt->exp) == REG)
5155 src_related = gen_lowpart_if_possible (mode,
5156 const_elt->exp);
5157 break;
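      /* Editorial example, not in the original source: if (const_int 5)
         was previously loaded into (reg:DI 9), an SImode use of 5 can be
         replaced by the SImode lowpart of (reg:DI 9), avoiding a second
         constant load.  */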
5162 /* Another possibility is that we have an AND with a constant in
5163 a mode narrower than a word. If so, it might have been generated
5164 as part of an "if" which would narrow the AND. If we already
5165 have done the AND in a wider mode, we can use a SUBREG of that
5166 value. */
5168 if (flag_expensive_optimizations && ! src_related
5169 && GET_CODE (src) == AND && GET_CODE (XEXP (src, 1)) == CONST_INT
5170 && GET_MODE_SIZE (mode) < UNITS_PER_WORD)
5172 enum machine_mode tmode;
5173 rtx new_and = gen_rtx_AND (VOIDmode, NULL_RTX, XEXP (src, 1));
5175 for (tmode = GET_MODE_WIDER_MODE (mode);
5176 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
5177 tmode = GET_MODE_WIDER_MODE (tmode))
5179 rtx inner = gen_lowpart_if_possible (tmode, XEXP (src, 0));
5180 struct table_elt *larger_elt;
5182 if (inner)
5184 PUT_MODE (new_and, tmode);
5185 XEXP (new_and, 0) = inner;
5186 larger_elt = lookup (new_and, HASH (new_and, tmode), tmode);
5187 if (larger_elt == 0)
5188 continue;
5190 for (larger_elt = larger_elt->first_same_value;
5191 larger_elt; larger_elt = larger_elt->next_same_value)
5192 if (GET_CODE (larger_elt->exp) == REG)
5194 src_related
5195 = gen_lowpart_if_possible (mode, larger_elt->exp);
5196 break;
5199 if (src_related)
5200 break;
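      /* Editorial example, not in the original source: if
         (and:SI (reg 1) (const_int 255)) is already available in
         (reg:SI 8), a later HImode AND of the same value with 255 can
         reuse the HImode lowpart of (reg:SI 8) via src_related.  */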
5205 #ifdef LOAD_EXTEND_OP
5206 /* See if a MEM has already been loaded with a widening operation;
5207 if it has, we can use a subreg of that. Many CISC machines
5208 also have such operations, but this is only likely to be
5209 beneficial on these machines.
5211 if (flag_expensive_optimizations && src_related == 0
5212 && (GET_MODE_SIZE (mode) < UNITS_PER_WORD)
5213 && GET_MODE_CLASS (mode) == MODE_INT
5214 && GET_CODE (src) == MEM && ! do_not_record
5215 && LOAD_EXTEND_OP (mode) != NIL)
5217 enum machine_mode tmode;
5219 /* Set what we are trying to extend and the operation it might
5220 have been extended with. */
5221 PUT_CODE (memory_extend_rtx, LOAD_EXTEND_OP (mode));
5222 XEXP (memory_extend_rtx, 0) = src;
5224 for (tmode = GET_MODE_WIDER_MODE (mode);
5225 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
5226 tmode = GET_MODE_WIDER_MODE (tmode))
5228 struct table_elt *larger_elt;
5230 PUT_MODE (memory_extend_rtx, tmode);
5231 larger_elt = lookup (memory_extend_rtx,
5232 HASH (memory_extend_rtx, tmode), tmode);
5233 if (larger_elt == 0)
5234 continue;
5236 for (larger_elt = larger_elt->first_same_value;
5237 larger_elt; larger_elt = larger_elt->next_same_value)
5238 if (GET_CODE (larger_elt->exp) == REG)
5240 src_related = gen_lowpart_if_possible (mode,
5241 larger_elt->exp);
5242 break;
5245 if (src_related)
5246 break;
5249 #endif /* LOAD_EXTEND_OP */
5251 if (src == src_folded)
5252 src_folded = 0;
5254 /* At this point, ELT, if nonzero, points to a class of expressions
5255 equivalent to the source of this SET and SRC, SRC_EQV, SRC_FOLDED,
5256 and SRC_RELATED, if nonzero, each contain additional equivalent
5257 expressions. Prune these latter expressions by deleting expressions
5258 already in the equivalence class.
5260 Check for an equivalent identical to the destination. If found,
5261 this is the preferred equivalent since it will likely lead to
5262 elimination of the insn. Indicate this by placing it in
5263 `src_related'. */
5265 if (elt)
5266 elt = elt->first_same_value;
5267 for (p = elt; p; p = p->next_same_value)
5269 enum rtx_code code = GET_CODE (p->exp);
5271 /* If the expression is not valid, ignore it. Then we do not
5272 have to check for validity below. In most cases, we can use
5273 `rtx_equal_p', since canonicalization has already been done. */
5274 if (code != REG && ! exp_equiv_p (p->exp, p->exp, 1, 0))
5275 continue;
5277 /* Also skip paradoxical subregs, unless that's what we're
5278 looking for. */
5279 if (code == SUBREG
5280 && (GET_MODE_SIZE (GET_MODE (p->exp))
5281 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (p->exp))))
5282 && ! (src != 0
5283 && GET_CODE (src) == SUBREG
5284 && GET_MODE (src) == GET_MODE (p->exp)
5285 && (GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))
5286 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (p->exp))))))
5287 continue;
5289 if (src && GET_CODE (src) == code && rtx_equal_p (src, p->exp))
5290 src = 0;
5291 else if (src_folded && GET_CODE (src_folded) == code
5292 && rtx_equal_p (src_folded, p->exp))
5293 src_folded = 0;
5294 else if (src_eqv_here && GET_CODE (src_eqv_here) == code
5295 && rtx_equal_p (src_eqv_here, p->exp))
5296 src_eqv_here = 0;
5297 else if (src_related && GET_CODE (src_related) == code
5298 && rtx_equal_p (src_related, p->exp))
5299 src_related = 0;
5301 /* If this is the same as the destination of the insn, we want
5302 to prefer it. Copy it to src_related. The code below will
5303 then give it a negative cost. */
5304 if (GET_CODE (dest) == code && rtx_equal_p (p->exp, dest))
5305 src_related = dest;
5308 /* Find the cheapest valid equivalent, trying all the available
5309 possibilities. Prefer items not in the hash table to ones
5310 that are when they are equal cost. Note that we can never
5311 worsen an insn as the current contents will also succeed.
5312 If we find an equivalent identical to the destination, use it as best,
5313 since this insn will probably be eliminated in that case. */
5314 if (src)
5316 if (rtx_equal_p (src, dest))
5317 src_cost = src_regcost = -1;
5318 else
5320 src_cost = COST (src);
5321 src_regcost = approx_reg_cost (src);
5325 if (src_eqv_here)
5327 if (rtx_equal_p (src_eqv_here, dest))
5328 src_eqv_cost = src_eqv_regcost = -1;
5329 else
5331 src_eqv_cost = COST (src_eqv_here);
5332 src_eqv_regcost = approx_reg_cost (src_eqv_here);
5336 if (src_folded)
5338 if (rtx_equal_p (src_folded, dest))
5339 src_folded_cost = src_folded_regcost = -1;
5340 else
5342 src_folded_cost = COST (src_folded);
5343 src_folded_regcost = approx_reg_cost (src_folded);
5347 if (src_related)
5349 if (rtx_equal_p (src_related, dest))
5350 src_related_cost = src_related_regcost = -1;
5351 else
5353 src_related_cost = COST (src_related);
5354 src_related_regcost = approx_reg_cost (src_related);
5358 /* If this was an indirect jump insn, a known label will really be
5359 cheaper even though it looks more expensive. */
5360 if (dest == pc_rtx && src_const && GET_CODE (src_const) == LABEL_REF)
5361 src_folded = src_const, src_folded_cost = src_folded_regcost = -1;
5363 /* Terminate loop when replacement made. This must terminate since
5364 the current contents will be tested and will always be valid. */
5365 while (1)
5367 rtx trial;
5369 /* Skip invalid entries. */
5370 while (elt && GET_CODE (elt->exp) != REG
5371 && ! exp_equiv_p (elt->exp, elt->exp, 1, 0))
5372 elt = elt->next_same_value;
5374 /* A paradoxical subreg would be bad here: it'll be the right
5375 size, but later may be adjusted so that the upper bits aren't
5376 what we want. So reject it. */
5377 if (elt != 0
5378 && GET_CODE (elt->exp) == SUBREG
5379 && (GET_MODE_SIZE (GET_MODE (elt->exp))
5380 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (elt->exp))))
5381 /* It is okay, though, if the rtx we're trying to match
5382 will ignore any of the bits we can't predict. */
5383 && ! (src != 0
5384 && GET_CODE (src) == SUBREG
5385 && GET_MODE (src) == GET_MODE (elt->exp)
5386 && (GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))
5387 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (elt->exp))))))
5389 elt = elt->next_same_value;
5390 continue;
5393 if (elt)
5395 src_elt_cost = elt->cost;
5396 src_elt_regcost = elt->regcost;
5399 /* Find cheapest and skip it for the next time. For items
5400 of equal cost, use this order:
5401 src_folded, src, src_eqv, src_related and hash table entry. */
5402 if (src_folded
5403 && preferrable (src_folded_cost, src_folded_regcost,
5404 src_cost, src_regcost) <= 0
5405 && preferrable (src_folded_cost, src_folded_regcost,
5406 src_eqv_cost, src_eqv_regcost) <= 0
5407 && preferrable (src_folded_cost, src_folded_regcost,
5408 src_related_cost, src_related_regcost) <= 0
5409 && preferrable (src_folded_cost, src_folded_regcost,
5410 src_elt_cost, src_elt_regcost) <= 0)
5412 trial = src_folded, src_folded_cost = MAX_COST;
5413 if (src_folded_force_flag)
5414 trial = force_const_mem (mode, trial);
5416 else if (src
5417 && preferrable (src_cost, src_regcost,
5418 src_eqv_cost, src_eqv_regcost) <= 0
5419 && preferrable (src_cost, src_regcost,
5420 src_related_cost, src_related_regcost) <= 0
5421 && preferrable (src_cost, src_regcost,
5422 src_elt_cost, src_elt_regcost) <= 0)
5423 trial = src, src_cost = MAX_COST;
5424 else if (src_eqv_here
5425 && preferrable (src_eqv_cost, src_eqv_regcost,
5426 src_related_cost, src_related_regcost) <= 0
5427 && preferrable (src_eqv_cost, src_eqv_regcost,
5428 src_elt_cost, src_elt_regcost) <= 0)
5429 trial = copy_rtx (src_eqv_here), src_eqv_cost = MAX_COST;
5430 else if (src_related
5431 && preferrable (src_related_cost, src_related_regcost,
5432 src_elt_cost, src_elt_regcost) <= 0)
5433 trial = copy_rtx (src_related), src_related_cost = MAX_COST;
5434 else
5436 trial = copy_rtx (elt->exp);
5437 elt = elt->next_same_value;
5438 src_elt_cost = MAX_COST;
5441 /* We don't normally have an insn matching (set (pc) (pc)), so
5442 check for this separately here. We will delete such an
5443 insn below.
5445 For other cases such as a table jump or conditional jump
5446 where we know the ultimate target, go ahead and replace the
5447 operand. While that may not make a valid insn, we will
5448 reemit the jump below (and also insert any necessary
5449 barriers). */
5450 if (n_sets == 1 && dest == pc_rtx
5451 && (trial == pc_rtx
5452 || (GET_CODE (trial) == LABEL_REF
5453 && ! condjump_p (insn))))
5455 SET_SRC (sets[i].rtl) = trial;
5456 cse_jumps_altered = 1;
5457 break;
5460 /* Look for a substitution that makes a valid insn. */
5461 else if (validate_change (insn, &SET_SRC (sets[i].rtl), trial, 0))
5463 rtx new = canon_reg (SET_SRC (sets[i].rtl), insn);
5465 /* If we just made a substitution inside a libcall, then we
5466 need to make the same substitution in any notes attached
5467 to the RETVAL insn. */
5468 if (libcall_insn
5469 && (GET_CODE (sets[i].orig_src) == REG
5470 || GET_CODE (sets[i].orig_src) == SUBREG
5471 || GET_CODE (sets[i].orig_src) == MEM))
5472 simplify_replace_rtx (REG_NOTES (libcall_insn),
5473 sets[i].orig_src, copy_rtx (new));
5475 /* The result of apply_change_group can be ignored; see
5476 canon_reg. */
5478 validate_change (insn, &SET_SRC (sets[i].rtl), new, 1);
5479 apply_change_group ();
5480 break;
5483 /* If we previously found constant pool entries for
5484 constants and this is a constant, try making a
5485 pool entry. Put it in src_folded unless we have already done
5486 this, since that is where it likely came from. */
5488 else if (constant_pool_entries_cost
5489 && CONSTANT_P (trial)
5490 /* Reject cases that will abort in decode_rtx_const.
5491 On the alpha when simplifying a switch, we get
5492 (const (truncate (minus (label_ref) (label_ref)))). */
5493 && ! (GET_CODE (trial) == CONST
5494 && GET_CODE (XEXP (trial, 0)) == TRUNCATE)
5495 /* Likewise on IA-64, except without the truncate. */
5496 && ! (GET_CODE (trial) == CONST
5497 && GET_CODE (XEXP (trial, 0)) == MINUS
5498 && GET_CODE (XEXP (XEXP (trial, 0), 0)) == LABEL_REF
5499 && GET_CODE (XEXP (XEXP (trial, 0), 1)) == LABEL_REF)
5500 && (src_folded == 0
5501 || (GET_CODE (src_folded) != MEM
5502 && ! src_folded_force_flag))
5503 && GET_MODE_CLASS (mode) != MODE_CC
5504 && mode != VOIDmode)
5506 src_folded_force_flag = 1;
5507 src_folded = trial;
5508 src_folded_cost = constant_pool_entries_cost;
5512 src = SET_SRC (sets[i].rtl);
5514 /* In general, it is good to have a SET with SET_SRC == SET_DEST.
5515 However, there is an important exception: If both are registers
5516 that are not the head of their equivalence class, replace SET_SRC
5517 with the head of the class. If we do not do this, we will have
5518 both registers live over a portion of the basic block. This way,
5519 their lifetimes will likely abut instead of overlapping. */
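/* For instance (register numbers purely illustrative): if this insn
   has become (set (reg 120) (reg 120)) while (reg 117) is the head of
   that quantity's class, we rewrite it as (set (reg 120) (reg 117))
   so that the lifetime of reg 117 can end where reg 120's begins.  */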
5520 if (GET_CODE (dest) == REG
5521 && REGNO_QTY_VALID_P (REGNO (dest)))
5523 int dest_q = REG_QTY (REGNO (dest));
5524 struct qty_table_elem *dest_ent = &qty_table[dest_q];
5526 if (dest_ent->mode == GET_MODE (dest)
5527 && dest_ent->first_reg != REGNO (dest)
5528 && GET_CODE (src) == REG && REGNO (src) == REGNO (dest)
5529 /* Don't do this if the original insn had a hard reg as
5530 SET_SRC or SET_DEST. */
5531 && (GET_CODE (sets[i].src) != REG
5532 || REGNO (sets[i].src) >= FIRST_PSEUDO_REGISTER)
5533 && (GET_CODE (dest) != REG || REGNO (dest) >= FIRST_PSEUDO_REGISTER))
5534 /* We can't call canon_reg here because it won't do anything if
5535 SRC is a hard register. */
5537 int src_q = REG_QTY (REGNO (src));
5538 struct qty_table_elem *src_ent = &qty_table[src_q];
5539 int first = src_ent->first_reg;
5540 rtx new_src
5541 = (first >= FIRST_PSEUDO_REGISTER
5542 ? regno_reg_rtx[first] : gen_rtx_REG (GET_MODE (src), first));
5544 /* We must use validate_change even for this, because this
5545 might be a special no-op instruction, suitable only to
5546 tag notes onto. */
5547 if (validate_change (insn, &SET_SRC (sets[i].rtl), new_src, 0))
5549 src = new_src;
5550 /* If we had a constant that is cheaper than what we are now
5551 setting SRC to, use that constant. We ignored it when we
5552 thought we could make this into a no-op. */
5553 if (src_const && COST (src_const) < COST (src)
5554 && validate_change (insn, &SET_SRC (sets[i].rtl),
5555 src_const, 0))
5556 src = src_const;
5561 /* If we made a change, recompute SRC values. */
5562 if (src != sets[i].src)
5564 cse_altered = 1;
5565 do_not_record = 0;
5566 hash_arg_in_memory = 0;
5567 sets[i].src = src;
5568 sets[i].src_hash = HASH (src, mode);
5569 sets[i].src_volatile = do_not_record;
5570 sets[i].src_in_memory = hash_arg_in_memory;
5571 sets[i].src_elt = lookup (src, sets[i].src_hash, mode);
5574 /* If this is a single SET, we are setting a register, and we have an
5575 equivalent constant, we want to add a REG_NOTE. We don't want
5576 to write a REG_EQUAL note for a constant pseudo since verifying that
5577 that pseudo hasn't been eliminated is a pain. Such a note also
5578 won't help anything.
5580 Avoid a REG_EQUAL note for (CONST (MINUS (LABEL_REF) (LABEL_REF)))
5581 which can be created for a reference to a compile time computable
5582 entry in a jump table. */
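/* An illustrative case (register numbers hypothetical): if (reg 116)
   is known to hold (const_int 64), then for
   (set (reg 117) (plus (reg 116) (const_int 4)))
   we attach (REG_EQUAL (const_int 68)) to the insn.  */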
5584 if (n_sets == 1 && src_const && GET_CODE (dest) == REG
5585 && GET_CODE (src_const) != REG
5586 && ! (GET_CODE (src_const) == CONST
5587 && GET_CODE (XEXP (src_const, 0)) == MINUS
5588 && GET_CODE (XEXP (XEXP (src_const, 0), 0)) == LABEL_REF
5589 && GET_CODE (XEXP (XEXP (src_const, 0), 1)) == LABEL_REF))
5591 /* We only want a REG_EQUAL note if src_const != src. */
5592 if (! rtx_equal_p (src, src_const))
5594 /* Make sure that the rtx is not shared. */
5595 src_const = copy_rtx (src_const);
5597 /* Record the actual constant value in a REG_EQUAL note,
5598 making a new one if one does not already exist. */
5599 set_unique_reg_note (insn, REG_EQUAL, src_const);
5603 /* Now deal with the destination. */
5604 do_not_record = 0;
5606 /* Strip any SIGN_EXTRACT, ZERO_EXTRACT, SUBREG or STRICT_LOW_PART
5607 to get down to the MEM or REG within it. */
5608 while (GET_CODE (dest) == SIGN_EXTRACT
5609 || GET_CODE (dest) == ZERO_EXTRACT
5610 || GET_CODE (dest) == SUBREG
5611 || GET_CODE (dest) == STRICT_LOW_PART)
5612 dest = XEXP (dest, 0);
5614 sets[i].inner_dest = dest;
5616 if (GET_CODE (dest) == MEM)
5618 #ifdef PUSH_ROUNDING
5619 /* Stack pushes invalidate the stack pointer. */
5620 rtx addr = XEXP (dest, 0);
5621 if (GET_RTX_CLASS (GET_CODE (addr)) == 'a'
5622 && XEXP (addr, 0) == stack_pointer_rtx)
5623 invalidate (stack_pointer_rtx, Pmode);
5624 #endif
5625 dest = fold_rtx (dest, insn);
5628 /* Compute the hash code of the destination now,
5629 before the effects of this instruction are recorded,
5630 since the register values used in the address computation
5631 are those before this instruction. */
5632 sets[i].dest_hash = HASH (dest, mode);
5634 /* Don't enter a bit-field in the hash table
5635 because the value in it after the store
5636 may not equal what was stored, due to truncation. */
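/* For example, storing (const_int 31) into a 4-bit field leaves 15
   in the field, so recording 31 as its contents would be wrong; the
   test below therefore accepts only constants whose bits at or above
   WIDTH are all zero.  */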
5638 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT
5639 || GET_CODE (SET_DEST (sets[i].rtl)) == SIGN_EXTRACT)
5641 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
5643 if (src_const != 0 && GET_CODE (src_const) == CONST_INT
5644 && GET_CODE (width) == CONST_INT
5645 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
5646 && ! (INTVAL (src_const)
5647 & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
5648 /* Exception: if the value is constant,
5649 and it won't be truncated, record it. */
5651 else
5653 /* This is chosen so that the destination will be invalidated
5654 but no new value will be recorded.
5655 We must invalidate because sometimes constant
5656 values can be recorded for bitfields. */
5657 sets[i].src_elt = 0;
5658 sets[i].src_volatile = 1;
5659 src_eqv = 0;
5660 src_eqv_elt = 0;
5664 /* If a JUMP_INSN has only one SET and it is now a no-op, we can
5665 delete the insn. */
5666 else if (n_sets == 1 && dest == pc_rtx && src == pc_rtx)
5668 /* One less use of the label this insn used to jump to. */
5669 delete_insn (insn);
5670 cse_jumps_altered = 1;
5671 /* No more processing for this set. */
5672 sets[i].rtl = 0;
5675 /* If this SET is now setting PC to a label, we know it used to
5676 be a conditional or computed branch. */
5677 else if (dest == pc_rtx && GET_CODE (src) == LABEL_REF)
5679 /* Now emit a BARRIER after the unconditional jump. */
5680 if (NEXT_INSN (insn) == 0
5681 || GET_CODE (NEXT_INSN (insn)) != BARRIER)
5682 emit_barrier_after (insn);
5684 /* We reemit the jump in as many cases as possible just in
5685 case the form of an unconditional jump is significantly
5686 different from a computed jump or conditional jump.
5688 If this insn has multiple sets, then reemitting the
5689 jump is nontrivial. So instead we just force rerecognition
5690 and hope for the best. */
5691 if (n_sets == 1)
5693 rtx new = emit_jump_insn_after (gen_jump (XEXP (src, 0)), insn);
5695 JUMP_LABEL (new) = XEXP (src, 0);
5696 LABEL_NUSES (XEXP (src, 0))++;
5697 delete_insn (insn);
5698 insn = new;
5700 /* Now emit a BARRIER after the unconditional jump. */
5701 if (NEXT_INSN (insn) == 0
5702 || GET_CODE (NEXT_INSN (insn)) != BARRIER)
5703 emit_barrier_after (insn);
5705 else
5706 INSN_CODE (insn) = -1;
5708 never_reached_warning (insn, NULL);
5710 /* Do not bother deleting any unreachable code,
5711 let jump/flow do that. */
5713 cse_jumps_altered = 1;
5714 sets[i].rtl = 0;
5717 /* If destination is volatile, invalidate it and then do no further
5718 processing for this assignment. */
5720 else if (do_not_record)
5722 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG)
5723 invalidate (dest, VOIDmode);
5724 else if (GET_CODE (dest) == MEM)
5726 /* Outgoing arguments for a libcall don't
5727 affect any recorded expressions. */
5728 if (! libcall_insn || insn == libcall_insn)
5729 invalidate (dest, VOIDmode);
5731 else if (GET_CODE (dest) == STRICT_LOW_PART
5732 || GET_CODE (dest) == ZERO_EXTRACT)
5733 invalidate (XEXP (dest, 0), GET_MODE (dest));
5734 sets[i].rtl = 0;
5737 if (sets[i].rtl != 0 && dest != SET_DEST (sets[i].rtl))
5738 sets[i].dest_hash = HASH (SET_DEST (sets[i].rtl), mode);
5740 #ifdef HAVE_cc0
5741 /* If setting CC0, record what it was set to, or a constant, if it
5742 is equivalent to a constant. If it is being set to a floating-point
5743 value, make a COMPARE with the appropriate constant of 0. If we
5744 don't do this, later code can interpret this as a test against
5745 const0_rtx, which can cause problems if we try to put it into an
5746 insn as a floating-point operand. */
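/* Illustration (register number hypothetical): for
   (set (cc0) (reg:SF 100)) we record
   (compare (reg:SF 100) (const_double 0.0)) rather than the bare
   register.  */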
5747 if (dest == cc0_rtx)
5749 this_insn_cc0 = src_const && mode != VOIDmode ? src_const : src;
5750 this_insn_cc0_mode = mode;
5751 if (FLOAT_MODE_P (mode))
5752 this_insn_cc0 = gen_rtx_COMPARE (VOIDmode, this_insn_cc0,
5753 CONST0_RTX (mode));
5755 #endif
5758 /* Now enter all non-volatile source expressions in the hash table
5759 if they are not already present.
5760 Record their equivalence classes in src_elt.
5761 This way we can insert the corresponding destinations into
5762 the same classes even if the actual sources are no longer in them
5763 (having been invalidated). */
5765 if (src_eqv && src_eqv_elt == 0 && sets[0].rtl != 0 && ! src_eqv_volatile
5766 && ! rtx_equal_p (src_eqv, SET_DEST (sets[0].rtl)))
5768 struct table_elt *elt;
5769 struct table_elt *classp = sets[0].src_elt;
5770 rtx dest = SET_DEST (sets[0].rtl);
5771 enum machine_mode eqvmode = GET_MODE (dest);
5773 if (GET_CODE (dest) == STRICT_LOW_PART)
5775 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
5776 classp = 0;
5778 if (insert_regs (src_eqv, classp, 0))
5780 rehash_using_reg (src_eqv);
5781 src_eqv_hash = HASH (src_eqv, eqvmode);
5783 elt = insert (src_eqv, classp, src_eqv_hash, eqvmode);
5784 elt->in_memory = src_eqv_in_memory;
5785 src_eqv_elt = elt;
5787 /* Check to see if src_eqv_elt is the same as a set source which
5788 does not yet have an elt, and if so set the elt of the set source
5789 to src_eqv_elt. */
5790 for (i = 0; i < n_sets; i++)
5791 if (sets[i].rtl && sets[i].src_elt == 0
5792 && rtx_equal_p (SET_SRC (sets[i].rtl), src_eqv))
5793 sets[i].src_elt = src_eqv_elt;
5796 for (i = 0; i < n_sets; i++)
5797 if (sets[i].rtl && ! sets[i].src_volatile
5798 && ! rtx_equal_p (SET_SRC (sets[i].rtl), SET_DEST (sets[i].rtl)))
5800 if (GET_CODE (SET_DEST (sets[i].rtl)) == STRICT_LOW_PART)
5802 /* REG_EQUAL in setting a STRICT_LOW_PART
5803 gives an equivalent for the entire destination register,
5804 not just for the subreg being stored in now.
5805 This is a more interesting equivalence, so we arrange later
5806 to treat the entire reg as the destination. */
5807 sets[i].src_elt = src_eqv_elt;
5808 sets[i].src_hash = src_eqv_hash;
5810 else
5812 /* Insert source and constant equivalent into hash table, if not
5813 already present. */
5814 struct table_elt *classp = src_eqv_elt;
5815 rtx src = sets[i].src;
5816 rtx dest = SET_DEST (sets[i].rtl);
5817 enum machine_mode mode
5818 = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
5820 if (sets[i].src_elt == 0)
5822 /* Don't put a hard register source into the table if this is
5823 the last insn of a libcall. In this case, we only need
5824 to put src_eqv_elt in src_elt. */
5825 if (! find_reg_note (insn, REG_RETVAL, NULL_RTX))
5827 struct table_elt *elt;
5829 /* Note that these insert_regs calls cannot remove
5830 any of the src_elt's, because they would have failed to
5831 match if not still valid. */
5832 if (insert_regs (src, classp, 0))
5834 rehash_using_reg (src);
5835 sets[i].src_hash = HASH (src, mode);
5837 elt = insert (src, classp, sets[i].src_hash, mode);
5838 elt->in_memory = sets[i].src_in_memory;
5839 sets[i].src_elt = classp = elt;
5841 else
5842 sets[i].src_elt = classp;
5844 if (sets[i].src_const && sets[i].src_const_elt == 0
5845 && src != sets[i].src_const
5846 && ! rtx_equal_p (sets[i].src_const, src))
5847 sets[i].src_elt = insert (sets[i].src_const, classp,
5848 sets[i].src_const_hash, mode);
5851 else if (sets[i].src_elt == 0)
5852 /* If we did not insert the source into the hash table (e.g., it was
5853 volatile), note the equivalence class for the REG_EQUAL value, if any,
5854 so that the destination goes into that class. */
5855 sets[i].src_elt = src_eqv_elt;
5857 invalidate_from_clobbers (x);
5859 /* Some registers are invalidated by subroutine calls. Memory is
5860 invalidated by non-constant calls. */
5862 if (GET_CODE (insn) == CALL_INSN)
5864 if (! CONST_OR_PURE_CALL_P (insn))
5865 invalidate_memory ();
5866 invalidate_for_call ();
5869 /* Now invalidate everything set by this instruction.
5870 If a SUBREG or other funny destination is being set,
5871 sets[i].rtl is still nonzero, so here we invalidate the reg
5872 a part of which is being set. */
5874 for (i = 0; i < n_sets; i++)
5875 if (sets[i].rtl)
5877 /* We can't use the inner dest, because the mode associated with
5878 a ZERO_EXTRACT is significant. */
5879 rtx dest = SET_DEST (sets[i].rtl);
5881 /* Needed for registers to remove the register from its
5882 previous quantity's chain.
5883 Needed for memory if this is a nonvarying address, unless
5884 we have just done an invalidate_memory that covers even those. */
5885 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG)
5886 invalidate (dest, VOIDmode);
5887 else if (GET_CODE (dest) == MEM)
5889 /* Outgoing arguments for a libcall don't
5890 affect any recorded expressions. */
5891 if (! libcall_insn || insn == libcall_insn)
5892 invalidate (dest, VOIDmode);
5894 else if (GET_CODE (dest) == STRICT_LOW_PART
5895 || GET_CODE (dest) == ZERO_EXTRACT)
5896 invalidate (XEXP (dest, 0), GET_MODE (dest));
5899 /* A volatile ASM invalidates everything. */
5900 if (GET_CODE (insn) == INSN
5901 && GET_CODE (PATTERN (insn)) == ASM_OPERANDS
5902 && MEM_VOLATILE_P (PATTERN (insn)))
5903 flush_hash_table ();
5905 /* Make sure registers mentioned in destinations
5906 are safe for use in an expression to be inserted.
5907 This removes from the hash table
5908 any invalid entry that refers to one of these registers.
5910 We don't care about the return value from mention_regs because
5911 we are going to hash the SET_DEST values unconditionally. */
5913 for (i = 0; i < n_sets; i++)
5915 if (sets[i].rtl)
5917 rtx x = SET_DEST (sets[i].rtl);
5919 if (GET_CODE (x) != REG)
5920 mention_regs (x);
5921 else
5923 /* We used to rely on all references to a register becoming
5924 inaccessible when a register changes to a new quantity,
5925 since that changes the hash code. However, that is not
5926 safe, since after HASH_SIZE new quantities we get a
5927 hash 'collision' of a register with its own invalid
5928 entries. And since SUBREGs have been changed so that their
5929 hash code no longer varies with the hash code of the register,
5930 that scheme wouldn't work at all any longer. So we have to check
5931 for any invalid references lying around now.
5932 This code is similar to the REG case in mention_regs,
5933 but it knows that reg_tick has been incremented, and
5934 it leaves reg_in_table as -1. */
5935 unsigned int regno = REGNO (x);
5936 unsigned int endregno
5937 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
5938 : HARD_REGNO_NREGS (regno, GET_MODE (x)));
5939 unsigned int i;
5941 for (i = regno; i < endregno; i++)
5943 if (REG_IN_TABLE (i) >= 0)
5945 remove_invalid_refs (i);
5946 REG_IN_TABLE (i) = -1;
5953 /* We may have just removed some of the src_elt's from the hash table.
5954 So replace each one with the current head of the same class. */
5956 for (i = 0; i < n_sets; i++)
5957 if (sets[i].rtl)
5959 if (sets[i].src_elt && sets[i].src_elt->first_same_value == 0)
5960 /* If elt was removed, find current head of same class,
5961 or 0 if nothing remains of that class. */
5963 struct table_elt *elt = sets[i].src_elt;
5965 while (elt && elt->prev_same_value)
5966 elt = elt->prev_same_value;
5968 while (elt && elt->first_same_value == 0)
5969 elt = elt->next_same_value;
5970 sets[i].src_elt = elt ? elt->first_same_value : 0;
5974 /* Now insert the destinations into their equivalence classes. */
5976 for (i = 0; i < n_sets; i++)
5977 if (sets[i].rtl)
5979 rtx dest = SET_DEST (sets[i].rtl);
5980 rtx inner_dest = sets[i].inner_dest;
5981 struct table_elt *elt;
5983 /* Don't record value if we are not supposed to risk allocating
5984 floating-point values in registers that might be wider than
5985 memory. */
5986 if ((flag_float_store
5987 && GET_CODE (dest) == MEM
5988 && FLOAT_MODE_P (GET_MODE (dest)))
5989 /* Don't record BLKmode values, because we don't know the
5990 size of it, and can't be sure that other BLKmode values
5991 have the same or smaller size. */
5992 || GET_MODE (dest) == BLKmode
5993 /* Don't record values of destinations set inside a libcall block
5994 since we might delete the libcall. Things should have been set
5995 up so we won't want to reuse such a value, but we play it safe
5996 here. */
5997 || libcall_insn
5998 /* If we didn't put a REG_EQUAL value or a source into the hash
5999 table, there is no point in recording DEST. */
6000 || sets[i].src_elt == 0
6001 /* If DEST is a paradoxical SUBREG and SRC is a ZERO_EXTEND
6002 or SIGN_EXTEND, don't record DEST since it can cause
6003 some tracking to be wrong.
6005 ??? Think about this more later. */
6006 || (GET_CODE (dest) == SUBREG
6007 && (GET_MODE_SIZE (GET_MODE (dest))
6008 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))))
6009 && (GET_CODE (sets[i].src) == SIGN_EXTEND
6010 || GET_CODE (sets[i].src) == ZERO_EXTEND)))
6011 continue;
6013 /* STRICT_LOW_PART isn't part of the value BEING set,
6014 and neither is the SUBREG inside it.
6015 Note that in this case SETS[I].SRC_ELT is really SRC_EQV_ELT. */
6016 if (GET_CODE (dest) == STRICT_LOW_PART)
6017 dest = SUBREG_REG (XEXP (dest, 0));
6019 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG)
6020 /* Registers must also be inserted into chains for quantities. */
6021 if (insert_regs (dest, sets[i].src_elt, 1))
6023 /* If `insert_regs' changes something, the hash code must be
6024 recalculated. */
6025 rehash_using_reg (dest);
6026 sets[i].dest_hash = HASH (dest, GET_MODE (dest));
6029 if (GET_CODE (inner_dest) == MEM
6030 && GET_CODE (XEXP (inner_dest, 0)) == ADDRESSOF)
6031 /* Given (SET (MEM (ADDRESSOF (X))) Y) we don't want to say
6032 that (MEM (ADDRESSOF (X))) is equivalent to Y.
6033 Consider the case in which the address of the MEM is
6034 passed to a function, which alters the MEM. Then, if we
6035 later use Y instead of the MEM we'll miss the update. */
6036 elt = insert (dest, 0, sets[i].dest_hash, GET_MODE (dest));
6037 else
6038 elt = insert (dest, sets[i].src_elt,
6039 sets[i].dest_hash, GET_MODE (dest));
6041 elt->in_memory = (GET_CODE (sets[i].inner_dest) == MEM
6042 && (! RTX_UNCHANGING_P (sets[i].inner_dest)
6043 || fixed_base_plus_p (XEXP (sets[i].inner_dest,
6044 0))));
6046 /* If we have (set (subreg:m1 (reg:m2 foo) 0) (bar:m1)), M1 is no
6047 narrower than M2, and both M1 and M2 are the same number of words,
6048 we are also doing (set (reg:m2 foo) (subreg:m2 (bar:m1) 0)) so
6049 make that equivalence as well.
6051 However, BAR may have equivalences for which gen_lowpart_if_possible
6052 will produce a simpler value than it would when applied to BAR
6053 itself (e.g., if BAR was ZERO_EXTENDed from M2), so we will scan all
6054 BAR's equivalences. If we don't get a simplified form, make
6055 the SUBREG. It will not be used in an equivalence, but will
6056 cause two similar assignments to be detected.
6058 Note the loop below will find SUBREG_REG (DEST) since we have
6059 already entered SRC and DEST of the SET in the table. */
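/* An illustrative instance (register numbers hypothetical), on a
   target where SImode and HImode both occupy one word: from
   (set (subreg:SI (reg:HI 100) 0) (reg:SI 101)) we also record the
   equivalence of (reg:HI 100) and (subreg:HI (reg:SI 101) 0).  */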
6061 if (GET_CODE (dest) == SUBREG
6062 && (((GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))) - 1)
6063 / UNITS_PER_WORD)
6064 == (GET_MODE_SIZE (GET_MODE (dest)) - 1) / UNITS_PER_WORD)
6065 && (GET_MODE_SIZE (GET_MODE (dest))
6066 >= GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))))
6067 && sets[i].src_elt != 0)
6069 enum machine_mode new_mode = GET_MODE (SUBREG_REG (dest));
6070 struct table_elt *elt, *classp = 0;
6072 for (elt = sets[i].src_elt->first_same_value; elt;
6073 elt = elt->next_same_value)
6075 rtx new_src = 0;
6076 unsigned src_hash;
6077 struct table_elt *src_elt;
6078 int byte = 0;
6080 /* Ignore invalid entries. */
6081 if (GET_CODE (elt->exp) != REG
6082 && ! exp_equiv_p (elt->exp, elt->exp, 1, 0))
6083 continue;
6085 /* We may have already been playing subreg games. If the
6086 mode is already correct for the destination, use it. */
6087 if (GET_MODE (elt->exp) == new_mode)
6088 new_src = elt->exp;
6089 else
6091 /* Calculate big endian correction for the SUBREG_BYTE.
6092 We have already checked that M1 (GET_MODE (dest))
6093 is not narrower than M2 (new_mode). */
6094 if (BYTES_BIG_ENDIAN)
6095 byte = (GET_MODE_SIZE (GET_MODE (dest))
6096 - GET_MODE_SIZE (new_mode));
6098 new_src = simplify_gen_subreg (new_mode, elt->exp,
6099 GET_MODE (dest), byte);
6102 /* The call to simplify_gen_subreg fails if the value
6103 is VOIDmode and no simplification can be done, e.g.
6104 for EXPR_LISTs denoting function call results.
6105 It is invalid to construct a SUBREG with a VOIDmode
6106 SUBREG_REG, hence a zero new_src means we can't do
6107 this substitution. */
6108 if (! new_src)
6109 continue;
6111 src_hash = HASH (new_src, new_mode);
6112 src_elt = lookup (new_src, src_hash, new_mode);
6114 /* Put the new source in the hash table if it isn't
6115 there already. */
6116 if (src_elt == 0)
6118 if (insert_regs (new_src, classp, 0))
6120 rehash_using_reg (new_src);
6121 src_hash = HASH (new_src, new_mode);
6123 src_elt = insert (new_src, classp, src_hash, new_mode);
6124 src_elt->in_memory = elt->in_memory;
6126 else if (classp && classp != src_elt->first_same_value)
6127 /* Show that two things that we've seen before are
6128 actually the same. */
6129 merge_equiv_classes (src_elt, classp);
6131 classp = src_elt->first_same_value;
6132 /* Ignore invalid entries. */
6133 while (classp
6134 && GET_CODE (classp->exp) != REG
6135 && ! exp_equiv_p (classp->exp, classp->exp, 1, 0))
6136 classp = classp->next_same_value;
6141 /* Special handling for (set REG0 REG1) where REG0 is the
6142 "cheapest", cheaper than REG1. After cse, REG1 will probably not
6143 be used in the sequel, so (if easily done) change this insn to
6144 (set REG1 REG0) and replace REG1 with REG0 in the previous insn
6145 that computed their value. Then REG1 will become a dead store
6146 and won't cloud the situation for later optimizations.
6148 Do not make this change if REG1 is a hard register, because it will
6149 then be used in the sequel and we may be changing a two-operand insn
6150 into a three-operand insn.
6152 Also do not do this if we are operating on a copy of INSN.
6154 Also don't do this if INSN ends a libcall; this would cause an unrelated
6155 register to be set in the middle of a libcall, and we then get bad code
6156 if the libcall is deleted. */
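/* A sketch of the rewrite (insns and register numbers hypothetical):
       (set (reg 118) (mult (reg 115) (reg 116)))
       (set (reg 117) (reg 118))     ; reg 117 is the class head
   becomes
       (set (reg 117) (mult (reg 115) (reg 116)))
       (set (reg 118) (reg 117))     ; now likely a dead store  */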
6158 if (n_sets == 1 && sets[0].rtl && GET_CODE (SET_DEST (sets[0].rtl)) == REG
6159 && NEXT_INSN (PREV_INSN (insn)) == insn
6160 && GET_CODE (SET_SRC (sets[0].rtl)) == REG
6161 && REGNO (SET_SRC (sets[0].rtl)) >= FIRST_PSEUDO_REGISTER
6162 && REGNO_QTY_VALID_P (REGNO (SET_SRC (sets[0].rtl))))
6164 int src_q = REG_QTY (REGNO (SET_SRC (sets[0].rtl)));
6165 struct qty_table_elem *src_ent = &qty_table[src_q];
6167 if ((src_ent->first_reg == REGNO (SET_DEST (sets[0].rtl)))
6168 && ! find_reg_note (insn, REG_RETVAL, NULL_RTX))
6170 rtx prev = insn;
6171 /* Scan for the previous nonnote insn, but stop at a basic
6172 block boundary. */
6175 prev = PREV_INSN (prev);
6177 while (prev && GET_CODE (prev) == NOTE
6178 && NOTE_LINE_NUMBER (prev) != NOTE_INSN_BASIC_BLOCK);
6180 /* Do not swap the registers around if the previous instruction
6181 attaches a REG_EQUIV note to REG1.
6183 ??? It's not entirely clear whether we can transfer a REG_EQUIV
6184 from the pseudo that originally shadowed an incoming argument
6185 to another register. Some uses of REG_EQUIV might rely on it
6186 being attached to REG1 rather than REG2.
6188 This section previously turned the REG_EQUIV into a REG_EQUAL
6189 note. We cannot do that because REG_EQUIV may provide an
6190 uninitialized stack slot when REG_PARM_STACK_SPACE is used. */
6192 if (prev != 0 && GET_CODE (prev) == INSN
6193 && GET_CODE (PATTERN (prev)) == SET
6194 && SET_DEST (PATTERN (prev)) == SET_SRC (sets[0].rtl)
6195 && ! find_reg_note (prev, REG_EQUIV, NULL_RTX))
6197 rtx dest = SET_DEST (sets[0].rtl);
6198 rtx src = SET_SRC (sets[0].rtl);
6199 rtx note;
6201 validate_change (prev, &SET_DEST (PATTERN (prev)), dest, 1);
6202 validate_change (insn, &SET_DEST (sets[0].rtl), src, 1);
6203 validate_change (insn, &SET_SRC (sets[0].rtl), dest, 1);
6204 apply_change_group ();
6206 /* If INSN has a REG_EQUAL note, and this note mentions
6207 REG0, then we must delete it, because the value in
6208 REG0 has changed. If the note's value is REG1, we must
6209 also delete it because that is now this insn's dest. */
6210 note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
6211 if (note != 0
6212 && (reg_mentioned_p (dest, XEXP (note, 0))
6213 || rtx_equal_p (src, XEXP (note, 0))))
6214 remove_note (insn, note);
6219 /* If this is a conditional jump insn, record any known equivalences due to
6220 the condition being tested. */
6222 last_jump_equiv_class = 0;
6223 if (GET_CODE (insn) == JUMP_INSN
6224 && n_sets == 1 && GET_CODE (x) == SET
6225 && GET_CODE (SET_SRC (x)) == IF_THEN_ELSE)
6226 record_jump_equiv (insn, 0);
6228 #ifdef HAVE_cc0
6229 /* If the previous insn set CC0 and this insn no longer references CC0,
6230 delete the previous insn. Here we use the fact that nothing expects CC0
6231 to be valid over an insn, which is true until the final pass. */
6232 if (prev_insn && GET_CODE (prev_insn) == INSN
6233 && (tem = single_set (prev_insn)) != 0
6234 && SET_DEST (tem) == cc0_rtx
6235 && ! reg_mentioned_p (cc0_rtx, x))
6236 delete_insn (prev_insn);
6238 prev_insn_cc0 = this_insn_cc0;
6239 prev_insn_cc0_mode = this_insn_cc0_mode;
6240 prev_insn = insn;
6241 #endif
6244 /* Remove from the hash table all expressions that reference memory. */
6246 static void
6247 invalidate_memory (void)
6249 int i;
6250 struct table_elt *p, *next;
6252 for (i = 0; i < HASH_SIZE; i++)
6253 for (p = table[i]; p; p = next)
6255 next = p->next_same_hash;
6256 if (p->in_memory)
6257 remove_from_table (p, i);
6261 /* If ADDR is an address that implicitly affects the stack pointer, return
6262 1 and update the register tables to show the effect. Else, return 0. */
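/* For example, a push address such as (pre_dec (reg sp)) or
   (post_inc (reg sp)) is in rtx class 'a' and implicitly modifies
   the stack pointer.  */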
6264 static int
6265 addr_affects_sp_p (rtx addr)
6267 if (GET_RTX_CLASS (GET_CODE (addr)) == 'a'
6268 && GET_CODE (XEXP (addr, 0)) == REG
6269 && REGNO (XEXP (addr, 0)) == STACK_POINTER_REGNUM)
6271 if (REG_TICK (STACK_POINTER_REGNUM) >= 0)
6273 REG_TICK (STACK_POINTER_REGNUM)++;
6274 /* Is it possible to use a subreg of SP? */
6275 SUBREG_TICKED (STACK_POINTER_REGNUM) = -1;
6278 /* This should be *very* rare. */
6279 if (TEST_HARD_REG_BIT (hard_regs_in_table, STACK_POINTER_REGNUM))
6280 invalidate (stack_pointer_rtx, VOIDmode);
6282 return 1;
6285 return 0;
6288 /* Perform invalidation on the basis of everything about an insn
6289 except for invalidating the actual places that are SET in it.
6290 This includes the places CLOBBERed, and anything that might
6291 alias with something that is SET or CLOBBERed.
6293 X is the pattern of the insn. */
6295 static void
6296 invalidate_from_clobbers (rtx x)
6298 if (GET_CODE (x) == CLOBBER)
6300 rtx ref = XEXP (x, 0);
6301 if (ref)
6303 if (GET_CODE (ref) == REG || GET_CODE (ref) == SUBREG
6304 || GET_CODE (ref) == MEM)
6305 invalidate (ref, VOIDmode);
6306 else if (GET_CODE (ref) == STRICT_LOW_PART
6307 || GET_CODE (ref) == ZERO_EXTRACT)
6308 invalidate (XEXP (ref, 0), GET_MODE (ref));
6311 else if (GET_CODE (x) == PARALLEL)
6313 int i;
6314 for (i = XVECLEN (x, 0) - 1; i >= 0; i--)
6316 rtx y = XVECEXP (x, 0, i);
6317 if (GET_CODE (y) == CLOBBER)
6319 rtx ref = XEXP (y, 0);
6320 if (GET_CODE (ref) == REG || GET_CODE (ref) == SUBREG
6321 || GET_CODE (ref) == MEM)
6322 invalidate (ref, VOIDmode);
6323 else if (GET_CODE (ref) == STRICT_LOW_PART
6324 || GET_CODE (ref) == ZERO_EXTRACT)
6325 invalidate (XEXP (ref, 0), GET_MODE (ref));
6331 /* Process X, part of the REG_NOTES of an insn. Look at any REG_EQUAL notes
6332 and replace any registers in them with either an equivalent constant
6333 or the canonical form of the register. If we are inside an address,
6334 only do this if the address remains valid.
6336 OBJECT is 0 except when within a MEM in which case it is the MEM.
6338 Return the replacement for X. */
6340 static rtx
6341 cse_process_notes (rtx x, rtx object)
6343 enum rtx_code code = GET_CODE (x);
6344 const char *fmt = GET_RTX_FORMAT (code);
6345 int i;
6347 switch (code)
6349 case CONST_INT:
6350 case CONST:
6351 case SYMBOL_REF:
6352 case LABEL_REF:
6353 case CONST_DOUBLE:
6354 case CONST_VECTOR:
6355 case PC:
6356 case CC0:
6357 case LO_SUM:
6358 return x;
6360 case MEM:
6361 validate_change (x, &XEXP (x, 0),
6362 cse_process_notes (XEXP (x, 0), x), 0);
6363 return x;
6365 case EXPR_LIST:
6366 case INSN_LIST:
6367 if (REG_NOTE_KIND (x) == REG_EQUAL)
6368 XEXP (x, 0) = cse_process_notes (XEXP (x, 0), NULL_RTX);
6369 if (XEXP (x, 1))
6370 XEXP (x, 1) = cse_process_notes (XEXP (x, 1), NULL_RTX);
6371 return x;
6373 case SIGN_EXTEND:
6374 case ZERO_EXTEND:
6375 case SUBREG:
6377 rtx new = cse_process_notes (XEXP (x, 0), object);
6378 /* We don't substitute VOIDmode constants into these rtx,
6379 since they would impede folding. */
6380 if (GET_MODE (new) != VOIDmode)
6381 validate_change (object, &XEXP (x, 0), new, 0);
6382 return x;
6385 case REG:
6386 i = REG_QTY (REGNO (x));
6388 /* Return a constant or a constant register. */
6389 if (REGNO_QTY_VALID_P (REGNO (x)))
6391 struct qty_table_elem *ent = &qty_table[i];
6393 if (ent->const_rtx != NULL_RTX
6394 && (CONSTANT_P (ent->const_rtx)
6395 || GET_CODE (ent->const_rtx) == REG))
6397 rtx new = gen_lowpart_if_possible (GET_MODE (x), ent->const_rtx);
6398 if (new)
6399 return new;
6403 /* Otherwise, canonicalize this register. */
6404 return canon_reg (x, NULL_RTX);
6406 default:
6407 break;
6410 for (i = 0; i < GET_RTX_LENGTH (code); i++)
6411 if (fmt[i] == 'e')
6412 validate_change (object, &XEXP (x, i),
6413 cse_process_notes (XEXP (x, i), object), 0);
6415 return x;
6418 /* Find common subexpressions between the end test of a loop and the beginning
6419 of the loop. LOOP_START is the CODE_LABEL at the start of a loop.
6421 Often we have a loop where an expression in the exit test is used
6422 in the body of the loop. For example "while (*p) *q++ = *p++;".
6423 Because of the way we duplicate the loop exit test in front of the loop,
6424 however, we don't detect that common subexpression. This will be caught
6425 when global cse is implemented, but this is quite a common case.
6427 This function handles the most common cases of these common expressions.
6428 It is called after we have processed the basic block ending with the
6429 NOTE_INSN_LOOP_END note that ends a loop and the previous JUMP_INSN
6430 jumps to a label used only once. */
6432 static void
6433 cse_around_loop (rtx loop_start)
6435 rtx insn;
6436 int i;
6437 struct table_elt *p;
6439 /* If the jump at the end of the loop doesn't go to the start, we don't
6440 do anything. */
6441 for (insn = PREV_INSN (loop_start);
6442 insn && (GET_CODE (insn) == NOTE && NOTE_LINE_NUMBER (insn) >= 0);
6443 insn = PREV_INSN (insn))
6446 if (insn == 0
6447 || GET_CODE (insn) != NOTE
6448 || NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG)
6449 return;
6451 /* If the last insn of the loop (the end test) was an NE comparison,
6452 we will interpret it as an EQ comparison, since we fell through
6453 the loop. Any equivalences resulting from that comparison are
6454 therefore not valid and must be invalidated. */
6455 if (last_jump_equiv_class)
6456 for (p = last_jump_equiv_class->first_same_value; p;
6457 p = p->next_same_value)
6459 if (GET_CODE (p->exp) == MEM || GET_CODE (p->exp) == REG
6460 || (GET_CODE (p->exp) == SUBREG
6461 && GET_CODE (SUBREG_REG (p->exp)) == REG))
6462 invalidate (p->exp, VOIDmode);
6463 else if (GET_CODE (p->exp) == STRICT_LOW_PART
6464 || GET_CODE (p->exp) == ZERO_EXTRACT)
6465 invalidate (XEXP (p->exp, 0), GET_MODE (p->exp));
6468 /* Process insns starting after LOOP_START until we hit a CALL_INSN or
6469 a CODE_LABEL (we could handle a CALL_INSN, but it isn't worth it).
6471 The only thing we do with SET_DEST is invalidate entries, so we
6472 can safely process each SET in order. It is slightly less efficient
6473 to do so, but we only want to handle the most common cases.
6475 The gen_move_insn call in cse_set_around_loop may create new pseudos.
6476 These pseudos won't have valid entries in any of the tables indexed
6477 by register number, such as reg_qty. We avoid out-of-range array
6478 accesses by not processing any instructions created after cse started. */
6480 for (insn = NEXT_INSN (loop_start);
6481 GET_CODE (insn) != CALL_INSN && GET_CODE (insn) != CODE_LABEL
6482 && INSN_UID (insn) < max_insn_uid
6483 && ! (GET_CODE (insn) == NOTE
6484 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END);
6485 insn = NEXT_INSN (insn))
6487 if (INSN_P (insn)
6488 && (GET_CODE (PATTERN (insn)) == SET
6489 || GET_CODE (PATTERN (insn)) == CLOBBER))
6490 cse_set_around_loop (PATTERN (insn), insn, loop_start);
6491 else if (INSN_P (insn) && GET_CODE (PATTERN (insn)) == PARALLEL)
6492 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
6493 if (GET_CODE (XVECEXP (PATTERN (insn), 0, i)) == SET
6494 || GET_CODE (XVECEXP (PATTERN (insn), 0, i)) == CLOBBER)
6495 cse_set_around_loop (XVECEXP (PATTERN (insn), 0, i), insn,
6496 loop_start);
6500 /* Process one SET of an insn that was skipped. We ignore CLOBBERs
6501 since they are done elsewhere. This function is called via note_stores. */
6503 static void
6504 invalidate_skipped_set (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
6506 enum rtx_code code = GET_CODE (dest);
6508 if (code == MEM
6509 && ! addr_affects_sp_p (dest) /* If this is not a stack push ... */
6510 /* There are times when an address can appear varying and be a PLUS
6511 during this scan when it would be a fixed address were we to know
6512 the proper equivalences. So invalidate all memory if there is
6513 a BLKmode or nonscalar memory reference or a reference to a
6514 variable address. */
6515 && (MEM_IN_STRUCT_P (dest) || GET_MODE (dest) == BLKmode
6516 || cse_rtx_varies_p (XEXP (dest, 0), 0)))
6518 invalidate_memory ();
6519 return;
6522 if (GET_CODE (set) == CLOBBER
6523 || CC0_P (dest)
6524 || dest == pc_rtx)
6525 return;
6527 if (code == STRICT_LOW_PART || code == ZERO_EXTRACT)
6528 invalidate (XEXP (dest, 0), GET_MODE (dest));
6529 else if (code == REG || code == SUBREG || code == MEM)
6530 invalidate (dest, VOIDmode);
6533 /* Invalidate all insns from START up to the end of the function or the
6534 next label. This is called when we wish to CSE around a block that is
6535 conditionally executed. */
6537 static void
6538 invalidate_skipped_block (rtx start)
6540 rtx insn;
6542 for (insn = start; insn && GET_CODE (insn) != CODE_LABEL;
6543 insn = NEXT_INSN (insn))
6545 if (! INSN_P (insn))
6546 continue;
6548 if (GET_CODE (insn) == CALL_INSN)
6550 if (! CONST_OR_PURE_CALL_P (insn))
6551 invalidate_memory ();
6552 invalidate_for_call ();
6555 invalidate_from_clobbers (PATTERN (insn));
6556 note_stores (PATTERN (insn), invalidate_skipped_set, NULL);
6560 /* If modifying X will modify the value in *DATA (which is really an
6561 `rtx *'), indicate that fact by setting the pointed-to value to
6562 NULL_RTX. */
6564 static void
6565 cse_check_loop_start (rtx x, rtx set ATTRIBUTE_UNUSED, void *data)
6567 rtx *cse_check_loop_start_value = (rtx *) data;
6569 if (*cse_check_loop_start_value == NULL_RTX
6570 || GET_CODE (x) == CC0 || GET_CODE (x) == PC)
6571 return;
6573 if ((GET_CODE (x) == MEM && GET_CODE (*cse_check_loop_start_value) == MEM)
6574 || reg_overlap_mentioned_p (x, *cse_check_loop_start_value))
6575 *cse_check_loop_start_value = NULL_RTX;
6578 /* X is a SET or CLOBBER contained in INSN that was found near the start of
6579 a loop that starts with the label at LOOP_START.
6581 If X is a SET, we see if its SET_SRC is currently in our hash table.
6582 If so, we see if it has a value equal to some register used only in the
6583 loop exit code (as marked by jump.c).
6585 If those two conditions are true, we search backwards from the start of
6586 the loop to see if that same value was loaded into a register that still
6587 retains its value at the start of the loop.
6589 If so, we insert an insn after the load to copy the destination of that
6590 load into the equivalent register and (try to) replace our SET_SRC with that
6591 register.
6593 In any event, we invalidate whatever this SET or CLOBBER modifies. */
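/* A sketch of the transformation (insns and register numbers
   hypothetical), where (reg 150) is a loop-exit-test register whose
   class contains the value of (mem X):

       (set (reg 200) (mem X))       ; found before LOOP_START
     LOOP_START:
       (set (reg 201) (mem X))       ; X unchanged in between

   becomes

       (set (reg 200) (mem X))
       (set (reg 150) (reg 200))     ; inserted copy
     LOOP_START:
       (set (reg 201) (reg 150))     ; SET_SRC replaced  */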
6595 static void
6596 cse_set_around_loop (rtx x, rtx insn, rtx loop_start)
6598 struct table_elt *src_elt;
6600 /* If this is a SET, see if we can replace SET_SRC, but ignore SETs that
6601 are setting PC or CC0 or whose SET_SRC is already a register. */
6602 if (GET_CODE (x) == SET
6603 && GET_CODE (SET_DEST (x)) != PC && GET_CODE (SET_DEST (x)) != CC0
6604 && GET_CODE (SET_SRC (x)) != REG)
6606 src_elt = lookup (SET_SRC (x),
6607 HASH (SET_SRC (x), GET_MODE (SET_DEST (x))),
6608 GET_MODE (SET_DEST (x)));
6610 if (src_elt)
6611 for (src_elt = src_elt->first_same_value; src_elt;
6612 src_elt = src_elt->next_same_value)
6613 if (GET_CODE (src_elt->exp) == REG && REG_LOOP_TEST_P (src_elt->exp)
6614 && COST (src_elt->exp) < COST (SET_SRC (x)))
6616 rtx p, set;
6618 /* Look for an insn in front of LOOP_START that sets
6619 something in the desired mode to SET_SRC (x) before we hit
6620 a label or CALL_INSN. */
6622 for (p = prev_nonnote_insn (loop_start);
6623 p && GET_CODE (p) != CALL_INSN
6624 && GET_CODE (p) != CODE_LABEL;
6625 p = prev_nonnote_insn (p))
6626 if ((set = single_set (p)) != 0
6627 && GET_CODE (SET_DEST (set)) == REG
6628 && GET_MODE (SET_DEST (set)) == src_elt->mode
6629 && rtx_equal_p (SET_SRC (set), SET_SRC (x)))
6631 /* We now have to ensure that nothing between P
6632 and LOOP_START modified anything referenced in
6633 SET_SRC (x). We know that nothing within the loop
6634 can modify it, or we would have invalidated it in
6635 the hash table. */
6636 rtx q;
6637 rtx cse_check_loop_start_value = SET_SRC (x);
6638 for (q = p; q != loop_start; q = NEXT_INSN (q))
6639 if (INSN_P (q))
6640 note_stores (PATTERN (q),
6641 cse_check_loop_start,
6642 &cse_check_loop_start_value);
6644 /* If nothing was changed and we can replace our
6645 SET_SRC, add an insn after P to copy its destination
6646 to what we will be replacing SET_SRC with. */
6647 if (cse_check_loop_start_value
6648 && single_set (p)
6649 && !can_throw_internal (insn)
6650 && validate_change (insn, &SET_SRC (x),
6651 src_elt->exp, 0))
6653 /* If this creates new pseudos, this is unsafe,
6654 because the regno of the new pseudo is unsuitable
6655 as an index into reg_qty when cse_insn processes
6656 the new insn. Therefore, if a new pseudo was
6657 created, discard this optimization. */
6658 int nregs = max_reg_num ();
6659 rtx move
6660 = gen_move_insn (src_elt->exp, SET_DEST (set));
6661 if (nregs != max_reg_num ())
6663 if (! validate_change (insn, &SET_SRC (x),
6664 SET_SRC (set), 0))
6665 abort ();
6667 else
6668 emit_insn_after (move, p);
6670 break;
6675 /* Deal with the destination of X affecting the stack pointer. */
6676 addr_affects_sp_p (SET_DEST (x));
6678 /* See comment on similar code in cse_insn for explanation of these
6679 tests. */
6680 if (GET_CODE (SET_DEST (x)) == REG || GET_CODE (SET_DEST (x)) == SUBREG
6681 || GET_CODE (SET_DEST (x)) == MEM)
6682 invalidate (SET_DEST (x), VOIDmode);
6683 else if (GET_CODE (SET_DEST (x)) == STRICT_LOW_PART
6684 || GET_CODE (SET_DEST (x)) == ZERO_EXTRACT)
6685 invalidate (XEXP (SET_DEST (x), 0), GET_MODE (SET_DEST (x)));
6688 /* Find the end of INSN's basic block and return its range,
6689 the total number of SETs in all the insns of the block, the last insn of the
6690 block, and the branch path.
6692 The branch path indicates which branches should be followed. If a nonzero
6693 path size is specified, the block should be rescanned and a different set
6694 of branches will be taken. The branch path is only used if
6695 FLAG_CSE_FOLLOW_JUMPS or FLAG_CSE_SKIP_BLOCKS is nonzero.
6697 DATA is a pointer to a struct cse_basic_block_data, defined below, that is
6698 used to describe the block. It is filled in with the information about
6699 the current block. The incoming structure's branch path, if any, is used
6700 to construct the output branch path. */
6702 void
6703 cse_end_of_basic_block (rtx insn, struct cse_basic_block_data *data,
6704 int follow_jumps, int after_loop, int skip_blocks)
6706 rtx p = insn, q;
6707 int nsets = 0;
6708 int low_cuid = INSN_CUID (insn), high_cuid = INSN_CUID (insn);
6709 rtx next = INSN_P (insn) ? insn : next_real_insn (insn);
6710 int path_size = data->path_size;
6711 int path_entry = 0;
6712 int i;
6714 /* Update the previous branch path, if any. If the last branch was
6715 previously TAKEN, mark it NOT_TAKEN. If it was previously NOT_TAKEN,
6716 shorten the path by one and look at the previous branch. We know that
6717 at least one branch must have been taken if PATH_SIZE is nonzero. */
6718 while (path_size > 0)
6720 if (data->path[path_size - 1].status != NOT_TAKEN)
6722 data->path[path_size - 1].status = NOT_TAKEN;
6723 break;
6725 else
6726 path_size--;
6729 /* If the first instruction is marked with QImode, that means we've
6730 already processed this block. Our caller will look at DATA->LAST
6731 to figure out where to go next. We want to return the next block
6732 in the instruction stream, not some branched-to block somewhere
6733 else. We accomplish this by pretending our caller forbade us to
6734 follow jumps or skip blocks. */
6735 if (GET_MODE (insn) == QImode)
6736 follow_jumps = skip_blocks = 0;
6738 /* Scan to end of this basic block. */
6739 while (p && GET_CODE (p) != CODE_LABEL)
6741 /* Don't cse out the end of a loop. This makes a difference
6742 only for the unusual loops that always execute at least once;
6743 all other loops have labels there so we will stop in any case.
6744 Cse'ing out the end of the loop is dangerous because it
6745 might cause an invariant expression inside the loop
6746 to be reused after the end of the loop. This would make it
6747 hard to move the expression out of the loop in loop.c,
6748 especially if it is one of several equivalent expressions
6749 and loop.c would like to eliminate it.
6751 If we are running after loop.c has finished, we can ignore
6752 the NOTE_INSN_LOOP_END. */
6754 if (! after_loop && GET_CODE (p) == NOTE
6755 && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
6756 break;
6758 /* Don't cse over a call to setjmp; on some machines (e.g. VAX)
6759 the regs restored by the longjmp come from
6760 a later time than the setjmp. */
6761 if (PREV_INSN (p) && GET_CODE (PREV_INSN (p)) == CALL_INSN
6762 && find_reg_note (PREV_INSN (p), REG_SETJMP, NULL))
6763 break;
6765 /* A PARALLEL can have lots of SETs in it,
6766 especially if it is really an ASM_OPERANDS. */
6767 if (INSN_P (p) && GET_CODE (PATTERN (p)) == PARALLEL)
6768 nsets += XVECLEN (PATTERN (p), 0);
6769 else if (GET_CODE (p) != NOTE)
6770 nsets += 1;
6772 /* Ignore insns made by CSE; they cannot affect the boundaries of
6773 the basic block. */
6775 if (INSN_UID (p) <= max_uid && INSN_CUID (p) > high_cuid)
6776 high_cuid = INSN_CUID (p);
6777 if (INSN_UID (p) <= max_uid && INSN_CUID (p) < low_cuid)
6778 low_cuid = INSN_CUID (p);
6780 /* See if this insn is in our branch path. If it is and we are to
6781 take it, do so. */
6782 if (path_entry < path_size && data->path[path_entry].branch == p)
6784 if (data->path[path_entry].status != NOT_TAKEN)
6785 p = JUMP_LABEL (p);
6787 /* Point to next entry in path, if any. */
6788 path_entry++;
6791 /* If this is a conditional jump, we can follow it if -fcse-follow-jumps
6792 was specified, we haven't reached our maximum path length, there are
6793 insns following the target of the jump, this is the only use of the
6794 jump label, and the target label is preceded by a BARRIER.
6796 Alternatively, we can follow the jump if it branches around a
6797 block of code and there are no other branches into the block.
6798 In this case invalidate_skipped_block will be called to invalidate any
6799 registers set in the block when following the jump. */
6801 else if ((follow_jumps || skip_blocks) && path_size < PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH) - 1
6802 && GET_CODE (p) == JUMP_INSN
6803 && GET_CODE (PATTERN (p)) == SET
6804 && GET_CODE (SET_SRC (PATTERN (p))) == IF_THEN_ELSE
6805 && JUMP_LABEL (p) != 0
6806 && LABEL_NUSES (JUMP_LABEL (p)) == 1
6807 && NEXT_INSN (JUMP_LABEL (p)) != 0)
6809 for (q = PREV_INSN (JUMP_LABEL (p)); q; q = PREV_INSN (q))
6810 if ((GET_CODE (q) != NOTE
6811 || NOTE_LINE_NUMBER (q) == NOTE_INSN_LOOP_END
6812 || (PREV_INSN (q) && GET_CODE (PREV_INSN (q)) == CALL_INSN
6813 && find_reg_note (PREV_INSN (q), REG_SETJMP, NULL)))
6814 && (GET_CODE (q) != CODE_LABEL || LABEL_NUSES (q) != 0))
6815 break;
6817 /* If we ran into a BARRIER, this code is an extension of the
6818 basic block when the branch is taken. */
6819 if (follow_jumps && q != 0 && GET_CODE (q) == BARRIER)
6821 /* Don't allow ourselves to keep walking around an
6822 always-executed loop. */
6823 if (next_real_insn (q) == next)
6825 p = NEXT_INSN (p);
6826 continue;
6829 /* Similarly, don't put a branch in our path more than once. */
6830 for (i = 0; i < path_entry; i++)
6831 if (data->path[i].branch == p)
6832 break;
6834 if (i != path_entry)
6835 break;
6837 data->path[path_entry].branch = p;
6838 data->path[path_entry++].status = TAKEN;
6840 /* This branch now ends our path. It was possible that we
6841 didn't see this branch the last time around (when the
6842 insn in front of the target was a JUMP_INSN that was
6843 turned into a no-op). */
6844 path_size = path_entry;
6846 p = JUMP_LABEL (p);
6847 /* Mark block so we won't scan it again later. */
6848 PUT_MODE (NEXT_INSN (p), QImode);
6850 /* Detect a branch around a block of code. */
6851 else if (skip_blocks && q != 0 && GET_CODE (q) != CODE_LABEL)
6853 rtx tmp;
6855 if (next_real_insn (q) == next)
6857 p = NEXT_INSN (p);
6858 continue;
6861 for (i = 0; i < path_entry; i++)
6862 if (data->path[i].branch == p)
6863 break;
6865 if (i != path_entry)
6866 break;
6868 /* This is no_labels_between_p (p, q) with an added check for
6869 reaching the end of a function (in case Q precedes P). */
6870 for (tmp = NEXT_INSN (p); tmp && tmp != q; tmp = NEXT_INSN (tmp))
6871 if (GET_CODE (tmp) == CODE_LABEL)
6872 break;
6874 if (tmp == q)
6876 data->path[path_entry].branch = p;
6877 data->path[path_entry++].status = AROUND;
6879 path_size = path_entry;
6881 p = JUMP_LABEL (p);
6882 /* Mark block so we won't scan it again later. */
6883 PUT_MODE (NEXT_INSN (p), QImode);
6887 p = NEXT_INSN (p);
6890 data->low_cuid = low_cuid;
6891 data->high_cuid = high_cuid;
6892 data->nsets = nsets;
6893 data->last = p;
6895 /* If none of the jumps in the path were taken, set our path length
6896 to zero so a rescan won't be done. */
6897 for (i = path_size - 1; i >= 0; i--)
6898 if (data->path[i].status != NOT_TAKEN)
6899 break;
6901 if (i == -1)
6902 data->path_size = 0;
6903 else
6904 data->path_size = path_size;
6906 /* End the current branch path. */
6907 data->path[path_size].branch = 0;
6910 /* Perform cse on the instructions of a function.
6911 F is the first instruction.
6912 NREGS is one plus the highest pseudo-reg number used in the function.
6914 AFTER_LOOP is 1 if this is the cse call done after loop optimization
6915 (only if -frerun-cse-after-loop).
6917 Returns 1 if jump_optimize should be redone due to simplifications
6918 in conditional jump instructions. */
6921 cse_main (rtx f, int nregs, int after_loop, FILE *file)
6923 struct cse_basic_block_data val;
6924 rtx insn = f;
6925 int i;
6927 val.path = xmalloc (sizeof (struct branch_path)
6928 * PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH));
6930 cse_jumps_altered = 0;
6931 recorded_label_ref = 0;
6932 constant_pool_entries_cost = 0;
6933 val.path_size = 0;
6935 init_recog ();
6936 init_alias_analysis ();
6938 max_reg = nregs;
6940 max_insn_uid = get_max_uid ();
6942 reg_eqv_table = (struct reg_eqv_elem *)
6943 xmalloc (nregs * sizeof (struct reg_eqv_elem));
6945 #ifdef LOAD_EXTEND_OP
6947 /* Allocate scratch rtl here. cse_insn will fill in the memory reference
6948 and change the code and mode as appropriate. */
6949 memory_extend_rtx = gen_rtx_ZERO_EXTEND (VOIDmode, NULL_RTX);
6950 #endif
6952 /* Reset the counter indicating how many elements have been made
6953 thus far. */
6954 n_elements_made = 0;
6956 /* Find the largest uid. */
6958 max_uid = get_max_uid ();
6959 uid_cuid = (int *) xcalloc (max_uid + 1, sizeof (int));
6961 /* Compute the mapping from uids to cuids.
6962 CUIDs are numbers assigned to insns, like uids,
6963 except that cuids increase monotonically through the code.
6964 Don't assign cuids to line-number NOTEs, so that the distance in cuids
6965 between two insns is not affected by -g. */
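/* E.g. (uids hypothetical): an insn with uid 5, a line-number note
   with uid 6 and an insn with uid 7 receive cuids 1, 1 and 2, so the
   note contributes no distance.  */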
6967 for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
6969 if (GET_CODE (insn) != NOTE
6970 || NOTE_LINE_NUMBER (insn) < 0)
6971 INSN_CUID (insn) = ++i;
6972 else
6973 /* Give a line number note the same cuid as the preceding insn. */
6974 INSN_CUID (insn) = i;
6977 ggc_push_context ();
6979 /* Loop over basic blocks.
6980 Compute the maximum number of qty's needed for each basic block
6981 (which is 2 for each SET). */
6982 insn = f;
6983 while (insn)
6985 cse_altered = 0;
6986 cse_end_of_basic_block (insn, &val, flag_cse_follow_jumps, after_loop,
6987 flag_cse_skip_blocks);
6989 /* If this basic block was already processed or has no sets, skip it. */
6990 if (val.nsets == 0 || GET_MODE (insn) == QImode)
6992 PUT_MODE (insn, VOIDmode);
6993 insn = (val.last ? NEXT_INSN (val.last) : 0);
6994 val.path_size = 0;
6995 continue;
6998 cse_basic_block_start = val.low_cuid;
6999 cse_basic_block_end = val.high_cuid;
7000 max_qty = val.nsets * 2;
7002 if (file)
7003 fnotice (file, ";; Processing block from %d to %d, %d sets.\n",
7004 INSN_UID (insn), val.last ? INSN_UID (val.last) : 0,
7005 val.nsets);
7007 /* Make MAX_QTY bigger to give us room to optimize
7008 past the end of this basic block, if that should prove useful. */
7009 if (max_qty < 500)
7010 max_qty = 500;
7012 max_qty += max_reg;
7014 /* If this basic block is being extended by following certain jumps,
7015 (see `cse_end_of_basic_block'), we reprocess the code from the start.
7016 Otherwise, we start after this basic block. */
7017 if (val.path_size > 0)
7018 cse_basic_block (insn, val.last, val.path, 0);
7019 else
7021 int old_cse_jumps_altered = cse_jumps_altered;
7022 rtx temp;
7024 /* When cse changes a conditional jump to an unconditional
7025 jump, we want to reprocess the block, since it will give
7026 us a new branch path to investigate. */
7027 cse_jumps_altered = 0;
7028 temp = cse_basic_block (insn, val.last, val.path, ! after_loop);
7029 if (cse_jumps_altered == 0
7030 || (flag_cse_follow_jumps == 0 && flag_cse_skip_blocks == 0))
7031 insn = temp;
7033 cse_jumps_altered |= old_cse_jumps_altered;
7036 if (cse_altered)
7037 ggc_collect ();
7039 #ifdef USE_C_ALLOCA
7040 alloca (0);
7041 #endif
7044 ggc_pop_context ();
7046 if (max_elements_made < n_elements_made)
7047 max_elements_made = n_elements_made;
7049 /* Clean up. */
7050 end_alias_analysis ();
7051 free (uid_cuid);
7052 free (reg_eqv_table);
7053 free (val.path);
7055 return cse_jumps_altered || recorded_label_ref;
7058 /* Process a single basic block. FROM and TO are the limits of the basic
7059 block. NEXT_BRANCH points to the branch path when following jumps or
7060 a null path when not following jumps.
7062 AROUND_LOOP is nonzero if we are to try to cse around to the start of a
7063 loop. This is true when we are being called for the last time on a
7064 block and this CSE pass is before loop.c. */
7066 static rtx
7067 cse_basic_block (rtx from, rtx to, struct branch_path *next_branch,
7068 int around_loop)
7070 rtx insn;
7071 int to_usage = 0;
7072 rtx libcall_insn = NULL_RTX;
7073 int num_insns = 0;
7075 /* This array is undefined before max_reg, so only allocate
7076 the space actually needed and adjust the start. */
7078 qty_table
7079 = (struct qty_table_elem *) xmalloc ((max_qty - max_reg)
7080 * sizeof (struct qty_table_elem));
7081 qty_table -= max_reg;
7083 new_basic_block ();
7085 /* TO might be a label. If so, protect it from being deleted. */
7086 if (to != 0 && GET_CODE (to) == CODE_LABEL)
7087 ++LABEL_NUSES (to);
7089 for (insn = from; insn != to; insn = NEXT_INSN (insn))
7091 enum rtx_code code = GET_CODE (insn);
7093 /* If we have processed 1,000 insns, flush the hash table to
7094 avoid extreme quadratic behavior. We must not include NOTEs
7095 in the count since there may be more of them when generating
7096 debugging information. If we clear the table at different
7097 times, code generated with -g -O might be different from code
7098 generated with -O but not -g.
7100 ??? This is a real kludge and needs to be done some other way.
7101 Perhaps for 2.9. */
7102 if (code != NOTE && num_insns++ > 1000)
7104 flush_hash_table ();
7105 num_insns = 0;
7108 /* See if this is a branch that is part of the path. If so, and it is
7109 to be taken, do so. */
7110 if (next_branch->branch == insn)
7112 enum taken status = next_branch++->status;
7113 if (status != NOT_TAKEN)
7115 if (status == TAKEN)
7116 record_jump_equiv (insn, 1);
7117 else
7118 invalidate_skipped_block (NEXT_INSN (insn));
7120 /* Set the last insn as the jump insn; it doesn't affect cc0.
7121 Then follow this branch. */
7122 #ifdef HAVE_cc0
7123 prev_insn_cc0 = 0;
7124 prev_insn = insn;
7125 #endif
7126 insn = JUMP_LABEL (insn);
7127 continue;
7131 if (GET_MODE (insn) == QImode)
7132 PUT_MODE (insn, VOIDmode);
7134 if (GET_RTX_CLASS (code) == 'i')
7136 rtx p;
7138 /* Process notes first so we have all notes in canonical forms when
7139 looking for duplicate operations. */
7141 if (REG_NOTES (insn))
7142 REG_NOTES (insn) = cse_process_notes (REG_NOTES (insn), NULL_RTX);
7144 /* Track when we are inside a LIBCALL block. Inside such a block,
7145 we do not want to record destinations. The last insn of a
7146 LIBCALL block is not considered to be part of the block, since
7147 its destination is the result of the block and hence should be
7148 recorded. */
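/* Sketch of a LIBCALL block (insns hypothetical):
       (insn A ... (REG_LIBCALL -> insn C))   ; starts the block
       (insn B ...)                           ; destinations not recorded
       (insn C ... (REG_RETVAL -> insn A))    ; result, recorded normally  */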
7150 if (REG_NOTES (insn) != 0)
7152 if ((p = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
7153 libcall_insn = XEXP (p, 0);
7154 else if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
7155 libcall_insn = 0;
7158 cse_insn (insn, libcall_insn);
7160 /* If we haven't already found an insn where we added a LABEL_REF,
7161 check this one. */
7162 if (GET_CODE (insn) == INSN && ! recorded_label_ref
7163 && for_each_rtx (&PATTERN (insn), check_for_label_ref,
7164 (void *) insn))
7165 recorded_label_ref = 1;
7168 /* If INSN is now an unconditional jump, skip to the end of our
7169 basic block by pretending that we just did the last insn in the
7170 basic block. If we are jumping to the end of our block, show
7171 that we can have one usage of TO. */
7173 if (any_uncondjump_p (insn))
7175 if (to == 0)
7177 free (qty_table + max_reg);
7178 return 0;
7181 if (JUMP_LABEL (insn) == to)
7182 to_usage = 1;
7184 /* Maybe TO was deleted because the jump is unconditional.
7185 If so, there is nothing left in this basic block. */
7186 /* ??? Perhaps it would be smarter to set TO
7187 to whatever follows this insn,
7188 and pretend the basic block had always ended here. */
7189 if (INSN_DELETED_P (to))
7190 break;
7192 insn = PREV_INSN (to);
7195 /* See if it is ok to keep on going past the label
7196 which used to end our basic block. Remember that we incremented
7197 the count of that label, so we decrement it here. If we made
7198 a jump unconditional, TO_USAGE will be one; in that case, we don't
7199 want to count the use in that jump. */
7201 if (to != 0 && NEXT_INSN (insn) == to
7202 && GET_CODE (to) == CODE_LABEL && --LABEL_NUSES (to) == to_usage)
7204 struct cse_basic_block_data val;
7205 rtx prev;
7207 insn = NEXT_INSN (to);
7209 /* If TO was the last insn in the function, we are done. */
7210 if (insn == 0)
7212 free (qty_table + max_reg);
7213 return 0;
7216 /* If TO was preceded by a BARRIER we are done with this block
7217 because it has no continuation. */
7218 prev = prev_nonnote_insn (to);
7219 if (prev && GET_CODE (prev) == BARRIER)
7221 free (qty_table + max_reg);
7222 return insn;
7225 /* Find the end of the following block. Note that we won't be
7226 following branches in this case. */
7227 to_usage = 0;
7228 val.path_size = 0;
7229 val.path = xmalloc (sizeof (struct branch_path)
7230 * PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH));
7231 cse_end_of_basic_block (insn, &val, 0, 0, 0);
7232 free (val.path);
7234 /* If the tables we allocated have enough space left
7235 to handle all the SETs in the next basic block,
7236 continue through it. Otherwise, return,
7237 and that block will be scanned individually. */
7238 if (val.nsets * 2 + next_qty > max_qty)
7239 break;
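/* Editor's note on the check above: each SET can require at most two
   fresh quantity numbers (roughly, one for its destination and one
   for a source value not yet in the table), so val.nsets * 2 bounds
   what the next block can consume.  E.g. if max_qty - next_qty == 50
   slots remain and the next block has nsets == 30, the worst case of
   60 new quantities will not fit and we stop here.  */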
7241 cse_basic_block_start = val.low_cuid;
7242 cse_basic_block_end = val.high_cuid;
7243 to = val.last;
7245 /* Prevent TO from being deleted if it is a label. */
7246 if (to != 0 && GET_CODE (to) == CODE_LABEL)
7247 ++LABEL_NUSES (to);
7249 /* Back up so we process the first insn in the extension. */
7250 insn = PREV_INSN (insn);
7254 if (next_qty > max_qty)
7255 abort ();
7257 /* If we are running before loop.c, we stopped on a NOTE_INSN_LOOP_END, and
7258 the previous insn is the only insn that branches to the head of a loop,
7259 then we can cse into the loop. Don't do this if we changed the jump
7260 structure of a loop unless we aren't going to be following jumps. */
7262 insn = prev_nonnote_insn (to);
7263 if ((cse_jumps_altered == 0
7264 || (flag_cse_follow_jumps == 0 && flag_cse_skip_blocks == 0))
7265 && around_loop && to != 0
7266 && GET_CODE (to) == NOTE && NOTE_LINE_NUMBER (to) == NOTE_INSN_LOOP_END
7267 && GET_CODE (insn) == JUMP_INSN
7268 && JUMP_LABEL (insn) != 0
7269 && LABEL_NUSES (JUMP_LABEL (insn)) == 1)
7270 cse_around_loop (JUMP_LABEL (insn));
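/* Editor's sketch (hypothetical layout) of what the condition above
   matches:

       L2:                            ; loop head, LABEL_NUSES == 1
         ... loop body ...
       insn:  (jump_insn ... -> L2)   ; the only jump to L2
       to:    NOTE_INSN_LOOP_END      ; where this pass stopped

   Since no other jump targets L2, cse_around_loop can safely extend
   some of the equivalences known here into the loop body.  */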
7272 free (qty_table + max_reg);
7274 return to ? NEXT_INSN (to) : 0;
7277 /* Called via for_each_rtx to see if an insn is using a LABEL_REF for which
7278 there isn't a REG_LABEL note. Return one if so. DATA is the insn. */
7280 static int
7281 check_for_label_ref (rtx *rtl, void *data)
7283 rtx insn = (rtx) data;
7285 /* If this insn uses a LABEL_REF and there isn't a REG_LABEL note for it,
7286 we must rerun jump since it needs to place the note. If this is a
7287 LABEL_REF for a CODE_LABEL that isn't in the insn chain, don't do this
7288 since no REG_LABEL will be added. */
7289 return (GET_CODE (*rtl) == LABEL_REF
7290 && ! LABEL_REF_NONLOCAL_P (*rtl)
7291 && LABEL_P (XEXP (*rtl, 0))
7292 && INSN_UID (XEXP (*rtl, 0)) != 0
7293 && ! find_reg_note (insn, REG_LABEL, XEXP (*rtl, 0)));
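/* Editor's example of an insn this predicate matches (schematic):

       (insn 30 ... (set (reg 120) (label_ref L5)))

   Here the label's address is used as data rather than as a jump
   target.  If no REG_LABEL note records that use, jump must be rerun
   to add one, which is why cse_basic_block sets recorded_label_ref
   when this returns nonzero.  */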
7296 /* Count the number of times registers are used (not set) in X.
7297 COUNTS is an array in which we accumulate the count; INCR is the
7298 amount added to the count for each usage.
7300 Don't count a usage of DEST, which is the SET_DEST of a SET which
7301 contains X in its SET_SRC. This is because such a SET does not
7302 modify the liveness of DEST. */
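/* Editor's worked example for the DEST rule (schematic):

       (set (reg 100) (plus (reg 100) (const_int 1)))

   Counting the SET_SRC with DEST == (reg 100) makes the source
   occurrence of (reg 100) contribute nothing to counts[100].  If
   nothing else reads reg 100, counts[100] stays zero and the
   self-increment can be deleted; counting the source use would have
   kept such an insn alive forever.  */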
7304 static void
7305 count_reg_usage (rtx x, int *counts, rtx dest, int incr)
7307 enum rtx_code code;
7308 rtx note;
7309 const char *fmt;
7310 int i, j;
7312 if (x == 0)
7313 return;
7315 switch (code = GET_CODE (x))
7317 case REG:
7318 if (x != dest)
7319 counts[REGNO (x)] += incr;
7320 return;
7322 case PC:
7323 case CC0:
7324 case CONST:
7325 case CONST_INT:
7326 case CONST_DOUBLE:
7327 case CONST_VECTOR:
7328 case SYMBOL_REF:
7329 case LABEL_REF:
7330 return;
7332 case CLOBBER:
7333 /* If we are clobbering a MEM, mark any registers inside the address
7334 as being used. */
7335 if (GET_CODE (XEXP (x, 0)) == MEM)
7336 count_reg_usage (XEXP (XEXP (x, 0), 0), counts, NULL_RTX, incr);
7337 return;
7339 case SET:
7340 /* Unless we are setting a REG, count everything in SET_DEST. */
7341 if (GET_CODE (SET_DEST (x)) != REG)
7342 count_reg_usage (SET_DEST (x), counts, NULL_RTX, incr);
7343 count_reg_usage (SET_SRC (x), counts,
7344 SET_DEST (x),
7345 incr);
7346 return;
7348 case CALL_INSN:
7349 count_reg_usage (CALL_INSN_FUNCTION_USAGE (x), counts, NULL_RTX, incr);
7350 /* Fall through. */
7352 case INSN:
7353 case JUMP_INSN:
7354 count_reg_usage (PATTERN (x), counts, NULL_RTX, incr);
7356 /* Things used in a REG_EQUAL note aren't dead, since loop.c may try to
7357 use them. */
7359 note = find_reg_equal_equiv_note (x);
7360 if (note)
7362 rtx eqv = XEXP (note, 0);
7364 if (GET_CODE (eqv) == EXPR_LIST)
7365 /* This REG_EQUAL note describes the result of a function call.
7366 Process all the arguments. */
7367 do
7369 count_reg_usage (XEXP (eqv, 0), counts, NULL_RTX, incr);
7370 eqv = XEXP (eqv, 1);
7372 while (eqv && GET_CODE (eqv) == EXPR_LIST);
7373 else
7374 count_reg_usage (eqv, counts, NULL_RTX, incr);
7376 return;
7378 case EXPR_LIST:
7379 if (REG_NOTE_KIND (x) == REG_EQUAL
7380 || (REG_NOTE_KIND (x) != REG_NONNEG && GET_CODE (XEXP (x,0)) == USE)
7381 /* FUNCTION_USAGE expression lists may include (CLOBBER (mem /u)),
7382 involving registers in the address. */
7383 || GET_CODE (XEXP (x, 0)) == CLOBBER)
7384 count_reg_usage (XEXP (x, 0), counts, NULL_RTX, incr);
7386 count_reg_usage (XEXP (x, 1), counts, NULL_RTX, incr);
7387 return;
7389 case INSN_LIST:
7390 abort ();
7392 default:
7393 break;
7396 fmt = GET_RTX_FORMAT (code);
7397 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
7399 if (fmt[i] == 'e')
7400 count_reg_usage (XEXP (x, i), counts, dest, incr);
7401 else if (fmt[i] == 'E')
7402 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
7403 count_reg_usage (XVECEXP (x, i, j), counts, dest, incr);
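/* Editor's note: the loop above walks X generically.  The string from
   GET_RTX_FORMAT names each operand's kind; e.g. PLUS has format "ee",
   so for (plus (reg 1) (reg 2)) both XEXP operands are scanned, while
   an 'E' operand such as a PARALLEL's body is a vector whose XVECEXP
   elements are scanned in turn.  DEST is propagated so that the
   exemption for DEST applies at any depth inside a SET_SRC.  */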
7407 /* Return true if SET is live. */
7408 static bool
7409 set_live_p (rtx set, rtx insn ATTRIBUTE_UNUSED, /* Only used with HAVE_cc0. */
7410 int *counts)
7412 #ifdef HAVE_cc0
7413 rtx tem;
7414 #endif
7416 if (set_noop_p (set))
7417 ;
7419 #ifdef HAVE_cc0
7420 else if (GET_CODE (SET_DEST (set)) == CC0
7421 && !side_effects_p (SET_SRC (set))
7422 && ((tem = next_nonnote_insn (insn)) == 0
7423 || !INSN_P (tem)
7424 || !reg_referenced_p (cc0_rtx, PATTERN (tem))))
7425 return false;
7426 #endif
7427 else if (GET_CODE (SET_DEST (set)) != REG
7428 || REGNO (SET_DEST (set)) < FIRST_PSEUDO_REGISTER
7429 || counts[REGNO (SET_DEST (set))] != 0
7430 || side_effects_p (SET_SRC (set))
7431 /* An ADDRESSOF expression can turn into a use of the
7432 internal arg pointer, so always consider the
7433 internal arg pointer live. If it is truly dead,
7434 flow will delete the initializing insn. */
7435 || (SET_DEST (set) == current_function_internal_arg_pointer))
7436 return true;
7437 return false;
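/* Editor's examples for set_live_p (schematic):

       (set (reg 100) (reg 100))   ; no-op: caught by set_noop_p, dead
       (set (cc0) (reg 100))       ; dead if the next real insn does
                                   ; not look at cc0
       (set (reg 100) (reg 101))   ; live only while counts[100] != 0

   Hard-register destinations (REGNO < FIRST_PSEUDO_REGISTER) are
   conservatively treated as live, since COUNTS does not track their
   implicit uses.  */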
7440 /* Return true if INSN is live. */
7442 static bool
7443 insn_live_p (rtx insn, int *counts)
7445 int i;
7446 if (flag_non_call_exceptions && may_trap_p (PATTERN (insn)))
7447 return true;
7448 else if (GET_CODE (PATTERN (insn)) == SET)
7449 return set_live_p (PATTERN (insn), insn, counts);
7450 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
7452 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
7454 rtx elt = XVECEXP (PATTERN (insn), 0, i);
7456 if (GET_CODE (elt) == SET)
7458 if (set_live_p (elt, insn, counts))
7459 return true;
7461 else if (GET_CODE (elt) != CLOBBER && GET_CODE (elt) != USE)
7462 return true;
7464 return false;
7466 else
7467 return true;
7470 /* Return true if the libcall containing INSN is dead as a whole. */
7472 static bool
7473 dead_libcall_p (rtx insn, int *counts)
7475 rtx note, set, new;
7477 /* See if there's a REG_EQUAL note on this insn and try to
7478 replace the source with the REG_EQUAL expression.
7480 We assume that insns with REG_RETVALs can only be reg->reg
7481 copies at this point. */
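/* Editor's sketch of the rewrite attempted below (schematic):

       before:  (set (reg 103) (reg 200))
                   with REG_RETVAL and REG_EQUAL (mult (reg 97) (reg 98))
       after:   (set (reg 103) (mult (reg 97) (reg 98)))

   Once the source no longer mentions the libcall's result register,
   the copy stands on its own; the bracketing notes are removed and
   the rest of the block becomes deletable as dead code.  */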
7482 note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
7483 if (!note)
7484 return false;
7486 set = single_set (insn);
7487 if (!set)
7488 return false;
7490 new = simplify_rtx (XEXP (note, 0));
7491 if (!new)
7492 new = XEXP (note, 0);
7494 /* While changing insn, we must update the counts accordingly. */
7495 count_reg_usage (insn, counts, NULL_RTX, -1);
7497 if (validate_change (insn, &SET_SRC (set), new, 0))
7499 count_reg_usage (insn, counts, NULL_RTX, 1);
7500 remove_note (insn, find_reg_note (insn, REG_RETVAL, NULL_RTX));
7501 remove_note (insn, note);
7502 return true;
7505 if (CONSTANT_P (new))
7507 new = force_const_mem (GET_MODE (SET_DEST (set)), new);
7508 if (new && validate_change (insn, &SET_SRC (set), new, 0))
7510 count_reg_usage (insn, counts, NULL_RTX, 1);
7511 remove_note (insn, find_reg_note (insn, REG_RETVAL, NULL_RTX));
7512 remove_note (insn, note);
7513 return true;
7517 count_reg_usage (insn, counts, NULL_RTX, 1);
7518 return false;
7521 /* Scan all the insns and delete any that are dead; i.e., they store a register
7522 that is never used or they copy a register to itself.
7524 This is used to remove insns made obviously dead by cse, loop, or other
7525 optimizations. It improves the heuristics in loop.c, since that pass won't
7526 try to move dead invariants out of loops or make givs for dead quantities. The
7527 remaining passes of the compilation are also sped up. */
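/* Editor's worked example (schematic):

       insn A:  (set (reg 100) (const_int 5))
       insn B:  (set (reg 101) (reg 100))   ; reg 101 never read

   Scanning backward, B is visited first: counts[101] == 0, so B is
   deleted and its use of reg 100 is un-counted.  By the time A is
   reached, counts[100] has dropped to 0 and A dies in the same pass.
   The do/while loop repeats the scan until no further insns die,
   catching chains that the backward order alone cannot resolve
   (e.g. a dead use that appears earlier in the insn stream than its
   setter).  */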
7529 int
7530 delete_trivially_dead_insns (rtx insns, int nreg)
7532 int *counts;
7533 rtx insn, prev;
7534 int in_libcall = 0, dead_libcall = 0;
7535 int ndead = 0, nlastdead, niterations = 0;
7537 timevar_push (TV_DELETE_TRIVIALLY_DEAD);
7538 /* First count the number of times each register is used. */
7539 counts = (int *) xcalloc (nreg, sizeof (int));
7540 for (insn = next_real_insn (insns); insn; insn = next_real_insn (insn))
7541 count_reg_usage (insn, counts, NULL_RTX, 1);
7543 do
7545 nlastdead = ndead;
7546 niterations++;
7547 /* Go from the last insn to the first and delete insns that only set unused
7548 registers or copy a register to itself. As we delete an insn, remove
7549 usage counts for registers it uses.
7551 The first jump optimization pass may leave a real insn as the last
7552 insn in the function. We must not skip that insn or we may end
7553 up deleting code that is not really dead. */
7554 insn = get_last_insn ();
7555 if (! INSN_P (insn))
7556 insn = prev_real_insn (insn);
7558 for (; insn; insn = prev)
7560 int live_insn = 0;
7562 prev = prev_real_insn (insn);
7564 /* Don't delete any insns that are part of a libcall block unless
7565 we can delete the whole libcall block.
7567 Flow or loop might get confused if we did that. Remember
7568 that we are scanning backwards. */
7569 if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
7571 in_libcall = 1;
7572 live_insn = 1;
7573 dead_libcall = dead_libcall_p (insn, counts);
7575 else if (in_libcall)
7576 live_insn = ! dead_libcall;
7577 else
7578 live_insn = insn_live_p (insn, counts);
7580 /* If this is a dead insn, delete it and show registers in it aren't
7581 being used. */
7583 if (! live_insn)
7585 count_reg_usage (insn, counts, NULL_RTX, -1);
7586 delete_insn_and_edges (insn);
7587 ndead++;
7590 if (find_reg_note (insn, REG_LIBCALL, NULL_RTX))
7592 in_libcall = 0;
7593 dead_libcall = 0;
7597 while (ndead != nlastdead);
7599 if (rtl_dump_file && ndead)
7600 fprintf (rtl_dump_file, "Deleted %i trivially dead insns; %i iterations\n",
7601 ndead, niterations);
7602 /* Clean up. */
7603 free (counts);
7604 timevar_pop (TV_DELETE_TRIVIALLY_DEAD);
7605 return ndead;