PR middle-end/19616
[official-gcc.git] / gcc / cse.c
blobfebf243f9326832b9e7dff941a1a94012cf45f14
1 /* Common subexpression elimination for GNU compiler.
2 Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998
3 1999, 2000, 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
22 #include "config.h"
23 /* stdio.h must precede rtl.h for FFS. */
24 #include "system.h"
25 #include "coretypes.h"
26 #include "tm.h"
27 #include "rtl.h"
28 #include "tm_p.h"
29 #include "hard-reg-set.h"
30 #include "regs.h"
31 #include "basic-block.h"
32 #include "flags.h"
33 #include "real.h"
34 #include "insn-config.h"
35 #include "recog.h"
36 #include "function.h"
37 #include "expr.h"
38 #include "toplev.h"
39 #include "output.h"
40 #include "ggc.h"
41 #include "timevar.h"
42 #include "except.h"
43 #include "target.h"
44 #include "params.h"
45 #include "rtlhooks-def.h"
47 /* The basic idea of common subexpression elimination is to go
48 through the code, keeping a record of expressions that would
49 have the same value at the current scan point, and replacing
50 expressions encountered with the cheapest equivalent expression.
52 It is too complicated to keep track of the different possibilities
53 when control paths merge in this code; so, at each label, we forget all
54 that is known and start fresh. This can be described as processing each
55 extended basic block separately. We have a separate pass to perform
56 global CSE.
58 Note CSE can turn a conditional or computed jump into a nop or
59 an unconditional jump. When this occurs we arrange to run the jump
60 optimizer after CSE to delete the unreachable code.
62 We use two data structures to record the equivalent expressions:
63 a hash table for most expressions, and a vector of "quantity
64 numbers" to record equivalent (pseudo) registers.
66 The use of the special data structure for registers is desirable
67 because it is faster. It is possible because registers references
68 contain a fairly small number, the register number, taken from
69 a contiguously allocated series, and two register references are
70 identical if they have the same number. General expressions
71 do not have any such thing, so the only way to retrieve the
72 information recorded on an expression other than a register
73 is to keep it in a hash table.
75 Registers and "quantity numbers":
77 At the start of each basic block, all of the (hardware and pseudo)
78 registers used in the function are given distinct quantity
79 numbers to indicate their contents. During scan, when the code
80 copies one register into another, we copy the quantity number.
81 When a register is loaded in any other way, we allocate a new
82 quantity number to describe the value generated by this operation.
83 `reg_qty' records what quantity a register is currently thought
84 of as containing.
86 All real quantity numbers are greater than or equal to zero.
87 If register N has not been assigned a quantity, reg_qty[N] will
88 equal -N - 1, which is always negative.
90 Quantity numbers below zero do not exist and none of the `qty_table'
91 entries should be referenced with a negative index.
93 We also maintain a bidirectional chain of registers for each
94 quantity number. The `qty_table` members `first_reg' and `last_reg',
95 and `reg_eqv_table' members `next' and `prev' hold these chains.
97 The first register in a chain is the one whose lifespan is least local.
98 Among equals, it is the one that was seen first.
99 We replace any equivalent register with that one.
101 If two registers have the same quantity number, it must be true that
102 REG expressions with qty_table `mode' must be in the hash table for both
103 registers and must be in the same class.
105 The converse is not true. Since hard registers may be referenced in
106 any mode, two REG expressions might be equivalent in the hash table
107 but not have the same quantity number if the quantity number of one
108 of the registers is not the same mode as those expressions.
110 Constants and quantity numbers
112 When a quantity has a known constant value, that value is stored
113 in the appropriate qty_table `const_rtx'. This is in addition to
114 putting the constant in the hash table as is usual for non-regs.
116 Whether a reg or a constant is preferred is determined by the configuration
117 macro CONST_COSTS and will often depend on the constant value. In any
118 event, expressions containing constants can be simplified, by fold_rtx.
120 When a quantity has a known nearly constant value (such as an address
121 of a stack slot), that value is stored in the appropriate qty_table
122 `const_rtx'.
124 Integer constants don't have a machine mode. However, cse
125 determines the intended machine mode from the destination
126 of the instruction that moves the constant. The machine mode
127 is recorded in the hash table along with the actual RTL
128 constant expression so that different modes are kept separate.
130 Other expressions:
132 To record known equivalences among expressions in general
133 we use a hash table called `table'. It has a fixed number of buckets
134 that contain chains of `struct table_elt' elements for expressions.
135 These chains connect the elements whose expressions have the same
136 hash codes.
138 Other chains through the same elements connect the elements which
139 currently have equivalent values.
141 Register references in an expression are canonicalized before hashing
142 the expression. This is done using `reg_qty' and qty_table `first_reg'.
143 The hash code of a register reference is computed using the quantity
144 number, not the register number.
146 When the value of an expression changes, it is necessary to remove from the
147 hash table not just that expression but all expressions whose values
148 could be different as a result.
150 1. If the value changing is in memory, except in special cases
151 ANYTHING referring to memory could be changed. That is because
152 nobody knows where a pointer does not point.
153 The function `invalidate_memory' removes what is necessary.
155 The special cases are when the address is constant or is
156 a constant plus a fixed register such as the frame pointer
157 or a static chain pointer. When such addresses are stored in,
158 we can tell exactly which other such addresses must be invalidated
159 due to overlap. `invalidate' does this.
160 All expressions that refer to non-constant
161 memory addresses are also invalidated. `invalidate_memory' does this.
163 2. If the value changing is a register, all expressions
164 containing references to that register, and only those,
165 must be removed.
167 Because searching the entire hash table for expressions that contain
168 a register is very slow, we try to figure out when it isn't necessary.
169 Precisely, this is necessary only when expressions have been
170 entered in the hash table using this register, and then the value has
171 changed, and then another expression wants to be added to refer to
172 the register's new value. This sequence of circumstances is rare
173 within any one basic block.
175 The vectors `reg_tick' and `reg_in_table' are used to detect this case.
176 reg_tick[i] is incremented whenever a value is stored in register i.
177 reg_in_table[i] holds -1 if no references to register i have been
178 entered in the table; otherwise, it contains the value reg_tick[i] had
179 when the references were entered. If we want to enter a reference
180 and reg_in_table[i] != reg_tick[i], we must scan and remove old references.
181 Until we want to enter a new entry, the mere fact that the two vectors
182 don't match makes the entries be ignored if anyone tries to match them.
184 Registers themselves are entered in the hash table as well as in
185 the equivalent-register chains. However, the vectors `reg_tick'
186 and `reg_in_table' do not apply to expressions which are simple
187 register references. These expressions are removed from the table
188 immediately when they become invalid, and this can be done even if
189 we do not immediately search for all the expressions that refer to
190 the register.
192 A CLOBBER rtx in an instruction invalidates its operand for further
193 reuse. A CLOBBER or SET rtx whose operand is a MEM:BLK
194 invalidates everything that resides in memory.
196 Related expressions:
198 Constant expressions that differ only by an additive integer
199 are called related. When a constant expression is put in
200 the table, the related expression with no constant term
201 is also entered. These are made to point at each other
202 so that it is possible to find out if there exists any
203 register equivalent to an expression related to a given expression. */
205 /* Length of qty_table vector. We know in advance we will not need
206 a quantity number this big. */
208 static int max_qty;
210 /* Next quantity number to be allocated.
211 This is 1 + the largest number needed so far. */
213 static int next_qty;
215 /* Per-qty information tracking.
217 `first_reg' and `last_reg' track the head and tail of the
218 chain of registers which currently contain this quantity.
220 `mode' contains the machine mode of this quantity.
222 `const_rtx' holds the rtx of the constant value of this
223 quantity, if known. A summations of the frame/arg pointer
224 and a constant can also be entered here. When this holds
225 a known value, `const_insn' is the insn which stored the
226 constant value.
228 `comparison_{code,const,qty}' are used to track when a
229 comparison between a quantity and some constant or register has
230 been passed. In such a case, we know the results of the comparison
231 in case we see it again. These members record a comparison that
232 is known to be true. `comparison_code' holds the rtx code of such
233 a comparison, else it is set to UNKNOWN and the other two
234 comparison members are undefined. `comparison_const' holds
235 the constant being compared against, or zero if the comparison
236 is not against a constant. `comparison_qty' holds the quantity
237 being compared against when the result is known. If the comparison
238 is not with a register, `comparison_qty' is -1. */
240 struct qty_table_elem
242 rtx const_rtx;
243 rtx const_insn;
244 rtx comparison_const;
245 int comparison_qty;
246 unsigned int first_reg, last_reg;
247 /* The sizes of these fields should match the sizes of the
248 code and mode fields of struct rtx_def (see rtl.h). */
249 ENUM_BITFIELD(rtx_code) comparison_code : 16;
250 ENUM_BITFIELD(machine_mode) mode : 8;
253 /* The table of all qtys, indexed by qty number. */
254 static struct qty_table_elem *qty_table;
256 /* Structure used to pass arguments via for_each_rtx to function
257 cse_change_cc_mode. */
258 struct change_cc_mode_args
260 rtx insn;
261 rtx newreg;
264 #ifdef HAVE_cc0
265 /* For machines that have a CC0, we do not record its value in the hash
266 table since its use is guaranteed to be the insn immediately following
267 its definition and any other insn is presumed to invalidate it.
269 Instead, we store below the value last assigned to CC0. If it should
270 happen to be a constant, it is stored in preference to the actual
271 assigned value. In case it is a constant, we store the mode in which
272 the constant should be interpreted. */
274 static rtx prev_insn_cc0;
275 static enum machine_mode prev_insn_cc0_mode;
277 /* Previous actual insn. 0 if at first insn of basic block. */
279 static rtx prev_insn;
280 #endif
282 /* Insn being scanned. */
284 static rtx this_insn;
286 /* Index by register number, gives the number of the next (or
287 previous) register in the chain of registers sharing the same
288 value.
290 Or -1 if this register is at the end of the chain.
292 If reg_qty[N] == N, reg_eqv_table[N].next is undefined. */
294 /* Per-register equivalence chain. */
295 struct reg_eqv_elem
297 int next, prev;
300 /* The table of all register equivalence chains. */
301 static struct reg_eqv_elem *reg_eqv_table;
303 struct cse_reg_info
305 /* Next in hash chain. */
306 struct cse_reg_info *hash_next;
308 /* The next cse_reg_info structure in the free or used list. */
309 struct cse_reg_info *next;
311 /* Search key */
312 unsigned int regno;
314 /* The quantity number of the register's current contents. */
315 int reg_qty;
317 /* The number of times the register has been altered in the current
318 basic block. */
319 int reg_tick;
321 /* The REG_TICK value at which rtx's containing this register are
322 valid in the hash table. If this does not equal the current
323 reg_tick value, such expressions existing in the hash table are
324 invalid. */
325 int reg_in_table;
327 /* The SUBREG that was set when REG_TICK was last incremented. Set
328 to -1 if the last store was to the whole register, not a subreg. */
329 unsigned int subreg_ticked;
332 /* A free list of cse_reg_info entries. */
333 static struct cse_reg_info *cse_reg_info_free_list;
335 /* A used list of cse_reg_info entries. */
336 static struct cse_reg_info *cse_reg_info_used_list;
337 static struct cse_reg_info *cse_reg_info_used_list_end;
339 /* A mapping from registers to cse_reg_info data structures. */
340 #define REGHASH_SHIFT 7
341 #define REGHASH_SIZE (1 << REGHASH_SHIFT)
342 #define REGHASH_MASK (REGHASH_SIZE - 1)
343 static struct cse_reg_info *reg_hash[REGHASH_SIZE];
345 #define REGHASH_FN(REGNO) \
346 (((REGNO) ^ ((REGNO) >> REGHASH_SHIFT)) & REGHASH_MASK)
348 /* The last lookup we did into the cse_reg_info_tree. This allows us
349 to cache repeated lookups. */
350 static unsigned int cached_regno;
351 static struct cse_reg_info *cached_cse_reg_info;
353 /* A HARD_REG_SET containing all the hard registers for which there is
354 currently a REG expression in the hash table. Note the difference
355 from the above variables, which indicate if the REG is mentioned in some
356 expression in the table. */
358 static HARD_REG_SET hard_regs_in_table;
360 /* CUID of insn that starts the basic block currently being cse-processed. */
362 static int cse_basic_block_start;
364 /* CUID of insn that ends the basic block currently being cse-processed. */
366 static int cse_basic_block_end;
368 /* Vector mapping INSN_UIDs to cuids.
369 The cuids are like uids but increase monotonically always.
370 We use them to see whether a reg is used outside a given basic block. */
372 static int *uid_cuid;
374 /* Highest UID in UID_CUID. */
375 static int max_uid;
377 /* Get the cuid of an insn. */
379 #define INSN_CUID(INSN) (uid_cuid[INSN_UID (INSN)])
381 /* Nonzero if this pass has made changes, and therefore it's
382 worthwhile to run the garbage collector. */
384 static int cse_altered;
386 /* Nonzero if cse has altered conditional jump insns
387 in such a way that jump optimization should be redone. */
389 static int cse_jumps_altered;
391 /* Nonzero if we put a LABEL_REF into the hash table for an INSN without a
392 REG_LABEL, we have to rerun jump after CSE to put in the note. */
393 static int recorded_label_ref;
395 /* canon_hash stores 1 in do_not_record
396 if it notices a reference to CC0, PC, or some other volatile
397 subexpression. */
399 static int do_not_record;
401 /* canon_hash stores 1 in hash_arg_in_memory
402 if it notices a reference to memory within the expression being hashed. */
404 static int hash_arg_in_memory;
406 /* The hash table contains buckets which are chains of `struct table_elt's,
407 each recording one expression's information.
408 That expression is in the `exp' field.
410 The canon_exp field contains a canonical (from the point of view of
411 alias analysis) version of the `exp' field.
413 Those elements with the same hash code are chained in both directions
414 through the `next_same_hash' and `prev_same_hash' fields.
416 Each set of expressions with equivalent values
417 are on a two-way chain through the `next_same_value'
418 and `prev_same_value' fields, and all point with
419 the `first_same_value' field at the first element in
420 that chain. The chain is in order of increasing cost.
421 Each element's cost value is in its `cost' field.
423 The `in_memory' field is nonzero for elements that
424 involve any reference to memory. These elements are removed
425 whenever a write is done to an unidentified location in memory.
426 To be safe, we assume that a memory address is unidentified unless
427 the address is either a symbol constant or a constant plus
428 the frame pointer or argument pointer.
430 The `related_value' field is used to connect related expressions
431 (that differ by adding an integer).
432 The related expressions are chained in a circular fashion.
433 `related_value' is zero for expressions for which this
434 chain is not useful.
436 The `cost' field stores the cost of this element's expression.
437 The `regcost' field stores the value returned by approx_reg_cost for
438 this element's expression.
440 The `is_const' flag is set if the element is a constant (including
441 a fixed address).
443 The `flag' field is used as a temporary during some search routines.
445 The `mode' field is usually the same as GET_MODE (`exp'), but
446 if `exp' is a CONST_INT and has no machine mode then the `mode'
447 field is the mode it was being used as. Each constant is
448 recorded separately for each mode it is used with. */
450 struct table_elt
452 rtx exp;
453 rtx canon_exp;
454 struct table_elt *next_same_hash;
455 struct table_elt *prev_same_hash;
456 struct table_elt *next_same_value;
457 struct table_elt *prev_same_value;
458 struct table_elt *first_same_value;
459 struct table_elt *related_value;
460 int cost;
461 int regcost;
462 /* The size of this field should match the size
463 of the mode field of struct rtx_def (see rtl.h). */
464 ENUM_BITFIELD(machine_mode) mode : 8;
465 char in_memory;
466 char is_const;
467 char flag;
470 /* We don't want a lot of buckets, because we rarely have very many
471 things stored in the hash table, and a lot of buckets slows
472 down a lot of loops that happen frequently. */
473 #define HASH_SHIFT 5
474 #define HASH_SIZE (1 << HASH_SHIFT)
475 #define HASH_MASK (HASH_SIZE - 1)
477 /* Compute hash code of X in mode M. Special-case case where X is a pseudo
478 register (hard registers may require `do_not_record' to be set). */
480 #define HASH(X, M) \
481 ((REG_P (X) && REGNO (X) >= FIRST_PSEUDO_REGISTER \
482 ? (((unsigned) REG << 7) + (unsigned) REG_QTY (REGNO (X))) \
483 : canon_hash (X, M)) & HASH_MASK)
485 /* Like HASH, but without side-effects. */
486 #define SAFE_HASH(X, M) \
487 ((REG_P (X) && REGNO (X) >= FIRST_PSEUDO_REGISTER \
488 ? (((unsigned) REG << 7) + (unsigned) REG_QTY (REGNO (X))) \
489 : safe_hash (X, M)) & HASH_MASK)
491 /* Determine whether register number N is considered a fixed register for the
492 purpose of approximating register costs.
493 It is desirable to replace other regs with fixed regs, to reduce need for
494 non-fixed hard regs.
495 A reg wins if it is either the frame pointer or designated as fixed. */
496 #define FIXED_REGNO_P(N) \
497 ((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
498 || fixed_regs[N] || global_regs[N])
500 /* Compute cost of X, as stored in the `cost' field of a table_elt. Fixed
501 hard registers and pointers into the frame are the cheapest with a cost
502 of 0. Next come pseudos with a cost of one and other hard registers with
503 a cost of 2. Aside from these special cases, call `rtx_cost'. */
505 #define CHEAP_REGNO(N) \
506 (REGNO_PTR_FRAME_P(N) \
507 || (HARD_REGISTER_NUM_P (N) \
508 && FIXED_REGNO_P (N) && REGNO_REG_CLASS (N) != NO_REGS))
510 #define COST(X) (REG_P (X) ? 0 : notreg_cost (X, SET))
511 #define COST_IN(X,OUTER) (REG_P (X) ? 0 : notreg_cost (X, OUTER))
513 /* Get the info associated with register N. */
515 #define GET_CSE_REG_INFO(N) \
516 (((N) == cached_regno && cached_cse_reg_info) \
517 ? cached_cse_reg_info : get_cse_reg_info ((N)))
519 /* Get the number of times this register has been updated in this
520 basic block. */
522 #define REG_TICK(N) ((GET_CSE_REG_INFO (N))->reg_tick)
524 /* Get the point at which REG was recorded in the table. */
526 #define REG_IN_TABLE(N) ((GET_CSE_REG_INFO (N))->reg_in_table)
528 /* Get the SUBREG set at the last increment to REG_TICK (-1 if not a
529 SUBREG). */
531 #define SUBREG_TICKED(N) ((GET_CSE_REG_INFO (N))->subreg_ticked)
533 /* Get the quantity number for REG. */
535 #define REG_QTY(N) ((GET_CSE_REG_INFO (N))->reg_qty)
537 /* Determine if the quantity number for register X represents a valid index
538 into the qty_table. */
540 #define REGNO_QTY_VALID_P(N) (REG_QTY (N) >= 0)
542 static struct table_elt *table[HASH_SIZE];
544 /* Chain of `struct table_elt's made so far for this function
545 but currently removed from the table. */
547 static struct table_elt *free_element_chain;
549 /* Number of `struct table_elt' structures made so far for this function. */
551 static int n_elements_made;
553 /* Maximum value `n_elements_made' has had so far in this compilation
554 for functions previously processed. */
556 static int max_elements_made;
558 /* Set to the cost of a constant pool reference if one was found for a
559 symbolic constant. If this was found, it means we should try to
560 convert constants into constant pool entries if they don't fit in
561 the insn. */
563 static int constant_pool_entries_cost;
564 static int constant_pool_entries_regcost;
566 /* This data describes a block that will be processed by cse_basic_block. */
568 struct cse_basic_block_data
570 /* Lowest CUID value of insns in block. */
571 int low_cuid;
572 /* Highest CUID value of insns in block. */
573 int high_cuid;
574 /* Total number of SETs in block. */
575 int nsets;
576 /* Last insn in the block. */
577 rtx last;
578 /* Size of current branch path, if any. */
579 int path_size;
580 /* Current branch path, indicating which branches will be taken. */
581 struct branch_path
583 /* The branch insn. */
584 rtx branch;
585 /* Whether it should be taken or not. AROUND is the same as taken
586 except that it is used when the destination label is not preceded
587 by a BARRIER. */
588 enum taken {PATH_TAKEN, PATH_NOT_TAKEN, PATH_AROUND} status;
589 } *path;
592 static bool fixed_base_plus_p (rtx x);
593 static int notreg_cost (rtx, enum rtx_code);
594 static int approx_reg_cost_1 (rtx *, void *);
595 static int approx_reg_cost (rtx);
596 static int preferable (int, int, int, int);
597 static void new_basic_block (void);
598 static void make_new_qty (unsigned int, enum machine_mode);
599 static void make_regs_eqv (unsigned int, unsigned int);
600 static void delete_reg_equiv (unsigned int);
601 static int mention_regs (rtx);
602 static int insert_regs (rtx, struct table_elt *, int);
603 static void remove_from_table (struct table_elt *, unsigned);
604 static struct table_elt *lookup (rtx, unsigned, enum machine_mode);
605 static struct table_elt *lookup_for_remove (rtx, unsigned, enum machine_mode);
606 static rtx lookup_as_function (rtx, enum rtx_code);
607 static struct table_elt *insert (rtx, struct table_elt *, unsigned,
608 enum machine_mode);
609 static void merge_equiv_classes (struct table_elt *, struct table_elt *);
610 static void invalidate (rtx, enum machine_mode);
611 static int cse_rtx_varies_p (rtx, int);
612 static void remove_invalid_refs (unsigned int);
613 static void remove_invalid_subreg_refs (unsigned int, unsigned int,
614 enum machine_mode);
615 static void rehash_using_reg (rtx);
616 static void invalidate_memory (void);
617 static void invalidate_for_call (void);
618 static rtx use_related_value (rtx, struct table_elt *);
620 static inline unsigned canon_hash (rtx, enum machine_mode);
621 static inline unsigned safe_hash (rtx, enum machine_mode);
622 static unsigned hash_rtx_string (const char *);
624 static rtx canon_reg (rtx, rtx);
625 static void find_best_addr (rtx, rtx *, enum machine_mode);
626 static enum rtx_code find_comparison_args (enum rtx_code, rtx *, rtx *,
627 enum machine_mode *,
628 enum machine_mode *);
629 static rtx fold_rtx (rtx, rtx);
630 static rtx equiv_constant (rtx);
631 static void record_jump_equiv (rtx, int);
632 static void record_jump_cond (enum rtx_code, enum machine_mode, rtx, rtx,
633 int);
634 static void cse_insn (rtx, rtx);
635 static void cse_end_of_basic_block (rtx, struct cse_basic_block_data *,
636 int, int);
637 static int addr_affects_sp_p (rtx);
638 static void invalidate_from_clobbers (rtx);
639 static rtx cse_process_notes (rtx, rtx);
640 static void invalidate_skipped_set (rtx, rtx, void *);
641 static void invalidate_skipped_block (rtx);
642 static rtx cse_basic_block (rtx, rtx, struct branch_path *);
643 static void count_reg_usage (rtx, int *, int);
644 static int check_for_label_ref (rtx *, void *);
645 extern void dump_class (struct table_elt*);
646 static struct cse_reg_info * get_cse_reg_info (unsigned int);
647 static int check_dependence (rtx *, void *);
649 static void flush_hash_table (void);
650 static bool insn_live_p (rtx, int *);
651 static bool set_live_p (rtx, rtx, int *);
652 static bool dead_libcall_p (rtx, int *);
653 static int cse_change_cc_mode (rtx *, void *);
654 static void cse_change_cc_mode_insn (rtx, rtx);
655 static void cse_change_cc_mode_insns (rtx, rtx, rtx);
656 static enum machine_mode cse_cc_succs (basic_block, rtx, rtx, bool);
659 #undef RTL_HOOKS_GEN_LOWPART
660 #define RTL_HOOKS_GEN_LOWPART gen_lowpart_if_possible
662 static const struct rtl_hooks cse_rtl_hooks = RTL_HOOKS_INITIALIZER;
664 /* Nonzero if X has the form (PLUS frame-pointer integer). We check for
665 virtual regs here because the simplify_*_operation routines are called
666 by integrate.c, which is called before virtual register instantiation. */
668 static bool
669 fixed_base_plus_p (rtx x)
671 switch (GET_CODE (x))
673 case REG:
674 if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx)
675 return true;
676 if (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])
677 return true;
678 if (REGNO (x) >= FIRST_VIRTUAL_REGISTER
679 && REGNO (x) <= LAST_VIRTUAL_REGISTER)
680 return true;
681 return false;
683 case PLUS:
684 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
685 return false;
686 return fixed_base_plus_p (XEXP (x, 0));
688 default:
689 return false;
693 /* Dump the expressions in the equivalence class indicated by CLASSP.
694 This function is used only for debugging. */
695 void
696 dump_class (struct table_elt *classp)
698 struct table_elt *elt;
700 fprintf (stderr, "Equivalence chain for ");
701 print_rtl (stderr, classp->exp);
702 fprintf (stderr, ": \n");
704 for (elt = classp->first_same_value; elt; elt = elt->next_same_value)
706 print_rtl (stderr, elt->exp);
707 fprintf (stderr, "\n");
711 /* Subroutine of approx_reg_cost; called through for_each_rtx. */
713 static int
714 approx_reg_cost_1 (rtx *xp, void *data)
716 rtx x = *xp;
717 int *cost_p = data;
719 if (x && REG_P (x))
721 unsigned int regno = REGNO (x);
723 if (! CHEAP_REGNO (regno))
725 if (regno < FIRST_PSEUDO_REGISTER)
727 if (SMALL_REGISTER_CLASSES)
728 return 1;
729 *cost_p += 2;
731 else
732 *cost_p += 1;
736 return 0;
739 /* Return an estimate of the cost of the registers used in an rtx.
740 This is mostly the number of different REG expressions in the rtx;
741 however for some exceptions like fixed registers we use a cost of
742 0. If any other hard register reference occurs, return MAX_COST. */
744 static int
745 approx_reg_cost (rtx x)
747 int cost = 0;
749 if (for_each_rtx (&x, approx_reg_cost_1, (void *) &cost))
750 return MAX_COST;
752 return cost;
755 /* Returns a canonical version of X for the address, from the point of view,
756 that all multiplications are represented as MULT instead of the multiply
757 by a power of 2 being represented as ASHIFT. */
759 static rtx
760 canon_for_address (rtx x)
762 enum rtx_code code;
763 enum machine_mode mode;
764 rtx new = 0;
765 int i;
766 const char *fmt;
768 if (!x)
769 return x;
771 code = GET_CODE (x);
772 mode = GET_MODE (x);
774 switch (code)
776 case ASHIFT:
777 if (GET_CODE (XEXP (x, 1)) == CONST_INT
778 && INTVAL (XEXP (x, 1)) < GET_MODE_BITSIZE (mode)
779 && INTVAL (XEXP (x, 1)) >= 0)
781 new = canon_for_address (XEXP (x, 0));
782 new = gen_rtx_MULT (mode, new,
783 gen_int_mode ((HOST_WIDE_INT) 1
784 << INTVAL (XEXP (x, 1)),
785 mode));
787 break;
788 default:
789 break;
792 if (new)
793 return new;
795 /* Now recursively process each operand of this operation. */
796 fmt = GET_RTX_FORMAT (code);
797 for (i = 0; i < GET_RTX_LENGTH (code); i++)
798 if (fmt[i] == 'e')
800 new = canon_for_address (XEXP (x, i));
801 XEXP (x, i) = new;
803 return x;
806 /* Return a negative value if an rtx A, whose costs are given by COST_A
807 and REGCOST_A, is more desirable than an rtx B.
808 Return a positive value if A is less desirable, or 0 if the two are
809 equally good. */
810 static int
811 preferable (int cost_a, int regcost_a, int cost_b, int regcost_b)
813 /* First, get rid of cases involving expressions that are entirely
814 unwanted. */
815 if (cost_a != cost_b)
817 if (cost_a == MAX_COST)
818 return 1;
819 if (cost_b == MAX_COST)
820 return -1;
823 /* Avoid extending lifetimes of hardregs. */
824 if (regcost_a != regcost_b)
826 if (regcost_a == MAX_COST)
827 return 1;
828 if (regcost_b == MAX_COST)
829 return -1;
832 /* Normal operation costs take precedence. */
833 if (cost_a != cost_b)
834 return cost_a - cost_b;
835 /* Only if these are identical consider effects on register pressure. */
836 if (regcost_a != regcost_b)
837 return regcost_a - regcost_b;
838 return 0;
841 /* Internal function, to compute cost when X is not a register; called
842 from COST macro to keep it simple. */
844 static int
845 notreg_cost (rtx x, enum rtx_code outer)
847 return ((GET_CODE (x) == SUBREG
848 && REG_P (SUBREG_REG (x))
849 && GET_MODE_CLASS (GET_MODE (x)) == MODE_INT
850 && GET_MODE_CLASS (GET_MODE (SUBREG_REG (x))) == MODE_INT
851 && (GET_MODE_SIZE (GET_MODE (x))
852 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
853 && subreg_lowpart_p (x)
854 && TRULY_NOOP_TRUNCATION (GET_MODE_BITSIZE (GET_MODE (x)),
855 GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x)))))
857 : rtx_cost (x, outer) * 2);
861 static struct cse_reg_info *
862 get_cse_reg_info (unsigned int regno)
864 struct cse_reg_info **hash_head = &reg_hash[REGHASH_FN (regno)];
865 struct cse_reg_info *p;
867 for (p = *hash_head; p != NULL; p = p->hash_next)
868 if (p->regno == regno)
869 break;
871 if (p == NULL)
873 /* Get a new cse_reg_info structure. */
874 if (cse_reg_info_free_list)
876 p = cse_reg_info_free_list;
877 cse_reg_info_free_list = p->next;
879 else
880 p = xmalloc (sizeof (struct cse_reg_info));
882 /* Insert into hash table. */
883 p->hash_next = *hash_head;
884 *hash_head = p;
886 /* Initialize it. */
887 p->reg_tick = 1;
888 p->reg_in_table = -1;
889 p->subreg_ticked = -1;
890 p->reg_qty = -regno - 1;
891 p->regno = regno;
892 p->next = cse_reg_info_used_list;
893 cse_reg_info_used_list = p;
894 if (!cse_reg_info_used_list_end)
895 cse_reg_info_used_list_end = p;
898 /* Cache this lookup; we tend to be looking up information about the
899 same register several times in a row. */
900 cached_regno = regno;
901 cached_cse_reg_info = p;
903 return p;
906 /* Clear the hash table and initialize each register with its own quantity,
907 for a new basic block. */
909 static void
910 new_basic_block (void)
912 int i;
914 next_qty = 0;
916 /* Clear out hash table state for this pass. */
918 memset (reg_hash, 0, sizeof reg_hash);
920 if (cse_reg_info_used_list)
922 cse_reg_info_used_list_end->next = cse_reg_info_free_list;
923 cse_reg_info_free_list = cse_reg_info_used_list;
924 cse_reg_info_used_list = cse_reg_info_used_list_end = 0;
926 cached_cse_reg_info = 0;
928 CLEAR_HARD_REG_SET (hard_regs_in_table);
930 /* The per-quantity values used to be initialized here, but it is
931 much faster to initialize each as it is made in `make_new_qty'. */
933 for (i = 0; i < HASH_SIZE; i++)
935 struct table_elt *first;
937 first = table[i];
938 if (first != NULL)
940 struct table_elt *last = first;
942 table[i] = NULL;
944 while (last->next_same_hash != NULL)
945 last = last->next_same_hash;
947 /* Now relink this hash entire chain into
948 the free element list. */
950 last->next_same_hash = free_element_chain;
951 free_element_chain = first;
955 #ifdef HAVE_cc0
956 prev_insn = 0;
957 prev_insn_cc0 = 0;
958 #endif
961 /* Say that register REG contains a quantity in mode MODE not in any
962 register before and initialize that quantity. */
964 static void
965 make_new_qty (unsigned int reg, enum machine_mode mode)
967 int q;
968 struct qty_table_elem *ent;
969 struct reg_eqv_elem *eqv;
971 gcc_assert (next_qty < max_qty);
973 q = REG_QTY (reg) = next_qty++;
974 ent = &qty_table[q];
975 ent->first_reg = reg;
976 ent->last_reg = reg;
977 ent->mode = mode;
978 ent->const_rtx = ent->const_insn = NULL_RTX;
979 ent->comparison_code = UNKNOWN;
981 eqv = &reg_eqv_table[reg];
982 eqv->next = eqv->prev = -1;
985 /* Make reg NEW equivalent to reg OLD.
986 OLD is not changing; NEW is. */
988 static void
989 make_regs_eqv (unsigned int new, unsigned int old)
991 unsigned int lastr, firstr;
992 int q = REG_QTY (old);
993 struct qty_table_elem *ent;
995 ent = &qty_table[q];
997 /* Nothing should become eqv until it has a "non-invalid" qty number. */
998 gcc_assert (REGNO_QTY_VALID_P (old));
1000 REG_QTY (new) = q;
1001 firstr = ent->first_reg;
1002 lastr = ent->last_reg;
1004 /* Prefer fixed hard registers to anything. Prefer pseudo regs to other
1005 hard regs. Among pseudos, if NEW will live longer than any other reg
1006 of the same qty, and that is beyond the current basic block,
1007 make it the new canonical replacement for this qty. */
1008 if (! (firstr < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (firstr))
1009 /* Certain fixed registers might be of the class NO_REGS. This means
1010 that not only can they not be allocated by the compiler, but
1011 they cannot be used in substitutions or canonicalizations
1012 either. */
1013 && (new >= FIRST_PSEUDO_REGISTER || REGNO_REG_CLASS (new) != NO_REGS)
1014 && ((new < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (new))
1015 || (new >= FIRST_PSEUDO_REGISTER
1016 && (firstr < FIRST_PSEUDO_REGISTER
1017 || ((uid_cuid[REGNO_LAST_UID (new)] > cse_basic_block_end
1018 || (uid_cuid[REGNO_FIRST_UID (new)]
1019 < cse_basic_block_start))
1020 && (uid_cuid[REGNO_LAST_UID (new)]
1021 > uid_cuid[REGNO_LAST_UID (firstr)]))))))
1023 reg_eqv_table[firstr].prev = new;
1024 reg_eqv_table[new].next = firstr;
1025 reg_eqv_table[new].prev = -1;
1026 ent->first_reg = new;
1028 else
1030 /* If NEW is a hard reg (known to be non-fixed), insert at end.
1031 Otherwise, insert before any non-fixed hard regs that are at the
1032 end. Registers of class NO_REGS cannot be used as an
1033 equivalent for anything. */
1034 while (lastr < FIRST_PSEUDO_REGISTER && reg_eqv_table[lastr].prev >= 0
1035 && (REGNO_REG_CLASS (lastr) == NO_REGS || ! FIXED_REGNO_P (lastr))
1036 && new >= FIRST_PSEUDO_REGISTER)
1037 lastr = reg_eqv_table[lastr].prev;
1038 reg_eqv_table[new].next = reg_eqv_table[lastr].next;
1039 if (reg_eqv_table[lastr].next >= 0)
1040 reg_eqv_table[reg_eqv_table[lastr].next].prev = new;
1041 else
1042 qty_table[q].last_reg = new;
1043 reg_eqv_table[lastr].next = new;
1044 reg_eqv_table[new].prev = lastr;
1048 /* Remove REG from its equivalence class. */
1050 static void
1051 delete_reg_equiv (unsigned int reg)
1053 struct qty_table_elem *ent;
1054 int q = REG_QTY (reg);
1055 int p, n;
1057 /* If invalid, do nothing. */
1058 if (! REGNO_QTY_VALID_P (reg))
1059 return;
1061 ent = &qty_table[q];
1063 p = reg_eqv_table[reg].prev;
1064 n = reg_eqv_table[reg].next;
1066 if (n != -1)
1067 reg_eqv_table[n].prev = p;
1068 else
1069 ent->last_reg = p;
1070 if (p != -1)
1071 reg_eqv_table[p].next = n;
1072 else
1073 ent->first_reg = n;
1075 REG_QTY (reg) = -reg - 1;
1078 /* Remove any invalid expressions from the hash table
1079 that refer to any of the registers contained in expression X.
1081 Make sure that newly inserted references to those registers
1082 as subexpressions will be considered valid.
1084 mention_regs is not called when a register itself
1085 is being stored in the table.
1087 Return 1 if we have done something that may have changed the hash code
1088 of X. */
1090 static int
1091 mention_regs (rtx x)
1093 enum rtx_code code;
1094 int i, j;
1095 const char *fmt;
1096 int changed = 0;
1098 if (x == 0)
1099 return 0;
1101 code = GET_CODE (x);
1102 if (code == REG)
1104 unsigned int regno = REGNO (x);
1105 unsigned int endregno
1106 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
1107 : hard_regno_nregs[regno][GET_MODE (x)]);
1108 unsigned int i;
1110 for (i = regno; i < endregno; i++)
1112 if (REG_IN_TABLE (i) >= 0 && REG_IN_TABLE (i) != REG_TICK (i))
1113 remove_invalid_refs (i);
1115 REG_IN_TABLE (i) = REG_TICK (i);
1116 SUBREG_TICKED (i) = -1;
1119 return 0;
1122 /* If this is a SUBREG, we don't want to discard other SUBREGs of the same
1123 pseudo if they don't use overlapping words. We handle only pseudos
1124 here for simplicity. */
1125 if (code == SUBREG && REG_P (SUBREG_REG (x))
1126 && REGNO (SUBREG_REG (x)) >= FIRST_PSEUDO_REGISTER)
1128 unsigned int i = REGNO (SUBREG_REG (x));
1130 if (REG_IN_TABLE (i) >= 0 && REG_IN_TABLE (i) != REG_TICK (i))
1132 /* If REG_IN_TABLE (i) differs from REG_TICK (i) by one, and
1133 the last store to this register really stored into this
1134 subreg, then remove the memory of this subreg.
1135 Otherwise, remove any memory of the entire register and
1136 all its subregs from the table. */
1137 if (REG_TICK (i) - REG_IN_TABLE (i) > 1
1138 || SUBREG_TICKED (i) != REGNO (SUBREG_REG (x)))
1139 remove_invalid_refs (i);
1140 else
1141 remove_invalid_subreg_refs (i, SUBREG_BYTE (x), GET_MODE (x));
1144 REG_IN_TABLE (i) = REG_TICK (i);
1145 SUBREG_TICKED (i) = REGNO (SUBREG_REG (x));
1146 return 0;
1149 /* If X is a comparison or a COMPARE and either operand is a register
1150 that does not have a quantity, give it one. This is so that a later
1151 call to record_jump_equiv won't cause X to be assigned a different
1152 hash code and not found in the table after that call.
1154 It is not necessary to do this here, since rehash_using_reg can
1155 fix up the table later, but doing this here eliminates the need to
1156 call that expensive function in the most common case where the only
1157 use of the register is in the comparison. */
1159 if (code == COMPARE || COMPARISON_P (x))
1161 if (REG_P (XEXP (x, 0))
1162 && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 0))))
1163 if (insert_regs (XEXP (x, 0), NULL, 0))
1165 rehash_using_reg (XEXP (x, 0));
1166 changed = 1;
1169 if (REG_P (XEXP (x, 1))
1170 && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 1))))
1171 if (insert_regs (XEXP (x, 1), NULL, 0))
1173 rehash_using_reg (XEXP (x, 1));
1174 changed = 1;
1178 fmt = GET_RTX_FORMAT (code);
1179 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1180 if (fmt[i] == 'e')
1181 changed |= mention_regs (XEXP (x, i));
1182 else if (fmt[i] == 'E')
1183 for (j = 0; j < XVECLEN (x, i); j++)
1184 changed |= mention_regs (XVECEXP (x, i, j));
1186 return changed;
1189 /* Update the register quantities for inserting X into the hash table
1190 with a value equivalent to CLASSP.
1191 (If the class does not contain a REG, it is irrelevant.)
1192 If MODIFIED is nonzero, X is a destination; it is being modified.
1193 Note that delete_reg_equiv should be called on a register
1194 before insert_regs is done on that register with MODIFIED != 0.
1196 Nonzero value means that elements of reg_qty have changed
1197 so X's hash code may be different. */
1199 static int
1200 insert_regs (rtx x, struct table_elt *classp, int modified)
1202 if (REG_P (x))
1204 unsigned int regno = REGNO (x);
1205 int qty_valid;
1207 /* If REGNO is in the equivalence table already but is of the
1208 wrong mode for that equivalence, don't do anything here. */
1210 qty_valid = REGNO_QTY_VALID_P (regno);
1211 if (qty_valid)
1213 struct qty_table_elem *ent = &qty_table[REG_QTY (regno)];
1215 if (ent->mode != GET_MODE (x))
1216 return 0;
1219 if (modified || ! qty_valid)
1221 if (classp)
1222 for (classp = classp->first_same_value;
1223 classp != 0;
1224 classp = classp->next_same_value)
1225 if (REG_P (classp->exp)
1226 && GET_MODE (classp->exp) == GET_MODE (x))
1228 make_regs_eqv (regno, REGNO (classp->exp));
1229 return 1;
1232 /* Mention_regs for a SUBREG checks if REG_TICK is exactly one larger
1233 than REG_IN_TABLE to find out if there was only a single preceding
1234 invalidation - for the SUBREG - or another one, which would be
1235 for the full register. However, if we find here that REG_TICK
1236 indicates that the register is invalid, it means that it has
1237 been invalidated in a separate operation. The SUBREG might be used
1238 now (then this is a recursive call), or we might use the full REG
1239 now and a SUBREG of it later. So bump up REG_TICK so that
1240 mention_regs will do the right thing. */
1241 if (! modified
1242 && REG_IN_TABLE (regno) >= 0
1243 && REG_TICK (regno) == REG_IN_TABLE (regno) + 1)
1244 REG_TICK (regno)++;
1245 make_new_qty (regno, GET_MODE (x));
1246 return 1;
1249 return 0;
1252 /* If X is a SUBREG, we will likely be inserting the inner register in the
1253 table. If that register doesn't have an assigned quantity number at
1254 this point but does later, the insertion that we will be doing now will
1255 not be accessible because its hash code will have changed. So assign
1256 a quantity number now. */
1258 else if (GET_CODE (x) == SUBREG && REG_P (SUBREG_REG (x))
1259 && ! REGNO_QTY_VALID_P (REGNO (SUBREG_REG (x))))
1261 insert_regs (SUBREG_REG (x), NULL, 0);
1262 mention_regs (x);
1263 return 1;
1265 else
1266 return mention_regs (x);
1269 /* Look in or update the hash table. */
1271 /* Remove table element ELT from use in the table.
1272 HASH is its hash code, made using the HASH macro.
1273 It's an argument because often that is known in advance
1274 and we save much time not recomputing it. */
1276 static void
1277 remove_from_table (struct table_elt *elt, unsigned int hash)
1279 if (elt == 0)
1280 return;
1282 /* Mark this element as removed. See cse_insn. */
1283 elt->first_same_value = 0;
1285 /* Remove the table element from its equivalence class. */
1288 struct table_elt *prev = elt->prev_same_value;
1289 struct table_elt *next = elt->next_same_value;
1291 if (next)
1292 next->prev_same_value = prev;
1294 if (prev)
1295 prev->next_same_value = next;
1296 else
1298 struct table_elt *newfirst = next;
1299 while (next)
1301 next->first_same_value = newfirst;
1302 next = next->next_same_value;
1307 /* Remove the table element from its hash bucket. */
1310 struct table_elt *prev = elt->prev_same_hash;
1311 struct table_elt *next = elt->next_same_hash;
1313 if (next)
1314 next->prev_same_hash = prev;
1316 if (prev)
1317 prev->next_same_hash = next;
1318 else if (table[hash] == elt)
1319 table[hash] = next;
1320 else
1322 /* This entry is not in the proper hash bucket. This can happen
1323 when two classes were merged by `merge_equiv_classes'. Search
1324 for the hash bucket that it heads. This happens only very
1325 rarely, so the cost is acceptable. */
1326 for (hash = 0; hash < HASH_SIZE; hash++)
1327 if (table[hash] == elt)
1328 table[hash] = next;
1332 /* Remove the table element from its related-value circular chain. */
1334 if (elt->related_value != 0 && elt->related_value != elt)
1336 struct table_elt *p = elt->related_value;
1338 while (p->related_value != elt)
1339 p = p->related_value;
1340 p->related_value = elt->related_value;
1341 if (p->related_value == p)
1342 p->related_value = 0;
1345 /* Now add it to the free element chain. */
1346 elt->next_same_hash = free_element_chain;
1347 free_element_chain = elt;
1350 /* Look up X in the hash table and return its table element,
1351 or 0 if X is not in the table.
1353 MODE is the machine-mode of X, or if X is an integer constant
1354 with VOIDmode then MODE is the mode with which X will be used.
1356 Here we are satisfied to find an expression whose tree structure
1357 looks like X. */
1359 static struct table_elt *
1360 lookup (rtx x, unsigned int hash, enum machine_mode mode)
1362 struct table_elt *p;
1364 for (p = table[hash]; p; p = p->next_same_hash)
1365 if (mode == p->mode && ((x == p->exp && REG_P (x))
1366 || exp_equiv_p (x, p->exp, !REG_P (x), false)))
1367 return p;
1369 return 0;
1372 /* Like `lookup' but don't care whether the table element uses invalid regs.
1373 Also ignore discrepancies in the machine mode of a register. */
1375 static struct table_elt *
1376 lookup_for_remove (rtx x, unsigned int hash, enum machine_mode mode)
1378 struct table_elt *p;
1380 if (REG_P (x))
1382 unsigned int regno = REGNO (x);
1384 /* Don't check the machine mode when comparing registers;
1385 invalidating (REG:SI 0) also invalidates (REG:DF 0). */
1386 for (p = table[hash]; p; p = p->next_same_hash)
1387 if (REG_P (p->exp)
1388 && REGNO (p->exp) == regno)
1389 return p;
1391 else
1393 for (p = table[hash]; p; p = p->next_same_hash)
1394 if (mode == p->mode
1395 && (x == p->exp || exp_equiv_p (x, p->exp, 0, false)))
1396 return p;
1399 return 0;
1402 /* Look for an expression equivalent to X and with code CODE.
1403 If one is found, return that expression. */
1405 static rtx
1406 lookup_as_function (rtx x, enum rtx_code code)
1408 struct table_elt *p
1409 = lookup (x, SAFE_HASH (x, VOIDmode), GET_MODE (x));
1411 /* If we are looking for a CONST_INT, the mode doesn't really matter, as
1412 long as we are narrowing. So if we looked in vain for a mode narrower
1413 than word_mode before, look for word_mode now. */
1414 if (p == 0 && code == CONST_INT
1415 && GET_MODE_SIZE (GET_MODE (x)) < GET_MODE_SIZE (word_mode))
1417 x = copy_rtx (x);
1418 PUT_MODE (x, word_mode);
1419 p = lookup (x, SAFE_HASH (x, VOIDmode), word_mode);
1422 if (p == 0)
1423 return 0;
1425 for (p = p->first_same_value; p; p = p->next_same_value)
1426 if (GET_CODE (p->exp) == code
1427 /* Make sure this is a valid entry in the table. */
1428 && exp_equiv_p (p->exp, p->exp, 1, false))
1429 return p->exp;
1431 return 0;
1434 /* Insert X in the hash table, assuming HASH is its hash code
1435 and CLASSP is an element of the class it should go in
1436 (or 0 if a new class should be made).
1437 It is inserted at the proper position to keep the class in
1438 the order cheapest first.
1440 MODE is the machine-mode of X, or if X is an integer constant
1441 with VOIDmode then MODE is the mode with which X will be used.
1443 For elements of equal cheapness, the most recent one
1444 goes in front, except that the first element in the list
1445 remains first unless a cheaper element is added. The order of
1446 pseudo-registers does not matter, as canon_reg will be called to
1447 find the cheapest when a register is retrieved from the table.
1449 The in_memory field in the hash table element is set to 0.
1450 The caller must set it nonzero if appropriate.
1452 You should call insert_regs (X, CLASSP, MODIFY) before calling here,
1453 and if insert_regs returns a nonzero value
1454 you must then recompute its hash code before calling here.
1456 If necessary, update table showing constant values of quantities. */
1458 #define CHEAPER(X, Y) \
1459 (preferable ((X)->cost, (X)->regcost, (Y)->cost, (Y)->regcost) < 0)
1461 static struct table_elt *
1462 insert (rtx x, struct table_elt *classp, unsigned int hash, enum machine_mode mode)
1464 struct table_elt *elt;
1466 /* If X is a register and we haven't made a quantity for it,
1467 something is wrong. */
1468 gcc_assert (!REG_P (x) || REGNO_QTY_VALID_P (REGNO (x)));
1470 /* If X is a hard register, show it is being put in the table. */
1471 if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER)
1473 unsigned int regno = REGNO (x);
1474 unsigned int endregno = regno + hard_regno_nregs[regno][GET_MODE (x)];
1475 unsigned int i;
1477 for (i = regno; i < endregno; i++)
1478 SET_HARD_REG_BIT (hard_regs_in_table, i);
1481 /* Put an element for X into the right hash bucket. */
1483 elt = free_element_chain;
1484 if (elt)
1485 free_element_chain = elt->next_same_hash;
1486 else
1488 n_elements_made++;
1489 elt = xmalloc (sizeof (struct table_elt));
1492 elt->exp = x;
1493 elt->canon_exp = NULL_RTX;
1494 elt->cost = COST (x);
1495 elt->regcost = approx_reg_cost (x);
1496 elt->next_same_value = 0;
1497 elt->prev_same_value = 0;
1498 elt->next_same_hash = table[hash];
1499 elt->prev_same_hash = 0;
1500 elt->related_value = 0;
1501 elt->in_memory = 0;
1502 elt->mode = mode;
1503 elt->is_const = (CONSTANT_P (x) || fixed_base_plus_p (x));
1505 if (table[hash])
1506 table[hash]->prev_same_hash = elt;
1507 table[hash] = elt;
1509 /* Put it into the proper value-class. */
1510 if (classp)
1512 classp = classp->first_same_value;
1513 if (CHEAPER (elt, classp))
1514 /* Insert at the head of the class. */
1516 struct table_elt *p;
1517 elt->next_same_value = classp;
1518 classp->prev_same_value = elt;
1519 elt->first_same_value = elt;
1521 for (p = classp; p; p = p->next_same_value)
1522 p->first_same_value = elt;
1524 else
1526 /* Insert not at head of the class. */
1527 /* Put it after the last element cheaper than X. */
1528 struct table_elt *p, *next;
1530 for (p = classp; (next = p->next_same_value) && CHEAPER (next, elt);
1531 p = next);
1533 /* Put it after P and before NEXT. */
1534 elt->next_same_value = next;
1535 if (next)
1536 next->prev_same_value = elt;
1538 elt->prev_same_value = p;
1539 p->next_same_value = elt;
1540 elt->first_same_value = classp;
1543 else
1544 elt->first_same_value = elt;
1546 /* If this is a constant being set equivalent to a register or a register
1547 being set equivalent to a constant, note the constant equivalence.
1549 If this is a constant, it cannot be equivalent to a different constant,
1550 and a constant is the only thing that can be cheaper than a register. So
1551 we know the register is the head of the class (before the constant was
1552 inserted).
1554 If this is a register that is not already known equivalent to a
1555 constant, we must check the entire class.
1557 If this is a register that is already known equivalent to an insn,
1558 update the qtys `const_insn' to show that `this_insn' is the latest
1559 insn making that quantity equivalent to the constant. */
1561 if (elt->is_const && classp && REG_P (classp->exp)
1562 && !REG_P (x))
1564 int exp_q = REG_QTY (REGNO (classp->exp));
1565 struct qty_table_elem *exp_ent = &qty_table[exp_q];
1567 exp_ent->const_rtx = gen_lowpart (exp_ent->mode, x);
1568 exp_ent->const_insn = this_insn;
1571 else if (REG_P (x)
1572 && classp
1573 && ! qty_table[REG_QTY (REGNO (x))].const_rtx
1574 && ! elt->is_const)
1576 struct table_elt *p;
1578 for (p = classp; p != 0; p = p->next_same_value)
1580 if (p->is_const && !REG_P (p->exp))
1582 int x_q = REG_QTY (REGNO (x));
1583 struct qty_table_elem *x_ent = &qty_table[x_q];
1585 x_ent->const_rtx
1586 = gen_lowpart (GET_MODE (x), p->exp);
1587 x_ent->const_insn = this_insn;
1588 break;
1593 else if (REG_P (x)
1594 && qty_table[REG_QTY (REGNO (x))].const_rtx
1595 && GET_MODE (x) == qty_table[REG_QTY (REGNO (x))].mode)
1596 qty_table[REG_QTY (REGNO (x))].const_insn = this_insn;
1598 /* If this is a constant with symbolic value,
1599 and it has a term with an explicit integer value,
1600 link it up with related expressions. */
1601 if (GET_CODE (x) == CONST)
1603 rtx subexp = get_related_value (x);
1604 unsigned subhash;
1605 struct table_elt *subelt, *subelt_prev;
1607 if (subexp != 0)
1609 /* Get the integer-free subexpression in the hash table. */
1610 subhash = SAFE_HASH (subexp, mode);
1611 subelt = lookup (subexp, subhash, mode);
1612 if (subelt == 0)
1613 subelt = insert (subexp, NULL, subhash, mode);
1614 /* Initialize SUBELT's circular chain if it has none. */
1615 if (subelt->related_value == 0)
1616 subelt->related_value = subelt;
1617 /* Find the element in the circular chain that precedes SUBELT. */
1618 subelt_prev = subelt;
1619 while (subelt_prev->related_value != subelt)
1620 subelt_prev = subelt_prev->related_value;
1621 /* Put new ELT into SUBELT's circular chain just before SUBELT.
1622 This way the element that follows SUBELT is the oldest one. */
1623 elt->related_value = subelt_prev->related_value;
1624 subelt_prev->related_value = elt;
1628 return elt;
1631 /* Given two equivalence classes, CLASS1 and CLASS2, put all the entries from
1632 CLASS2 into CLASS1. This is done when we have reached an insn which makes
1633 the two classes equivalent.
1635 CLASS1 will be the surviving class; CLASS2 should not be used after this
1636 call.
1638 Any invalid entries in CLASS2 will not be copied. */
1640 static void
1641 merge_equiv_classes (struct table_elt *class1, struct table_elt *class2)
1643 struct table_elt *elt, *next, *new;
1645 /* Ensure we start with the head of the classes. */
1646 class1 = class1->first_same_value;
1647 class2 = class2->first_same_value;
1649 /* If they were already equal, forget it. */
1650 if (class1 == class2)
1651 return;
1653 for (elt = class2; elt; elt = next)
1655 unsigned int hash;
1656 rtx exp = elt->exp;
1657 enum machine_mode mode = elt->mode;
1659 next = elt->next_same_value;
1661 /* Remove old entry, make a new one in CLASS1's class.
1662 Don't do this for invalid entries as we cannot find their
1663 hash code (it also isn't necessary). */
1664 if (REG_P (exp) || exp_equiv_p (exp, exp, 1, false))
1666 bool need_rehash = false;
1668 hash_arg_in_memory = 0;
1669 hash = HASH (exp, mode);
1671 if (REG_P (exp))
1673 need_rehash = REGNO_QTY_VALID_P (REGNO (exp));
1674 delete_reg_equiv (REGNO (exp));
1677 remove_from_table (elt, hash);
1679 if (insert_regs (exp, class1, 0) || need_rehash)
1681 rehash_using_reg (exp);
1682 hash = HASH (exp, mode);
1684 new = insert (exp, class1, hash, mode);
1685 new->in_memory = hash_arg_in_memory;
1690 /* Flush the entire hash table. */
1692 static void
1693 flush_hash_table (void)
1695 int i;
1696 struct table_elt *p;
1698 for (i = 0; i < HASH_SIZE; i++)
1699 for (p = table[i]; p; p = table[i])
1701 /* Note that invalidate can remove elements
1702 after P in the current hash chain. */
1703 if (REG_P (p->exp))
1704 invalidate (p->exp, p->mode);
1705 else
1706 remove_from_table (p, i);
1710 /* Function called for each rtx to check whether true dependence exist. */
1711 struct check_dependence_data
1713 enum machine_mode mode;
1714 rtx exp;
1715 rtx addr;
1718 static int
1719 check_dependence (rtx *x, void *data)
1721 struct check_dependence_data *d = (struct check_dependence_data *) data;
1722 if (*x && MEM_P (*x))
1723 return canon_true_dependence (d->exp, d->mode, d->addr, *x,
1724 cse_rtx_varies_p);
1725 else
1726 return 0;
1729 /* Remove from the hash table, or mark as invalid, all expressions whose
1730 values could be altered by storing in X. X is a register, a subreg, or
1731 a memory reference with nonvarying address (because, when a memory
1732 reference with a varying address is stored in, all memory references are
1733 removed by invalidate_memory so specific invalidation is superfluous).
1734 FULL_MODE, if not VOIDmode, indicates that this much should be
1735 invalidated instead of just the amount indicated by the mode of X. This
1736 is only used for bitfield stores into memory.
1738 A nonvarying address may be just a register or just a symbol reference,
1739 or it may be either of those plus a numeric offset. */
1741 static void
1742 invalidate (rtx x, enum machine_mode full_mode)
1744 int i;
1745 struct table_elt *p;
1746 rtx addr;
1748 switch (GET_CODE (x))
1750 case REG:
1752 /* If X is a register, dependencies on its contents are recorded
1753 through the qty number mechanism. Just change the qty number of
1754 the register, mark it as invalid for expressions that refer to it,
1755 and remove it itself. */
1756 unsigned int regno = REGNO (x);
1757 unsigned int hash = HASH (x, GET_MODE (x));
1759 /* Remove REGNO from any quantity list it might be on and indicate
1760 that its value might have changed. If it is a pseudo, remove its
1761 entry from the hash table.
1763 For a hard register, we do the first two actions above for any
1764 additional hard registers corresponding to X. Then, if any of these
1765 registers are in the table, we must remove any REG entries that
1766 overlap these registers. */
1768 delete_reg_equiv (regno);
1769 REG_TICK (regno)++;
1770 SUBREG_TICKED (regno) = -1;
1772 if (regno >= FIRST_PSEUDO_REGISTER)
1774 /* Because a register can be referenced in more than one mode,
1775 we might have to remove more than one table entry. */
1776 struct table_elt *elt;
1778 while ((elt = lookup_for_remove (x, hash, GET_MODE (x))))
1779 remove_from_table (elt, hash);
1781 else
1783 HOST_WIDE_INT in_table
1784 = TEST_HARD_REG_BIT (hard_regs_in_table, regno);
1785 unsigned int endregno
1786 = regno + hard_regno_nregs[regno][GET_MODE (x)];
1787 unsigned int tregno, tendregno, rn;
1788 struct table_elt *p, *next;
1790 CLEAR_HARD_REG_BIT (hard_regs_in_table, regno);
1792 for (rn = regno + 1; rn < endregno; rn++)
1794 in_table |= TEST_HARD_REG_BIT (hard_regs_in_table, rn);
1795 CLEAR_HARD_REG_BIT (hard_regs_in_table, rn);
1796 delete_reg_equiv (rn);
1797 REG_TICK (rn)++;
1798 SUBREG_TICKED (rn) = -1;
1801 if (in_table)
1802 for (hash = 0; hash < HASH_SIZE; hash++)
1803 for (p = table[hash]; p; p = next)
1805 next = p->next_same_hash;
1807 if (!REG_P (p->exp)
1808 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
1809 continue;
1811 tregno = REGNO (p->exp);
1812 tendregno
1813 = tregno + hard_regno_nregs[tregno][GET_MODE (p->exp)];
1814 if (tendregno > regno && tregno < endregno)
1815 remove_from_table (p, hash);
1819 return;
1821 case SUBREG:
1822 invalidate (SUBREG_REG (x), VOIDmode);
1823 return;
1825 case PARALLEL:
1826 for (i = XVECLEN (x, 0) - 1; i >= 0; --i)
1827 invalidate (XVECEXP (x, 0, i), VOIDmode);
1828 return;
1830 case EXPR_LIST:
1831 /* This is part of a disjoint return value; extract the location in
1832 question ignoring the offset. */
1833 invalidate (XEXP (x, 0), VOIDmode);
1834 return;
1836 case MEM:
1837 addr = canon_rtx (get_addr (XEXP (x, 0)));
1838 /* Calculate the canonical version of X here so that
1839 true_dependence doesn't generate new RTL for X on each call. */
1840 x = canon_rtx (x);
1842 /* Remove all hash table elements that refer to overlapping pieces of
1843 memory. */
1844 if (full_mode == VOIDmode)
1845 full_mode = GET_MODE (x);
1847 for (i = 0; i < HASH_SIZE; i++)
1849 struct table_elt *next;
1851 for (p = table[i]; p; p = next)
1853 next = p->next_same_hash;
1854 if (p->in_memory)
1856 struct check_dependence_data d;
1858 /* Just canonicalize the expression once;
1859 otherwise each time we call invalidate
1860 true_dependence will canonicalize the
1861 expression again. */
1862 if (!p->canon_exp)
1863 p->canon_exp = canon_rtx (p->exp);
1864 d.exp = x;
1865 d.addr = addr;
1866 d.mode = full_mode;
1867 if (for_each_rtx (&p->canon_exp, check_dependence, &d))
1868 remove_from_table (p, i);
1872 return;
1874 default:
1875 gcc_unreachable ();
1879 /* Remove all expressions that refer to register REGNO,
1880 since they are already invalid, and we are about to
1881 mark that register valid again and don't want the old
1882 expressions to reappear as valid. */
1884 static void
1885 remove_invalid_refs (unsigned int regno)
1887 unsigned int i;
1888 struct table_elt *p, *next;
1890 for (i = 0; i < HASH_SIZE; i++)
1891 for (p = table[i]; p; p = next)
1893 next = p->next_same_hash;
1894 if (!REG_P (p->exp)
1895 && refers_to_regno_p (regno, regno + 1, p->exp, (rtx *) 0))
1896 remove_from_table (p, i);
1900 /* Likewise for a subreg with subreg_reg REGNO, subreg_byte OFFSET,
1901 and mode MODE. */
1902 static void
1903 remove_invalid_subreg_refs (unsigned int regno, unsigned int offset,
1904 enum machine_mode mode)
1906 unsigned int i;
1907 struct table_elt *p, *next;
1908 unsigned int end = offset + (GET_MODE_SIZE (mode) - 1);
1910 for (i = 0; i < HASH_SIZE; i++)
1911 for (p = table[i]; p; p = next)
1913 rtx exp = p->exp;
1914 next = p->next_same_hash;
1916 if (!REG_P (exp)
1917 && (GET_CODE (exp) != SUBREG
1918 || !REG_P (SUBREG_REG (exp))
1919 || REGNO (SUBREG_REG (exp)) != regno
1920 || (((SUBREG_BYTE (exp)
1921 + (GET_MODE_SIZE (GET_MODE (exp)) - 1)) >= offset)
1922 && SUBREG_BYTE (exp) <= end))
1923 && refers_to_regno_p (regno, regno + 1, p->exp, (rtx *) 0))
1924 remove_from_table (p, i);
1928 /* Recompute the hash codes of any valid entries in the hash table that
1929 reference X, if X is a register, or SUBREG_REG (X) if X is a SUBREG.
1931 This is called when we make a jump equivalence. */
1933 static void
1934 rehash_using_reg (rtx x)
1936 unsigned int i;
1937 struct table_elt *p, *next;
1938 unsigned hash;
1940 if (GET_CODE (x) == SUBREG)
1941 x = SUBREG_REG (x);
1943 /* If X is not a register or if the register is known not to be in any
1944 valid entries in the table, we have no work to do. */
1946 if (!REG_P (x)
1947 || REG_IN_TABLE (REGNO (x)) < 0
1948 || REG_IN_TABLE (REGNO (x)) != REG_TICK (REGNO (x)))
1949 return;
1951 /* Scan all hash chains looking for valid entries that mention X.
1952 If we find one and it is in the wrong hash chain, move it. */
1954 for (i = 0; i < HASH_SIZE; i++)
1955 for (p = table[i]; p; p = next)
1957 next = p->next_same_hash;
1958 if (reg_mentioned_p (x, p->exp)
1959 && exp_equiv_p (p->exp, p->exp, 1, false)
1960 && i != (hash = SAFE_HASH (p->exp, p->mode)))
1962 if (p->next_same_hash)
1963 p->next_same_hash->prev_same_hash = p->prev_same_hash;
1965 if (p->prev_same_hash)
1966 p->prev_same_hash->next_same_hash = p->next_same_hash;
1967 else
1968 table[i] = p->next_same_hash;
1970 p->next_same_hash = table[hash];
1971 p->prev_same_hash = 0;
1972 if (table[hash])
1973 table[hash]->prev_same_hash = p;
1974 table[hash] = p;
1979 /* Remove from the hash table any expression that is a call-clobbered
1980 register. Also update their TICK values. */
1982 static void
1983 invalidate_for_call (void)
1985 unsigned int regno, endregno;
1986 unsigned int i;
1987 unsigned hash;
1988 struct table_elt *p, *next;
1989 int in_table = 0;
1991 /* Go through all the hard registers. For each that is clobbered in
1992 a CALL_INSN, remove the register from quantity chains and update
1993 reg_tick if defined. Also see if any of these registers is currently
1994 in the table. */
1996 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
1997 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, regno))
1999 delete_reg_equiv (regno);
2000 if (REG_TICK (regno) >= 0)
2002 REG_TICK (regno)++;
2003 SUBREG_TICKED (regno) = -1;
2006 in_table |= (TEST_HARD_REG_BIT (hard_regs_in_table, regno) != 0);
2009 /* In the case where we have no call-clobbered hard registers in the
2010 table, we are done. Otherwise, scan the table and remove any
2011 entry that overlaps a call-clobbered register. */
2013 if (in_table)
2014 for (hash = 0; hash < HASH_SIZE; hash++)
2015 for (p = table[hash]; p; p = next)
2017 next = p->next_same_hash;
2019 if (!REG_P (p->exp)
2020 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
2021 continue;
2023 regno = REGNO (p->exp);
2024 endregno = regno + hard_regno_nregs[regno][GET_MODE (p->exp)];
2026 for (i = regno; i < endregno; i++)
2027 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i))
2029 remove_from_table (p, hash);
2030 break;
2035 /* Given an expression X of type CONST,
2036 and ELT which is its table entry (or 0 if it
2037 is not in the hash table),
2038 return an alternate expression for X as a register plus integer.
2039 If none can be found, return 0. */
2041 static rtx
2042 use_related_value (rtx x, struct table_elt *elt)
2044 struct table_elt *relt = 0;
2045 struct table_elt *p, *q;
2046 HOST_WIDE_INT offset;
2048 /* First, is there anything related known?
2049 If we have a table element, we can tell from that.
2050 Otherwise, must look it up. */
2052 if (elt != 0 && elt->related_value != 0)
2053 relt = elt;
2054 else if (elt == 0 && GET_CODE (x) == CONST)
2056 rtx subexp = get_related_value (x);
2057 if (subexp != 0)
2058 relt = lookup (subexp,
2059 SAFE_HASH (subexp, GET_MODE (subexp)),
2060 GET_MODE (subexp));
2063 if (relt == 0)
2064 return 0;
2066 /* Search all related table entries for one that has an
2067 equivalent register. */
2069 p = relt;
2070 while (1)
2072 /* This loop is strange in that it is executed in two different cases.
2073 The first is when X is already in the table. Then it is searching
2074 the RELATED_VALUE list of X's class (RELT). The second case is when
2075 X is not in the table. Then RELT points to a class for the related
2076 value.
2078 Ensure that, whatever case we are in, that we ignore classes that have
2079 the same value as X. */
2081 if (rtx_equal_p (x, p->exp))
2082 q = 0;
2083 else
2084 for (q = p->first_same_value; q; q = q->next_same_value)
2085 if (REG_P (q->exp))
2086 break;
2088 if (q)
2089 break;
2091 p = p->related_value;
2093 /* We went all the way around, so there is nothing to be found.
2094 Alternatively, perhaps RELT was in the table for some other reason
2095 and it has no related values recorded. */
2096 if (p == relt || p == 0)
2097 break;
2100 if (q == 0)
2101 return 0;
2103 offset = (get_integer_term (x) - get_integer_term (p->exp));
2104 /* Note: OFFSET may be 0 if P->xexp and X are related by commutativity. */
2105 return plus_constant (q->exp, offset);
2108 /* Hash a string. Just add its bytes up. */
2109 static inline unsigned
2110 hash_rtx_string (const char *ps)
2112 unsigned hash = 0;
2113 const unsigned char *p = (const unsigned char *) ps;
2115 if (p)
2116 while (*p)
2117 hash += *p++;
2119 return hash;
2122 /* Hash an rtx. We are careful to make sure the value is never negative.
2123 Equivalent registers hash identically.
2124 MODE is used in hashing for CONST_INTs only;
2125 otherwise the mode of X is used.
2127 Store 1 in DO_NOT_RECORD_P if any subexpression is volatile.
2129 If HASH_ARG_IN_MEMORY_P is not NULL, store 1 in it if X contains
2130 a MEM rtx which does not have the RTX_UNCHANGING_P bit set.
2132 Note that cse_insn knows that the hash code of a MEM expression
2133 is just (int) MEM plus the hash code of the address. */
2135 unsigned
2136 hash_rtx (rtx x, enum machine_mode mode, int *do_not_record_p,
2137 int *hash_arg_in_memory_p, bool have_reg_qty)
2139 int i, j;
2140 unsigned hash = 0;
2141 enum rtx_code code;
2142 const char *fmt;
2144 /* Used to turn recursion into iteration. We can't rely on GCC's
2145 tail-recursion elimination since we need to keep accumulating values
2146 in HASH. */
2147 repeat:
2148 if (x == 0)
2149 return hash;
2151 code = GET_CODE (x);
2152 switch (code)
2154 case REG:
2156 unsigned int regno = REGNO (x);
2158 if (!reload_completed)
2160 /* On some machines, we can't record any non-fixed hard register,
2161 because extending its life will cause reload problems. We
2162 consider ap, fp, sp, gp to be fixed for this purpose.
2164 We also consider CCmode registers to be fixed for this purpose;
2165 failure to do so leads to failure to simplify 0<100 type of
2166 conditionals.
2168 On all machines, we can't record any global registers.
2169 Nor should we record any register that is in a small
2170 class, as defined by CLASS_LIKELY_SPILLED_P. */
2171 bool record;
2173 if (regno >= FIRST_PSEUDO_REGISTER)
2174 record = true;
2175 else if (x == frame_pointer_rtx
2176 || x == hard_frame_pointer_rtx
2177 || x == arg_pointer_rtx
2178 || x == stack_pointer_rtx
2179 || x == pic_offset_table_rtx)
2180 record = true;
2181 else if (global_regs[regno])
2182 record = false;
2183 else if (fixed_regs[regno])
2184 record = true;
2185 else if (GET_MODE_CLASS (GET_MODE (x)) == MODE_CC)
2186 record = true;
2187 else if (SMALL_REGISTER_CLASSES)
2188 record = false;
2189 else if (CLASS_LIKELY_SPILLED_P (REGNO_REG_CLASS (regno)))
2190 record = false;
2191 else
2192 record = true;
2194 if (!record)
2196 *do_not_record_p = 1;
2197 return 0;
2201 hash += ((unsigned int) REG << 7);
2202 hash += (have_reg_qty ? (unsigned) REG_QTY (regno) : regno);
2203 return hash;
2206 /* We handle SUBREG of a REG specially because the underlying
2207 reg changes its hash value with every value change; we don't
2208 want to have to forget unrelated subregs when one subreg changes. */
2209 case SUBREG:
2211 if (REG_P (SUBREG_REG (x)))
2213 hash += (((unsigned int) SUBREG << 7)
2214 + REGNO (SUBREG_REG (x))
2215 + (SUBREG_BYTE (x) / UNITS_PER_WORD));
2216 return hash;
2218 break;
2221 case CONST_INT:
2222 hash += (((unsigned int) CONST_INT << 7) + (unsigned int) mode
2223 + (unsigned int) INTVAL (x));
2224 return hash;
2226 case CONST_DOUBLE:
2227 /* This is like the general case, except that it only counts
2228 the integers representing the constant. */
2229 hash += (unsigned int) code + (unsigned int) GET_MODE (x);
2230 if (GET_MODE (x) != VOIDmode)
2231 hash += real_hash (CONST_DOUBLE_REAL_VALUE (x));
2232 else
2233 hash += ((unsigned int) CONST_DOUBLE_LOW (x)
2234 + (unsigned int) CONST_DOUBLE_HIGH (x));
2235 return hash;
2237 case CONST_VECTOR:
2239 int units;
2240 rtx elt;
2242 units = CONST_VECTOR_NUNITS (x);
2244 for (i = 0; i < units; ++i)
2246 elt = CONST_VECTOR_ELT (x, i);
2247 hash += hash_rtx (elt, GET_MODE (elt), do_not_record_p,
2248 hash_arg_in_memory_p, have_reg_qty);
2251 return hash;
2254 /* Assume there is only one rtx object for any given label. */
2255 case LABEL_REF:
2256 /* We don't hash on the address of the CODE_LABEL to avoid bootstrap
2257 differences and differences between each stage's debugging dumps. */
2258 hash += (((unsigned int) LABEL_REF << 7)
2259 + CODE_LABEL_NUMBER (XEXP (x, 0)));
2260 return hash;
2262 case SYMBOL_REF:
2264 /* Don't hash on the symbol's address to avoid bootstrap differences.
2265 Different hash values may cause expressions to be recorded in
2266 different orders and thus different registers to be used in the
2267 final assembler. This also avoids differences in the dump files
2268 between various stages. */
2269 unsigned int h = 0;
2270 const unsigned char *p = (const unsigned char *) XSTR (x, 0);
2272 while (*p)
2273 h += (h << 7) + *p++; /* ??? revisit */
2275 hash += ((unsigned int) SYMBOL_REF << 7) + h;
2276 return hash;
2279 case MEM:
2280 /* We don't record if marked volatile or if BLKmode since we don't
2281 know the size of the move. */
2282 if (MEM_VOLATILE_P (x) || GET_MODE (x) == BLKmode)
2284 *do_not_record_p = 1;
2285 return 0;
2287 if (hash_arg_in_memory_p && !MEM_READONLY_P (x))
2288 *hash_arg_in_memory_p = 1;
2290 /* Now that we have already found this special case,
2291 might as well speed it up as much as possible. */
2292 hash += (unsigned) MEM;
2293 x = XEXP (x, 0);
2294 goto repeat;
2296 case USE:
2297 /* A USE that mentions non-volatile memory needs special
2298 handling since the MEM may be BLKmode which normally
2299 prevents an entry from being made. Pure calls are
2300 marked by a USE which mentions BLKmode memory.
2301 See calls.c:emit_call_1. */
2302 if (MEM_P (XEXP (x, 0))
2303 && ! MEM_VOLATILE_P (XEXP (x, 0)))
2305 hash += (unsigned) USE;
2306 x = XEXP (x, 0);
2308 if (hash_arg_in_memory_p && !MEM_READONLY_P (x))
2309 *hash_arg_in_memory_p = 1;
2311 /* Now that we have already found this special case,
2312 might as well speed it up as much as possible. */
2313 hash += (unsigned) MEM;
2314 x = XEXP (x, 0);
2315 goto repeat;
2317 break;
2319 case PRE_DEC:
2320 case PRE_INC:
2321 case POST_DEC:
2322 case POST_INC:
2323 case PRE_MODIFY:
2324 case POST_MODIFY:
2325 case PC:
2326 case CC0:
2327 case CALL:
2328 case UNSPEC_VOLATILE:
2329 *do_not_record_p = 1;
2330 return 0;
2332 case ASM_OPERANDS:
2333 if (MEM_VOLATILE_P (x))
2335 *do_not_record_p = 1;
2336 return 0;
2338 else
2340 /* We don't want to take the filename and line into account. */
2341 hash += (unsigned) code + (unsigned) GET_MODE (x)
2342 + hash_rtx_string (ASM_OPERANDS_TEMPLATE (x))
2343 + hash_rtx_string (ASM_OPERANDS_OUTPUT_CONSTRAINT (x))
2344 + (unsigned) ASM_OPERANDS_OUTPUT_IDX (x);
2346 if (ASM_OPERANDS_INPUT_LENGTH (x))
2348 for (i = 1; i < ASM_OPERANDS_INPUT_LENGTH (x); i++)
2350 hash += (hash_rtx (ASM_OPERANDS_INPUT (x, i),
2351 GET_MODE (ASM_OPERANDS_INPUT (x, i)),
2352 do_not_record_p, hash_arg_in_memory_p,
2353 have_reg_qty)
2354 + hash_rtx_string
2355 (ASM_OPERANDS_INPUT_CONSTRAINT (x, i)));
2358 hash += hash_rtx_string (ASM_OPERANDS_INPUT_CONSTRAINT (x, 0));
2359 x = ASM_OPERANDS_INPUT (x, 0);
2360 mode = GET_MODE (x);
2361 goto repeat;
2364 return hash;
2366 break;
2368 default:
2369 break;
2372 i = GET_RTX_LENGTH (code) - 1;
2373 hash += (unsigned) code + (unsigned) GET_MODE (x);
2374 fmt = GET_RTX_FORMAT (code);
2375 for (; i >= 0; i--)
2377 switch (fmt[i])
2379 case 'e':
2380 /* If we are about to do the last recursive call
2381 needed at this level, change it into iteration.
2382 This function is called enough to be worth it. */
2383 if (i == 0)
2385 x = XEXP (x, i);
2386 goto repeat;
2389 hash += hash_rtx (XEXP (x, i), 0, do_not_record_p,
2390 hash_arg_in_memory_p, have_reg_qty);
2391 break;
2393 case 'E':
2394 for (j = 0; j < XVECLEN (x, i); j++)
2395 hash += hash_rtx (XVECEXP (x, i, j), 0, do_not_record_p,
2396 hash_arg_in_memory_p, have_reg_qty);
2397 break;
2399 case 's':
2400 hash += hash_rtx_string (XSTR (x, i));
2401 break;
2403 case 'i':
2404 hash += (unsigned int) XINT (x, i);
2405 break;
2407 case '0': case 't':
2408 /* Unused. */
2409 break;
2411 default:
2412 gcc_unreachable ();
2416 return hash;
2419 /* Hash an rtx X for cse via hash_rtx.
2420 Stores 1 in do_not_record if any subexpression is volatile.
2421 Stores 1 in hash_arg_in_memory if X contains a mem rtx which
2422 does not have the RTX_UNCHANGING_P bit set. */
2424 static inline unsigned
2425 canon_hash (rtx x, enum machine_mode mode)
2427 return hash_rtx (x, mode, &do_not_record, &hash_arg_in_memory, true);
2430 /* Like canon_hash but with no side effects, i.e. do_not_record
2431 and hash_arg_in_memory are not changed. */
2433 static inline unsigned
2434 safe_hash (rtx x, enum machine_mode mode)
2436 int dummy_do_not_record;
2437 return hash_rtx (x, mode, &dummy_do_not_record, NULL, true);
2440 /* Return 1 iff X and Y would canonicalize into the same thing,
2441 without actually constructing the canonicalization of either one.
2442 If VALIDATE is nonzero,
2443 we assume X is an expression being processed from the rtl
2444 and Y was found in the hash table. We check register refs
2445 in Y for being marked as valid.
2447 If FOR_GCSE is true, we compare X and Y for equivalence for GCSE. */
2450 exp_equiv_p (rtx x, rtx y, int validate, bool for_gcse)
2452 int i, j;
2453 enum rtx_code code;
2454 const char *fmt;
2456 /* Note: it is incorrect to assume an expression is equivalent to itself
2457 if VALIDATE is nonzero. */
2458 if (x == y && !validate)
2459 return 1;
2461 if (x == 0 || y == 0)
2462 return x == y;
2464 code = GET_CODE (x);
2465 if (code != GET_CODE (y))
2466 return 0;
2468 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent. */
2469 if (GET_MODE (x) != GET_MODE (y))
2470 return 0;
2472 switch (code)
2474 case PC:
2475 case CC0:
2476 case CONST_INT:
2477 return x == y;
2479 case LABEL_REF:
2480 return XEXP (x, 0) == XEXP (y, 0);
2482 case SYMBOL_REF:
2483 return XSTR (x, 0) == XSTR (y, 0);
2485 case REG:
2486 if (for_gcse)
2487 return REGNO (x) == REGNO (y);
2488 else
2490 unsigned int regno = REGNO (y);
2491 unsigned int i;
2492 unsigned int endregno
2493 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
2494 : hard_regno_nregs[regno][GET_MODE (y)]);
2496 /* If the quantities are not the same, the expressions are not
2497 equivalent. If there are and we are not to validate, they
2498 are equivalent. Otherwise, ensure all regs are up-to-date. */
2500 if (REG_QTY (REGNO (x)) != REG_QTY (regno))
2501 return 0;
2503 if (! validate)
2504 return 1;
2506 for (i = regno; i < endregno; i++)
2507 if (REG_IN_TABLE (i) != REG_TICK (i))
2508 return 0;
2510 return 1;
2513 case MEM:
2514 if (for_gcse)
2516 /* Can't merge two expressions in different alias sets, since we
2517 can decide that the expression is transparent in a block when
2518 it isn't, due to it being set with the different alias set. */
2519 if (MEM_ALIAS_SET (x) != MEM_ALIAS_SET (y))
2520 return 0;
2522 /* A volatile mem should not be considered equivalent to any
2523 other. */
2524 if (MEM_VOLATILE_P (x) || MEM_VOLATILE_P (y))
2525 return 0;
2527 break;
2529 /* For commutative operations, check both orders. */
2530 case PLUS:
2531 case MULT:
2532 case AND:
2533 case IOR:
2534 case XOR:
2535 case NE:
2536 case EQ:
2537 return ((exp_equiv_p (XEXP (x, 0), XEXP (y, 0),
2538 validate, for_gcse)
2539 && exp_equiv_p (XEXP (x, 1), XEXP (y, 1),
2540 validate, for_gcse))
2541 || (exp_equiv_p (XEXP (x, 0), XEXP (y, 1),
2542 validate, for_gcse)
2543 && exp_equiv_p (XEXP (x, 1), XEXP (y, 0),
2544 validate, for_gcse)));
2546 case ASM_OPERANDS:
2547 /* We don't use the generic code below because we want to
2548 disregard filename and line numbers. */
2550 /* A volatile asm isn't equivalent to any other. */
2551 if (MEM_VOLATILE_P (x) || MEM_VOLATILE_P (y))
2552 return 0;
2554 if (GET_MODE (x) != GET_MODE (y)
2555 || strcmp (ASM_OPERANDS_TEMPLATE (x), ASM_OPERANDS_TEMPLATE (y))
2556 || strcmp (ASM_OPERANDS_OUTPUT_CONSTRAINT (x),
2557 ASM_OPERANDS_OUTPUT_CONSTRAINT (y))
2558 || ASM_OPERANDS_OUTPUT_IDX (x) != ASM_OPERANDS_OUTPUT_IDX (y)
2559 || ASM_OPERANDS_INPUT_LENGTH (x) != ASM_OPERANDS_INPUT_LENGTH (y))
2560 return 0;
2562 if (ASM_OPERANDS_INPUT_LENGTH (x))
2564 for (i = ASM_OPERANDS_INPUT_LENGTH (x) - 1; i >= 0; i--)
2565 if (! exp_equiv_p (ASM_OPERANDS_INPUT (x, i),
2566 ASM_OPERANDS_INPUT (y, i),
2567 validate, for_gcse)
2568 || strcmp (ASM_OPERANDS_INPUT_CONSTRAINT (x, i),
2569 ASM_OPERANDS_INPUT_CONSTRAINT (y, i)))
2570 return 0;
2573 return 1;
2575 default:
2576 break;
2579 /* Compare the elements. If any pair of corresponding elements
2580 fail to match, return 0 for the whole thing. */
2582 fmt = GET_RTX_FORMAT (code);
2583 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2585 switch (fmt[i])
2587 case 'e':
2588 if (! exp_equiv_p (XEXP (x, i), XEXP (y, i),
2589 validate, for_gcse))
2590 return 0;
2591 break;
2593 case 'E':
2594 if (XVECLEN (x, i) != XVECLEN (y, i))
2595 return 0;
2596 for (j = 0; j < XVECLEN (x, i); j++)
2597 if (! exp_equiv_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
2598 validate, for_gcse))
2599 return 0;
2600 break;
2602 case 's':
2603 if (strcmp (XSTR (x, i), XSTR (y, i)))
2604 return 0;
2605 break;
2607 case 'i':
2608 if (XINT (x, i) != XINT (y, i))
2609 return 0;
2610 break;
2612 case 'w':
2613 if (XWINT (x, i) != XWINT (y, i))
2614 return 0;
2615 break;
2617 case '0':
2618 case 't':
2619 break;
2621 default:
2622 gcc_unreachable ();
2626 return 1;
2629 /* Return 1 if X has a value that can vary even between two
2630 executions of the program. 0 means X can be compared reliably
2631 against certain constants or near-constants. */
2633 static int
2634 cse_rtx_varies_p (rtx x, int from_alias)
2636 /* We need not check for X and the equivalence class being of the same
2637 mode because if X is equivalent to a constant in some mode, it
2638 doesn't vary in any mode. */
2640 if (REG_P (x)
2641 && REGNO_QTY_VALID_P (REGNO (x)))
2643 int x_q = REG_QTY (REGNO (x));
2644 struct qty_table_elem *x_ent = &qty_table[x_q];
2646 if (GET_MODE (x) == x_ent->mode
2647 && x_ent->const_rtx != NULL_RTX)
2648 return 0;
2651 if (GET_CODE (x) == PLUS
2652 && GET_CODE (XEXP (x, 1)) == CONST_INT
2653 && REG_P (XEXP (x, 0))
2654 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 0))))
2656 int x0_q = REG_QTY (REGNO (XEXP (x, 0)));
2657 struct qty_table_elem *x0_ent = &qty_table[x0_q];
2659 if ((GET_MODE (XEXP (x, 0)) == x0_ent->mode)
2660 && x0_ent->const_rtx != NULL_RTX)
2661 return 0;
2664 /* This can happen as the result of virtual register instantiation, if
2665 the initial constant is too large to be a valid address. This gives
2666 us a three instruction sequence, load large offset into a register,
2667 load fp minus a constant into a register, then a MEM which is the
2668 sum of the two `constant' registers. */
2669 if (GET_CODE (x) == PLUS
2670 && REG_P (XEXP (x, 0))
2671 && REG_P (XEXP (x, 1))
2672 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 0)))
2673 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 1))))
2675 int x0_q = REG_QTY (REGNO (XEXP (x, 0)));
2676 int x1_q = REG_QTY (REGNO (XEXP (x, 1)));
2677 struct qty_table_elem *x0_ent = &qty_table[x0_q];
2678 struct qty_table_elem *x1_ent = &qty_table[x1_q];
2680 if ((GET_MODE (XEXP (x, 0)) == x0_ent->mode)
2681 && x0_ent->const_rtx != NULL_RTX
2682 && (GET_MODE (XEXP (x, 1)) == x1_ent->mode)
2683 && x1_ent->const_rtx != NULL_RTX)
2684 return 0;
2687 return rtx_varies_p (x, from_alias);
2690 /* Subroutine of canon_reg. Pass *XLOC through canon_reg, and validate
2691 the result if necessary. INSN is as for canon_reg. */
2693 static void
2694 validate_canon_reg (rtx *xloc, rtx insn)
2696 rtx new = canon_reg (*xloc, insn);
2697 int insn_code;
2699 /* If replacing pseudo with hard reg or vice versa, ensure the
2700 insn remains valid. Likewise if the insn has MATCH_DUPs. */
2701 if (insn != 0 && new != 0
2702 && REG_P (new) && REG_P (*xloc)
2703 && (((REGNO (new) < FIRST_PSEUDO_REGISTER)
2704 != (REGNO (*xloc) < FIRST_PSEUDO_REGISTER))
2705 || GET_MODE (new) != GET_MODE (*xloc)
2706 || (insn_code = recog_memoized (insn)) < 0
2707 || insn_data[insn_code].n_dups > 0))
2708 validate_change (insn, xloc, new, 1);
2709 else
2710 *xloc = new;
2713 /* Canonicalize an expression:
2714 replace each register reference inside it
2715 with the "oldest" equivalent register.
2717 If INSN is nonzero and we are replacing a pseudo with a hard register
2718 or vice versa, validate_change is used to ensure that INSN remains valid
2719 after we make our substitution. The calls are made with IN_GROUP nonzero
2720 so apply_change_group must be called upon the outermost return from this
2721 function (unless INSN is zero). The result of apply_change_group can
2722 generally be discarded since the changes we are making are optional. */
2724 static rtx
2725 canon_reg (rtx x, rtx insn)
2727 int i;
2728 enum rtx_code code;
2729 const char *fmt;
2731 if (x == 0)
2732 return x;
2734 code = GET_CODE (x);
2735 switch (code)
2737 case PC:
2738 case CC0:
2739 case CONST:
2740 case CONST_INT:
2741 case CONST_DOUBLE:
2742 case CONST_VECTOR:
2743 case SYMBOL_REF:
2744 case LABEL_REF:
2745 case ADDR_VEC:
2746 case ADDR_DIFF_VEC:
2747 return x;
2749 case REG:
2751 int first;
2752 int q;
2753 struct qty_table_elem *ent;
2755 /* Never replace a hard reg, because hard regs can appear
2756 in more than one machine mode, and we must preserve the mode
2757 of each occurrence. Also, some hard regs appear in
2758 MEMs that are shared and mustn't be altered. Don't try to
2759 replace any reg that maps to a reg of class NO_REGS. */
2760 if (REGNO (x) < FIRST_PSEUDO_REGISTER
2761 || ! REGNO_QTY_VALID_P (REGNO (x)))
2762 return x;
2764 q = REG_QTY (REGNO (x));
2765 ent = &qty_table[q];
2766 first = ent->first_reg;
2767 return (first >= FIRST_PSEUDO_REGISTER ? regno_reg_rtx[first]
2768 : REGNO_REG_CLASS (first) == NO_REGS ? x
2769 : gen_rtx_REG (ent->mode, first));
2772 default:
2773 break;
2776 fmt = GET_RTX_FORMAT (code);
2777 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2779 int j;
2781 if (fmt[i] == 'e')
2782 validate_canon_reg (&XEXP (x, i), insn);
2783 else if (fmt[i] == 'E')
2784 for (j = 0; j < XVECLEN (x, i); j++)
2785 validate_canon_reg (&XVECEXP (x, i, j), insn);
2788 return x;
2791 /* LOC is a location within INSN that is an operand address (the contents of
2792 a MEM). Find the best equivalent address to use that is valid for this
2793 insn.
2795 On most CISC machines, complicated address modes are costly, and rtx_cost
2796 is a good approximation for that cost. However, most RISC machines have
2797 only a few (usually only one) memory reference formats. If an address is
2798 valid at all, it is often just as cheap as any other address. Hence, for
2799 RISC machines, we use `address_cost' to compare the costs of various
2800 addresses. For two addresses of equal cost, choose the one with the
2801 highest `rtx_cost' value as that has the potential of eliminating the
2802 most insns. For equal costs, we choose the first in the equivalence
2803 class. Note that we ignore the fact that pseudo registers are cheaper than
2804 hard registers here because we would also prefer the pseudo registers. */
2806 static void
2807 find_best_addr (rtx insn, rtx *loc, enum machine_mode mode)
2809 struct table_elt *elt;
2810 rtx addr = *loc;
2811 struct table_elt *p;
2812 int found_better = 1;
2813 int save_do_not_record = do_not_record;
2814 int save_hash_arg_in_memory = hash_arg_in_memory;
2815 int addr_volatile;
2816 int regno;
2817 unsigned hash;
2819 /* Do not try to replace constant addresses or addresses of local and
2820 argument slots. These MEM expressions are made only once and inserted
2821 in many instructions, as well as being used to control symbol table
2822 output. It is not safe to clobber them.
2824 There are some uncommon cases where the address is already in a register
2825 for some reason, but we cannot take advantage of that because we have
2826 no easy way to unshare the MEM. In addition, looking up all stack
2827 addresses is costly. */
2828 if ((GET_CODE (addr) == PLUS
2829 && REG_P (XEXP (addr, 0))
2830 && GET_CODE (XEXP (addr, 1)) == CONST_INT
2831 && (regno = REGNO (XEXP (addr, 0)),
2832 regno == FRAME_POINTER_REGNUM || regno == HARD_FRAME_POINTER_REGNUM
2833 || regno == ARG_POINTER_REGNUM))
2834 || (REG_P (addr)
2835 && (regno = REGNO (addr), regno == FRAME_POINTER_REGNUM
2836 || regno == HARD_FRAME_POINTER_REGNUM
2837 || regno == ARG_POINTER_REGNUM))
2838 || CONSTANT_ADDRESS_P (addr))
2839 return;
2841 /* If this address is not simply a register, try to fold it. This will
2842 sometimes simplify the expression. Many simplifications
2843 will not be valid, but some, usually applying the associative rule, will
2844 be valid and produce better code. */
2845 if (!REG_P (addr))
2847 rtx folded = fold_rtx (copy_rtx (addr), NULL_RTX);
2848 int addr_folded_cost = address_cost (folded, mode);
2849 int addr_cost = address_cost (addr, mode);
2851 if ((addr_folded_cost < addr_cost
2852 || (addr_folded_cost == addr_cost
2853 /* ??? The rtx_cost comparison is left over from an older
2854 version of this code. It is probably no longer helpful. */
2855 && (rtx_cost (folded, MEM) > rtx_cost (addr, MEM)
2856 || approx_reg_cost (folded) < approx_reg_cost (addr))))
2857 && validate_change (insn, loc, folded, 0))
2858 addr = folded;
2861 /* If this address is not in the hash table, we can't look for equivalences
2862 of the whole address. Also, ignore if volatile. */
2864 do_not_record = 0;
2865 hash = HASH (addr, Pmode);
2866 addr_volatile = do_not_record;
2867 do_not_record = save_do_not_record;
2868 hash_arg_in_memory = save_hash_arg_in_memory;
2870 if (addr_volatile)
2871 return;
2873 elt = lookup (addr, hash, Pmode);
2875 if (elt)
2877 /* We need to find the best (under the criteria documented above) entry
2878 in the class that is valid. We use the `flag' field to indicate
2879 choices that were invalid and iterate until we can't find a better
2880 one that hasn't already been tried. */
2882 for (p = elt->first_same_value; p; p = p->next_same_value)
2883 p->flag = 0;
2885 while (found_better)
2887 int best_addr_cost = address_cost (*loc, mode);
2888 int best_rtx_cost = (elt->cost + 1) >> 1;
2889 int exp_cost;
2890 struct table_elt *best_elt = elt;
2892 found_better = 0;
2893 for (p = elt->first_same_value; p; p = p->next_same_value)
2894 if (! p->flag)
2896 if ((REG_P (p->exp)
2897 || exp_equiv_p (p->exp, p->exp, 1, false))
2898 && ((exp_cost = address_cost (p->exp, mode)) < best_addr_cost
2899 || (exp_cost == best_addr_cost
2900 && ((p->cost + 1) >> 1) > best_rtx_cost)))
2902 found_better = 1;
2903 best_addr_cost = exp_cost;
2904 best_rtx_cost = (p->cost + 1) >> 1;
2905 best_elt = p;
2909 if (found_better)
2911 if (validate_change (insn, loc,
2912 canon_reg (copy_rtx (best_elt->exp),
2913 NULL_RTX), 0))
2914 return;
2915 else
2916 best_elt->flag = 1;
2921 /* If the address is a binary operation with the first operand a register
2922 and the second a constant, do the same as above, but looking for
2923 equivalences of the register. Then try to simplify before checking for
2924 the best address to use. This catches a few cases: First is when we
2925 have REG+const and the register is another REG+const. We can often merge
2926 the constants and eliminate one insn and one register. It may also be
2927 that a machine has a cheap REG+REG+const. Finally, this improves the
2928 code on the Alpha for unaligned byte stores. */
2930 if (flag_expensive_optimizations
2931 && ARITHMETIC_P (*loc)
2932 && REG_P (XEXP (*loc, 0)))
2934 rtx op1 = XEXP (*loc, 1);
2936 do_not_record = 0;
2937 hash = HASH (XEXP (*loc, 0), Pmode);
2938 do_not_record = save_do_not_record;
2939 hash_arg_in_memory = save_hash_arg_in_memory;
2941 elt = lookup (XEXP (*loc, 0), hash, Pmode);
2942 if (elt == 0)
2943 return;
2945 /* We need to find the best (under the criteria documented above) entry
2946 in the class that is valid. We use the `flag' field to indicate
2947 choices that were invalid and iterate until we can't find a better
2948 one that hasn't already been tried. */
2950 for (p = elt->first_same_value; p; p = p->next_same_value)
2951 p->flag = 0;
2953 while (found_better)
2955 int best_addr_cost = address_cost (*loc, mode);
2956 int best_rtx_cost = (COST (*loc) + 1) >> 1;
2957 struct table_elt *best_elt = elt;
2958 rtx best_rtx = *loc;
2959 int count;
2961 /* This is at worst case an O(n^2) algorithm, so limit our search
2962 to the first 32 elements on the list. This avoids trouble
2963 compiling code with very long basic blocks that can easily
2964 call simplify_gen_binary so many times that we run out of
2965 memory. */
2967 found_better = 0;
2968 for (p = elt->first_same_value, count = 0;
2969 p && count < 32;
2970 p = p->next_same_value, count++)
2971 if (! p->flag
2972 && (REG_P (p->exp)
2973 || exp_equiv_p (p->exp, p->exp, 1, false)))
2975 rtx new = simplify_gen_binary (GET_CODE (*loc), Pmode,
2976 p->exp, op1);
2977 int new_cost;
2979 /* Get the canonical version of the address so we can accept
2980 more. */
2981 new = canon_for_address (new);
2983 new_cost = address_cost (new, mode);
2985 if (new_cost < best_addr_cost
2986 || (new_cost == best_addr_cost
2987 && (COST (new) + 1) >> 1 > best_rtx_cost))
2989 found_better = 1;
2990 best_addr_cost = new_cost;
2991 best_rtx_cost = (COST (new) + 1) >> 1;
2992 best_elt = p;
2993 best_rtx = new;
2997 if (found_better)
2999 if (validate_change (insn, loc,
3000 canon_reg (copy_rtx (best_rtx),
3001 NULL_RTX), 0))
3002 return;
3003 else
3004 best_elt->flag = 1;
3010 /* Given an operation (CODE, *PARG1, *PARG2), where code is a comparison
3011 operation (EQ, NE, GT, etc.), follow it back through the hash table and
3012 what values are being compared.
3014 *PARG1 and *PARG2 are updated to contain the rtx representing the values
3015 actually being compared. For example, if *PARG1 was (cc0) and *PARG2
3016 was (const_int 0), *PARG1 and *PARG2 will be set to the objects that were
3017 compared to produce cc0.
3019 The return value is the comparison operator and is either the code of
3020 A or the code corresponding to the inverse of the comparison. */
3022 static enum rtx_code
3023 find_comparison_args (enum rtx_code code, rtx *parg1, rtx *parg2,
3024 enum machine_mode *pmode1, enum machine_mode *pmode2)
3026 rtx arg1, arg2;
3028 arg1 = *parg1, arg2 = *parg2;
3030 /* If ARG2 is const0_rtx, see what ARG1 is equivalent to. */
3032 while (arg2 == CONST0_RTX (GET_MODE (arg1)))
3034 /* Set nonzero when we find something of interest. */
3035 rtx x = 0;
3036 int reverse_code = 0;
3037 struct table_elt *p = 0;
3039 /* If arg1 is a COMPARE, extract the comparison arguments from it.
3040 On machines with CC0, this is the only case that can occur, since
3041 fold_rtx will return the COMPARE or item being compared with zero
3042 when given CC0. */
3044 if (GET_CODE (arg1) == COMPARE && arg2 == const0_rtx)
3045 x = arg1;
3047 /* If ARG1 is a comparison operator and CODE is testing for
3048 STORE_FLAG_VALUE, get the inner arguments. */
3050 else if (COMPARISON_P (arg1))
3052 #ifdef FLOAT_STORE_FLAG_VALUE
3053 REAL_VALUE_TYPE fsfv;
3054 #endif
3056 if (code == NE
3057 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
3058 && code == LT && STORE_FLAG_VALUE == -1)
3059 #ifdef FLOAT_STORE_FLAG_VALUE
3060 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
3061 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3062 REAL_VALUE_NEGATIVE (fsfv)))
3063 #endif
3065 x = arg1;
3066 else if (code == EQ
3067 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
3068 && code == GE && STORE_FLAG_VALUE == -1)
3069 #ifdef FLOAT_STORE_FLAG_VALUE
3070 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
3071 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3072 REAL_VALUE_NEGATIVE (fsfv)))
3073 #endif
3075 x = arg1, reverse_code = 1;
3078 /* ??? We could also check for
3080 (ne (and (eq (...) (const_int 1))) (const_int 0))
3082 and related forms, but let's wait until we see them occurring. */
3084 if (x == 0)
3085 /* Look up ARG1 in the hash table and see if it has an equivalence
3086 that lets us see what is being compared. */
3087 p = lookup (arg1, SAFE_HASH (arg1, GET_MODE (arg1)), GET_MODE (arg1));
3088 if (p)
3090 p = p->first_same_value;
3092 /* If what we compare is already known to be constant, that is as
3093 good as it gets.
3094 We need to break the loop in this case, because otherwise we
3095 can have an infinite loop when looking at a reg that is known
3096 to be a constant which is the same as a comparison of a reg
3097 against zero which appears later in the insn stream, which in
3098 turn is constant and the same as the comparison of the first reg
3099 against zero... */
3100 if (p->is_const)
3101 break;
3104 for (; p; p = p->next_same_value)
3106 enum machine_mode inner_mode = GET_MODE (p->exp);
3107 #ifdef FLOAT_STORE_FLAG_VALUE
3108 REAL_VALUE_TYPE fsfv;
3109 #endif
3111 /* If the entry isn't valid, skip it. */
3112 if (! exp_equiv_p (p->exp, p->exp, 1, false))
3113 continue;
3115 if (GET_CODE (p->exp) == COMPARE
3116 /* Another possibility is that this machine has a compare insn
3117 that includes the comparison code. In that case, ARG1 would
3118 be equivalent to a comparison operation that would set ARG1 to
3119 either STORE_FLAG_VALUE or zero. If this is an NE operation,
3120 ORIG_CODE is the actual comparison being done; if it is an EQ,
3121 we must reverse ORIG_CODE. On machine with a negative value
3122 for STORE_FLAG_VALUE, also look at LT and GE operations. */
3123 || ((code == NE
3124 || (code == LT
3125 && GET_MODE_CLASS (inner_mode) == MODE_INT
3126 && (GET_MODE_BITSIZE (inner_mode)
3127 <= HOST_BITS_PER_WIDE_INT)
3128 && (STORE_FLAG_VALUE
3129 & ((HOST_WIDE_INT) 1
3130 << (GET_MODE_BITSIZE (inner_mode) - 1))))
3131 #ifdef FLOAT_STORE_FLAG_VALUE
3132 || (code == LT
3133 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
3134 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3135 REAL_VALUE_NEGATIVE (fsfv)))
3136 #endif
3138 && COMPARISON_P (p->exp)))
3140 x = p->exp;
3141 break;
3143 else if ((code == EQ
3144 || (code == GE
3145 && GET_MODE_CLASS (inner_mode) == MODE_INT
3146 && (GET_MODE_BITSIZE (inner_mode)
3147 <= HOST_BITS_PER_WIDE_INT)
3148 && (STORE_FLAG_VALUE
3149 & ((HOST_WIDE_INT) 1
3150 << (GET_MODE_BITSIZE (inner_mode) - 1))))
3151 #ifdef FLOAT_STORE_FLAG_VALUE
3152 || (code == GE
3153 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
3154 && (fsfv = FLOAT_STORE_FLAG_VALUE (GET_MODE (arg1)),
3155 REAL_VALUE_NEGATIVE (fsfv)))
3156 #endif
3158 && COMPARISON_P (p->exp))
3160 reverse_code = 1;
3161 x = p->exp;
3162 break;
3165 /* If this non-trapping address, e.g. fp + constant, the
3166 equivalent is a better operand since it may let us predict
3167 the value of the comparison. */
3168 else if (!rtx_addr_can_trap_p (p->exp))
3170 arg1 = p->exp;
3171 continue;
3175 /* If we didn't find a useful equivalence for ARG1, we are done.
3176 Otherwise, set up for the next iteration. */
3177 if (x == 0)
3178 break;
3180 /* If we need to reverse the comparison, make sure that that is
3181 possible -- we can't necessarily infer the value of GE from LT
3182 with floating-point operands. */
3183 if (reverse_code)
3185 enum rtx_code reversed = reversed_comparison_code (x, NULL_RTX);
3186 if (reversed == UNKNOWN)
3187 break;
3188 else
3189 code = reversed;
3191 else if (COMPARISON_P (x))
3192 code = GET_CODE (x);
3193 arg1 = XEXP (x, 0), arg2 = XEXP (x, 1);
3196 /* Return our results. Return the modes from before fold_rtx
3197 because fold_rtx might produce const_int, and then it's too late. */
3198 *pmode1 = GET_MODE (arg1), *pmode2 = GET_MODE (arg2);
3199 *parg1 = fold_rtx (arg1, 0), *parg2 = fold_rtx (arg2, 0);
3201 return code;
3204 /* If X is a nontrivial arithmetic operation on an argument
3205 for which a constant value can be determined, return
3206 the result of operating on that value, as a constant.
3207 Otherwise, return X, possibly with one or more operands
3208 modified by recursive calls to this function.
3210 If X is a register whose contents are known, we do NOT
3211 return those contents here. equiv_constant is called to
3212 perform that task.
3214 INSN is the insn that we may be modifying. If it is 0, make a copy
3215 of X before modifying it. */
3217 static rtx
3218 fold_rtx (rtx x, rtx insn)
3220 enum rtx_code code;
3221 enum machine_mode mode;
3222 const char *fmt;
3223 int i;
3224 rtx new = 0;
3225 int copied = 0;
3226 int must_swap = 0;
3228 /* Folded equivalents of first two operands of X. */
3229 rtx folded_arg0;
3230 rtx folded_arg1;
3232 /* Constant equivalents of first three operands of X;
3233 0 when no such equivalent is known. */
3234 rtx const_arg0;
3235 rtx const_arg1;
3236 rtx const_arg2;
3238 /* The mode of the first operand of X. We need this for sign and zero
3239 extends. */
3240 enum machine_mode mode_arg0;
3242 if (x == 0)
3243 return x;
3245 mode = GET_MODE (x);
3246 code = GET_CODE (x);
3247 switch (code)
3249 case CONST:
3250 case CONST_INT:
3251 case CONST_DOUBLE:
3252 case CONST_VECTOR:
3253 case SYMBOL_REF:
3254 case LABEL_REF:
3255 case REG:
3256 /* No use simplifying an EXPR_LIST
3257 since they are used only for lists of args
3258 in a function call's REG_EQUAL note. */
3259 case EXPR_LIST:
3260 return x;
3262 #ifdef HAVE_cc0
3263 case CC0:
3264 return prev_insn_cc0;
3265 #endif
3267 case PC:
3268 /* If the next insn is a CODE_LABEL followed by a jump table,
3269 PC's value is a LABEL_REF pointing to that label. That
3270 lets us fold switch statements on the VAX. */
3272 rtx next;
3273 if (insn && tablejump_p (insn, &next, NULL))
3274 return gen_rtx_LABEL_REF (Pmode, next);
3276 break;
3278 case SUBREG:
3279 /* See if we previously assigned a constant value to this SUBREG. */
3280 if ((new = lookup_as_function (x, CONST_INT)) != 0
3281 || (new = lookup_as_function (x, CONST_DOUBLE)) != 0)
3282 return new;
3284 /* If this is a paradoxical SUBREG, we have no idea what value the
3285 extra bits would have. However, if the operand is equivalent
3286 to a SUBREG whose operand is the same as our mode, and all the
3287 modes are within a word, we can just use the inner operand
3288 because these SUBREGs just say how to treat the register.
3290 Similarly if we find an integer constant. */
3292 if (GET_MODE_SIZE (mode) > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
3294 enum machine_mode imode = GET_MODE (SUBREG_REG (x));
3295 struct table_elt *elt;
3297 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD
3298 && GET_MODE_SIZE (imode) <= UNITS_PER_WORD
3299 && (elt = lookup (SUBREG_REG (x), HASH (SUBREG_REG (x), imode),
3300 imode)) != 0)
3301 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
3303 if (CONSTANT_P (elt->exp)
3304 && GET_MODE (elt->exp) == VOIDmode)
3305 return elt->exp;
3307 if (GET_CODE (elt->exp) == SUBREG
3308 && GET_MODE (SUBREG_REG (elt->exp)) == mode
3309 && exp_equiv_p (elt->exp, elt->exp, 1, false))
3310 return copy_rtx (SUBREG_REG (elt->exp));
3313 return x;
3316 /* Fold SUBREG_REG. If it changed, see if we can simplify the SUBREG.
3317 We might be able to if the SUBREG is extracting a single word in an
3318 integral mode or extracting the low part. */
3320 folded_arg0 = fold_rtx (SUBREG_REG (x), insn);
3321 const_arg0 = equiv_constant (folded_arg0);
3322 if (const_arg0)
3323 folded_arg0 = const_arg0;
3325 if (folded_arg0 != SUBREG_REG (x))
3327 new = simplify_subreg (mode, folded_arg0,
3328 GET_MODE (SUBREG_REG (x)), SUBREG_BYTE (x));
3329 if (new)
3330 return new;
3333 if (REG_P (folded_arg0)
3334 && GET_MODE_SIZE (mode) < GET_MODE_SIZE (GET_MODE (folded_arg0)))
3336 struct table_elt *elt;
3338 elt = lookup (folded_arg0,
3339 HASH (folded_arg0, GET_MODE (folded_arg0)),
3340 GET_MODE (folded_arg0));
3342 if (elt)
3343 elt = elt->first_same_value;
3345 if (subreg_lowpart_p (x))
3346 /* If this is a narrowing SUBREG and our operand is a REG, see
3347 if we can find an equivalence for REG that is an arithmetic
3348 operation in a wider mode where both operands are paradoxical
3349 SUBREGs from objects of our result mode. In that case, we
3350 couldn-t report an equivalent value for that operation, since we
3351 don't know what the extra bits will be. But we can find an
3352 equivalence for this SUBREG by folding that operation in the
3353 narrow mode. This allows us to fold arithmetic in narrow modes
3354 when the machine only supports word-sized arithmetic.
3356 Also look for a case where we have a SUBREG whose operand
3357 is the same as our result. If both modes are smaller
3358 than a word, we are simply interpreting a register in
3359 different modes and we can use the inner value. */
3361 for (; elt; elt = elt->next_same_value)
3363 enum rtx_code eltcode = GET_CODE (elt->exp);
3365 /* Just check for unary and binary operations. */
3366 if (UNARY_P (elt->exp)
3367 && eltcode != SIGN_EXTEND
3368 && eltcode != ZERO_EXTEND
3369 && GET_CODE (XEXP (elt->exp, 0)) == SUBREG
3370 && GET_MODE (SUBREG_REG (XEXP (elt->exp, 0))) == mode
3371 && (GET_MODE_CLASS (mode)
3372 == GET_MODE_CLASS (GET_MODE (XEXP (elt->exp, 0)))))
3374 rtx op0 = SUBREG_REG (XEXP (elt->exp, 0));
3376 if (!REG_P (op0) && ! CONSTANT_P (op0))
3377 op0 = fold_rtx (op0, NULL_RTX);
3379 op0 = equiv_constant (op0);
3380 if (op0)
3381 new = simplify_unary_operation (GET_CODE (elt->exp), mode,
3382 op0, mode);
3384 else if (ARITHMETIC_P (elt->exp)
3385 && eltcode != DIV && eltcode != MOD
3386 && eltcode != UDIV && eltcode != UMOD
3387 && eltcode != ASHIFTRT && eltcode != LSHIFTRT
3388 && eltcode != ROTATE && eltcode != ROTATERT
3389 && ((GET_CODE (XEXP (elt->exp, 0)) == SUBREG
3390 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 0)))
3391 == mode))
3392 || CONSTANT_P (XEXP (elt->exp, 0)))
3393 && ((GET_CODE (XEXP (elt->exp, 1)) == SUBREG
3394 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 1)))
3395 == mode))
3396 || CONSTANT_P (XEXP (elt->exp, 1))))
3398 rtx op0 = gen_lowpart_common (mode, XEXP (elt->exp, 0));
3399 rtx op1 = gen_lowpart_common (mode, XEXP (elt->exp, 1));
3401 if (op0 && !REG_P (op0) && ! CONSTANT_P (op0))
3402 op0 = fold_rtx (op0, NULL_RTX);
3404 if (op0)
3405 op0 = equiv_constant (op0);
3407 if (op1 && !REG_P (op1) && ! CONSTANT_P (op1))
3408 op1 = fold_rtx (op1, NULL_RTX);
3410 if (op1)
3411 op1 = equiv_constant (op1);
3413 /* If we are looking for the low SImode part of
3414 (ashift:DI c (const_int 32)), it doesn't work
3415 to compute that in SImode, because a 32-bit shift
3416 in SImode is unpredictable. We know the value is 0. */
3417 if (op0 && op1
3418 && GET_CODE (elt->exp) == ASHIFT
3419 && GET_CODE (op1) == CONST_INT
3420 && INTVAL (op1) >= GET_MODE_BITSIZE (mode))
3422 if (INTVAL (op1)
3423 < GET_MODE_BITSIZE (GET_MODE (elt->exp)))
3424 /* If the count fits in the inner mode's width,
3425 but exceeds the outer mode's width,
3426 the value will get truncated to 0
3427 by the subreg. */
3428 new = CONST0_RTX (mode);
3429 else
3430 /* If the count exceeds even the inner mode's width,
3431 don't fold this expression. */
3432 new = 0;
3434 else if (op0 && op1)
3435 new = simplify_binary_operation (GET_CODE (elt->exp), mode, op0, op1);
3438 else if (GET_CODE (elt->exp) == SUBREG
3439 && GET_MODE (SUBREG_REG (elt->exp)) == mode
3440 && (GET_MODE_SIZE (GET_MODE (folded_arg0))
3441 <= UNITS_PER_WORD)
3442 && exp_equiv_p (elt->exp, elt->exp, 1, false))
3443 new = copy_rtx (SUBREG_REG (elt->exp));
3445 if (new)
3446 return new;
3448 else
3449 /* A SUBREG resulting from a zero extension may fold to zero if
3450 it extracts higher bits than the ZERO_EXTEND's source bits.
3451 FIXME: if combine tried to, er, combine these instructions,
3452 this transformation may be moved to simplify_subreg. */
3453 for (; elt; elt = elt->next_same_value)
3455 if (GET_CODE (elt->exp) == ZERO_EXTEND
3456 && subreg_lsb (x)
3457 >= GET_MODE_BITSIZE (GET_MODE (XEXP (elt->exp, 0))))
3458 return CONST0_RTX (mode);
3462 return x;
3464 case NOT:
3465 case NEG:
3466 /* If we have (NOT Y), see if Y is known to be (NOT Z).
3467 If so, (NOT Y) simplifies to Z. Similarly for NEG. */
3468 new = lookup_as_function (XEXP (x, 0), code);
3469 if (new)
3470 return fold_rtx (copy_rtx (XEXP (new, 0)), insn);
3471 break;
3473 case MEM:
3474 /* If we are not actually processing an insn, don't try to find the
3475 best address. Not only don't we care, but we could modify the
3476 MEM in an invalid way since we have no insn to validate against. */
3477 if (insn != 0)
3478 find_best_addr (insn, &XEXP (x, 0), GET_MODE (x));
3481 /* Even if we don't fold in the insn itself,
3482 we can safely do so here, in hopes of getting a constant. */
3483 rtx addr = fold_rtx (XEXP (x, 0), NULL_RTX);
3484 rtx base = 0;
3485 HOST_WIDE_INT offset = 0;
3487 if (REG_P (addr)
3488 && REGNO_QTY_VALID_P (REGNO (addr)))
3490 int addr_q = REG_QTY (REGNO (addr));
3491 struct qty_table_elem *addr_ent = &qty_table[addr_q];
3493 if (GET_MODE (addr) == addr_ent->mode
3494 && addr_ent->const_rtx != NULL_RTX)
3495 addr = addr_ent->const_rtx;
3498 /* If address is constant, split it into a base and integer offset. */
3499 if (GET_CODE (addr) == SYMBOL_REF || GET_CODE (addr) == LABEL_REF)
3500 base = addr;
3501 else if (GET_CODE (addr) == CONST && GET_CODE (XEXP (addr, 0)) == PLUS
3502 && GET_CODE (XEXP (XEXP (addr, 0), 1)) == CONST_INT)
3504 base = XEXP (XEXP (addr, 0), 0);
3505 offset = INTVAL (XEXP (XEXP (addr, 0), 1));
3507 else if (GET_CODE (addr) == LO_SUM
3508 && GET_CODE (XEXP (addr, 1)) == SYMBOL_REF)
3509 base = XEXP (addr, 1);
3511 /* If this is a constant pool reference, we can fold it into its
3512 constant to allow better value tracking. */
3513 if (base && GET_CODE (base) == SYMBOL_REF
3514 && CONSTANT_POOL_ADDRESS_P (base))
3516 rtx constant = get_pool_constant (base);
3517 enum machine_mode const_mode = get_pool_mode (base);
3518 rtx new;
3520 if (CONSTANT_P (constant) && GET_CODE (constant) != CONST_INT)
3522 constant_pool_entries_cost = COST (constant);
3523 constant_pool_entries_regcost = approx_reg_cost (constant);
3526 /* If we are loading the full constant, we have an equivalence. */
3527 if (offset == 0 && mode == const_mode)
3528 return constant;
3530 /* If this actually isn't a constant (weird!), we can't do
3531 anything. Otherwise, handle the two most common cases:
3532 extracting a word from a multi-word constant, and extracting
3533 the low-order bits. Other cases don't seem common enough to
3534 worry about. */
3535 if (! CONSTANT_P (constant))
3536 return x;
3538 if (GET_MODE_CLASS (mode) == MODE_INT
3539 && GET_MODE_SIZE (mode) == UNITS_PER_WORD
3540 && offset % UNITS_PER_WORD == 0
3541 && (new = operand_subword (constant,
3542 offset / UNITS_PER_WORD,
3543 0, const_mode)) != 0)
3544 return new;
3546 if (((BYTES_BIG_ENDIAN
3547 && offset == GET_MODE_SIZE (GET_MODE (constant)) - 1)
3548 || (! BYTES_BIG_ENDIAN && offset == 0))
3549 && (new = gen_lowpart (mode, constant)) != 0)
3550 return new;
3553 /* If this is a reference to a label at a known position in a jump
3554 table, we also know its value. */
3555 if (base && GET_CODE (base) == LABEL_REF)
3557 rtx label = XEXP (base, 0);
3558 rtx table_insn = NEXT_INSN (label);
3560 if (table_insn && JUMP_P (table_insn)
3561 && GET_CODE (PATTERN (table_insn)) == ADDR_VEC)
3563 rtx table = PATTERN (table_insn);
3565 if (offset >= 0
3566 && (offset / GET_MODE_SIZE (GET_MODE (table))
3567 < XVECLEN (table, 0)))
3568 return XVECEXP (table, 0,
3569 offset / GET_MODE_SIZE (GET_MODE (table)));
3571 if (table_insn && JUMP_P (table_insn)
3572 && GET_CODE (PATTERN (table_insn)) == ADDR_DIFF_VEC)
3574 rtx table = PATTERN (table_insn);
3576 if (offset >= 0
3577 && (offset / GET_MODE_SIZE (GET_MODE (table))
3578 < XVECLEN (table, 1)))
3580 offset /= GET_MODE_SIZE (GET_MODE (table));
3581 new = gen_rtx_MINUS (Pmode, XVECEXP (table, 1, offset),
3582 XEXP (table, 0));
3584 if (GET_MODE (table) != Pmode)
3585 new = gen_rtx_TRUNCATE (GET_MODE (table), new);
3587 /* Indicate this is a constant. This isn't a
3588 valid form of CONST, but it will only be used
3589 to fold the next insns and then discarded, so
3590 it should be safe.
3592 Note this expression must be explicitly discarded,
3593 by cse_insn, else it may end up in a REG_EQUAL note
3594 and "escape" to cause problems elsewhere. */
3595 return gen_rtx_CONST (GET_MODE (new), new);
3600 return x;
3603 #ifdef NO_FUNCTION_CSE
3604 case CALL:
3605 if (CONSTANT_P (XEXP (XEXP (x, 0), 0)))
3606 return x;
3607 break;
3608 #endif
3610 case ASM_OPERANDS:
3611 for (i = ASM_OPERANDS_INPUT_LENGTH (x) - 1; i >= 0; i--)
3612 validate_change (insn, &ASM_OPERANDS_INPUT (x, i),
3613 fold_rtx (ASM_OPERANDS_INPUT (x, i), insn), 0);
3614 break;
3616 default:
3617 break;
3620 const_arg0 = 0;
3621 const_arg1 = 0;
3622 const_arg2 = 0;
3623 mode_arg0 = VOIDmode;
3625 /* Try folding our operands.
3626 Then see which ones have constant values known. */
3628 fmt = GET_RTX_FORMAT (code);
3629 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3630 if (fmt[i] == 'e')
3632 rtx arg = XEXP (x, i);
3633 rtx folded_arg = arg, const_arg = 0;
3634 enum machine_mode mode_arg = GET_MODE (arg);
3635 rtx cheap_arg, expensive_arg;
3636 rtx replacements[2];
3637 int j;
3638 int old_cost = COST_IN (XEXP (x, i), code);
3640 /* Most arguments are cheap, so handle them specially. */
3641 switch (GET_CODE (arg))
3643 case REG:
3644 /* This is the same as calling equiv_constant; it is duplicated
3645 here for speed. */
3646 if (REGNO_QTY_VALID_P (REGNO (arg)))
3648 int arg_q = REG_QTY (REGNO (arg));
3649 struct qty_table_elem *arg_ent = &qty_table[arg_q];
3651 if (arg_ent->const_rtx != NULL_RTX
3652 && !REG_P (arg_ent->const_rtx)
3653 && GET_CODE (arg_ent->const_rtx) != PLUS)
3654 const_arg
3655 = gen_lowpart (GET_MODE (arg),
3656 arg_ent->const_rtx);
3658 break;
3660 case CONST:
3661 case CONST_INT:
3662 case SYMBOL_REF:
3663 case LABEL_REF:
3664 case CONST_DOUBLE:
3665 case CONST_VECTOR:
3666 const_arg = arg;
3667 break;
3669 #ifdef HAVE_cc0
3670 case CC0:
3671 folded_arg = prev_insn_cc0;
3672 mode_arg = prev_insn_cc0_mode;
3673 const_arg = equiv_constant (folded_arg);
3674 break;
3675 #endif
3677 default:
3678 folded_arg = fold_rtx (arg, insn);
3679 const_arg = equiv_constant (folded_arg);
3682 /* For the first three operands, see if the operand
3683 is constant or equivalent to a constant. */
3684 switch (i)
3686 case 0:
3687 folded_arg0 = folded_arg;
3688 const_arg0 = const_arg;
3689 mode_arg0 = mode_arg;
3690 break;
3691 case 1:
3692 folded_arg1 = folded_arg;
3693 const_arg1 = const_arg;
3694 break;
3695 case 2:
3696 const_arg2 = const_arg;
3697 break;
3700 /* Pick the least expensive of the folded argument and an
3701 equivalent constant argument. */
3702 if (const_arg == 0 || const_arg == folded_arg
3703 || COST_IN (const_arg, code) > COST_IN (folded_arg, code))
3704 cheap_arg = folded_arg, expensive_arg = const_arg;
3705 else
3706 cheap_arg = const_arg, expensive_arg = folded_arg;
3708 /* Try to replace the operand with the cheapest of the two
3709 possibilities. If it doesn't work and this is either of the first
3710 two operands of a commutative operation, try swapping them.
3711 If THAT fails, try the more expensive, provided it is cheaper
3712 than what is already there. */
3714 if (cheap_arg == XEXP (x, i))
3715 continue;
3717 if (insn == 0 && ! copied)
3719 x = copy_rtx (x);
3720 copied = 1;
3723 /* Order the replacements from cheapest to most expensive. */
3724 replacements[0] = cheap_arg;
3725 replacements[1] = expensive_arg;
3727 for (j = 0; j < 2 && replacements[j]; j++)
3729 int new_cost = COST_IN (replacements[j], code);
3731 /* Stop if what existed before was cheaper. Prefer constants
3732 in the case of a tie. */
3733 if (new_cost > old_cost
3734 || (new_cost == old_cost && CONSTANT_P (XEXP (x, i))))
3735 break;
3737 /* It's not safe to substitute the operand of a conversion
3738 operator with a constant, as the conversion's identity
3739 depends upon the mode of it's operand. This optimization
3740 is handled by the call to simplify_unary_operation. */
3741 if (GET_RTX_CLASS (code) == RTX_UNARY
3742 && GET_MODE (replacements[j]) != mode_arg0
3743 && (code == ZERO_EXTEND
3744 || code == SIGN_EXTEND
3745 || code == TRUNCATE
3746 || code == FLOAT_TRUNCATE
3747 || code == FLOAT_EXTEND
3748 || code == FLOAT
3749 || code == FIX
3750 || code == UNSIGNED_FLOAT
3751 || code == UNSIGNED_FIX))
3752 continue;
3754 if (validate_change (insn, &XEXP (x, i), replacements[j], 0))
3755 break;
3757 if (GET_RTX_CLASS (code) == RTX_COMM_COMPARE
3758 || GET_RTX_CLASS (code) == RTX_COMM_ARITH)
3760 validate_change (insn, &XEXP (x, i), XEXP (x, 1 - i), 1);
3761 validate_change (insn, &XEXP (x, 1 - i), replacements[j], 1);
3763 if (apply_change_group ())
3765 /* Swap them back to be invalid so that this loop can
3766 continue and flag them to be swapped back later. */
3767 rtx tem;
3769 tem = XEXP (x, 0); XEXP (x, 0) = XEXP (x, 1);
3770 XEXP (x, 1) = tem;
3771 must_swap = 1;
3772 break;
3778 else
3780 if (fmt[i] == 'E')
3781 /* Don't try to fold inside of a vector of expressions.
3782 Doing nothing is harmless. */
3786 /* If a commutative operation, place a constant integer as the second
3787 operand unless the first operand is also a constant integer. Otherwise,
3788 place any constant second unless the first operand is also a constant. */
3790 if (COMMUTATIVE_P (x))
3792 if (must_swap
3793 || swap_commutative_operands_p (const_arg0 ? const_arg0
3794 : XEXP (x, 0),
3795 const_arg1 ? const_arg1
3796 : XEXP (x, 1)))
3798 rtx tem = XEXP (x, 0);
3800 if (insn == 0 && ! copied)
3802 x = copy_rtx (x);
3803 copied = 1;
3806 validate_change (insn, &XEXP (x, 0), XEXP (x, 1), 1);
3807 validate_change (insn, &XEXP (x, 1), tem, 1);
3808 if (apply_change_group ())
3810 tem = const_arg0, const_arg0 = const_arg1, const_arg1 = tem;
3811 tem = folded_arg0, folded_arg0 = folded_arg1, folded_arg1 = tem;
3816 /* If X is an arithmetic operation, see if we can simplify it. */
3818 switch (GET_RTX_CLASS (code))
3820 case RTX_UNARY:
3822 int is_const = 0;
3824 /* We can't simplify extension ops unless we know the
3825 original mode. */
3826 if ((code == ZERO_EXTEND || code == SIGN_EXTEND)
3827 && mode_arg0 == VOIDmode)
3828 break;
3830 /* If we had a CONST, strip it off and put it back later if we
3831 fold. */
3832 if (const_arg0 != 0 && GET_CODE (const_arg0) == CONST)
3833 is_const = 1, const_arg0 = XEXP (const_arg0, 0);
3835 new = simplify_unary_operation (code, mode,
3836 const_arg0 ? const_arg0 : folded_arg0,
3837 mode_arg0);
3838 /* NEG of PLUS could be converted into MINUS, but that causes
3839 expressions of the form
3840 (CONST (MINUS (CONST_INT) (SYMBOL_REF)))
3841 which many ports mistakenly treat as LEGITIMATE_CONSTANT_P.
3842 FIXME: those ports should be fixed. */
3843 if (new != 0 && is_const
3844 && GET_CODE (new) == PLUS
3845 && (GET_CODE (XEXP (new, 0)) == SYMBOL_REF
3846 || GET_CODE (XEXP (new, 0)) == LABEL_REF)
3847 && GET_CODE (XEXP (new, 1)) == CONST_INT)
3848 new = gen_rtx_CONST (mode, new);
3850 break;
3852 case RTX_COMPARE:
3853 case RTX_COMM_COMPARE:
3854 /* See what items are actually being compared and set FOLDED_ARG[01]
3855 to those values and CODE to the actual comparison code. If any are
3856 constant, set CONST_ARG0 and CONST_ARG1 appropriately. We needn't
3857 do anything if both operands are already known to be constant. */
3859 /* ??? Vector mode comparisons are not supported yet. */
3860 if (VECTOR_MODE_P (mode))
3861 break;
3863 if (const_arg0 == 0 || const_arg1 == 0)
3865 struct table_elt *p0, *p1;
3866 rtx true_rtx = const_true_rtx, false_rtx = const0_rtx;
3867 enum machine_mode mode_arg1;
3869 #ifdef FLOAT_STORE_FLAG_VALUE
3870 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
3872 true_rtx = (CONST_DOUBLE_FROM_REAL_VALUE
3873 (FLOAT_STORE_FLAG_VALUE (mode), mode));
3874 false_rtx = CONST0_RTX (mode);
3876 #endif
3878 code = find_comparison_args (code, &folded_arg0, &folded_arg1,
3879 &mode_arg0, &mode_arg1);
3881 /* If the mode is VOIDmode or a MODE_CC mode, we don't know
3882 what kinds of things are being compared, so we can't do
3883 anything with this comparison. */
3885 if (mode_arg0 == VOIDmode || GET_MODE_CLASS (mode_arg0) == MODE_CC)
3886 break;
3888 const_arg0 = equiv_constant (folded_arg0);
3889 const_arg1 = equiv_constant (folded_arg1);
3891 /* If we do not now have two constants being compared, see
3892 if we can nevertheless deduce some things about the
3893 comparison. */
3894 if (const_arg0 == 0 || const_arg1 == 0)
3896 /* Some addresses are known to be nonzero. We don't know
3897 their sign, but equality comparisons are known. */
3898 if (const_arg1 == const0_rtx
3899 && nonzero_address_p (folded_arg0))
3901 if (code == EQ)
3902 return false_rtx;
3903 else if (code == NE)
3904 return true_rtx;
3907 /* See if the two operands are the same. */
3909 if (folded_arg0 == folded_arg1
3910 || (REG_P (folded_arg0)
3911 && REG_P (folded_arg1)
3912 && (REG_QTY (REGNO (folded_arg0))
3913 == REG_QTY (REGNO (folded_arg1))))
3914 || ((p0 = lookup (folded_arg0,
3915 SAFE_HASH (folded_arg0, mode_arg0),
3916 mode_arg0))
3917 && (p1 = lookup (folded_arg1,
3918 SAFE_HASH (folded_arg1, mode_arg0),
3919 mode_arg0))
3920 && p0->first_same_value == p1->first_same_value))
3922 /* Sadly two equal NaNs are not equivalent. */
3923 if (!HONOR_NANS (mode_arg0))
3924 return ((code == EQ || code == LE || code == GE
3925 || code == LEU || code == GEU || code == UNEQ
3926 || code == UNLE || code == UNGE
3927 || code == ORDERED)
3928 ? true_rtx : false_rtx);
3929 /* Take care for the FP compares we can resolve. */
3930 if (code == UNEQ || code == UNLE || code == UNGE)
3931 return true_rtx;
3932 if (code == LTGT || code == LT || code == GT)
3933 return false_rtx;
3936 /* If FOLDED_ARG0 is a register, see if the comparison we are
3937 doing now is either the same as we did before or the reverse
3938 (we only check the reverse if not floating-point). */
3939 else if (REG_P (folded_arg0))
3941 int qty = REG_QTY (REGNO (folded_arg0));
3943 if (REGNO_QTY_VALID_P (REGNO (folded_arg0)))
3945 struct qty_table_elem *ent = &qty_table[qty];
3947 if ((comparison_dominates_p (ent->comparison_code, code)
3948 || (! FLOAT_MODE_P (mode_arg0)
3949 && comparison_dominates_p (ent->comparison_code,
3950 reverse_condition (code))))
3951 && (rtx_equal_p (ent->comparison_const, folded_arg1)
3952 || (const_arg1
3953 && rtx_equal_p (ent->comparison_const,
3954 const_arg1))
3955 || (REG_P (folded_arg1)
3956 && (REG_QTY (REGNO (folded_arg1)) == ent->comparison_qty))))
3957 return (comparison_dominates_p (ent->comparison_code, code)
3958 ? true_rtx : false_rtx);
3964 /* If we are comparing against zero, see if the first operand is
3965 equivalent to an IOR with a constant. If so, we may be able to
3966 determine the result of this comparison. */
3968 if (const_arg1 == const0_rtx)
3970 rtx y = lookup_as_function (folded_arg0, IOR);
3971 rtx inner_const;
3973 if (y != 0
3974 && (inner_const = equiv_constant (XEXP (y, 1))) != 0
3975 && GET_CODE (inner_const) == CONST_INT
3976 && INTVAL (inner_const) != 0)
3978 int sign_bitnum = GET_MODE_BITSIZE (mode_arg0) - 1;
3979 int has_sign = (HOST_BITS_PER_WIDE_INT >= sign_bitnum
3980 && (INTVAL (inner_const)
3981 & ((HOST_WIDE_INT) 1 << sign_bitnum)));
3982 rtx true_rtx = const_true_rtx, false_rtx = const0_rtx;
3984 #ifdef FLOAT_STORE_FLAG_VALUE
3985 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
3987 true_rtx = (CONST_DOUBLE_FROM_REAL_VALUE
3988 (FLOAT_STORE_FLAG_VALUE (mode), mode));
3989 false_rtx = CONST0_RTX (mode);
3991 #endif
3993 switch (code)
3995 case EQ:
3996 return false_rtx;
3997 case NE:
3998 return true_rtx;
3999 case LT: case LE:
4000 if (has_sign)
4001 return true_rtx;
4002 break;
4003 case GT: case GE:
4004 if (has_sign)
4005 return false_rtx;
4006 break;
4007 default:
4008 break;
4014 rtx op0 = const_arg0 ? const_arg0 : folded_arg0;
4015 rtx op1 = const_arg1 ? const_arg1 : folded_arg1;
4016 new = simplify_relational_operation (code, mode, mode_arg0, op0, op1);
4018 break;
4020 case RTX_BIN_ARITH:
4021 case RTX_COMM_ARITH:
4022 switch (code)
4024 case PLUS:
4025 /* If the second operand is a LABEL_REF, see if the first is a MINUS
4026 with that LABEL_REF as its second operand. If so, the result is
4027 the first operand of that MINUS. This handles switches with an
4028 ADDR_DIFF_VEC table. */
4029 if (const_arg1 && GET_CODE (const_arg1) == LABEL_REF)
4031 rtx y
4032 = GET_CODE (folded_arg0) == MINUS ? folded_arg0
4033 : lookup_as_function (folded_arg0, MINUS);
4035 if (y != 0 && GET_CODE (XEXP (y, 1)) == LABEL_REF
4036 && XEXP (XEXP (y, 1), 0) == XEXP (const_arg1, 0))
4037 return XEXP (y, 0);
4039 /* Now try for a CONST of a MINUS like the above. */
4040 if ((y = (GET_CODE (folded_arg0) == CONST ? folded_arg0
4041 : lookup_as_function (folded_arg0, CONST))) != 0
4042 && GET_CODE (XEXP (y, 0)) == MINUS
4043 && GET_CODE (XEXP (XEXP (y, 0), 1)) == LABEL_REF
4044 && XEXP (XEXP (XEXP (y, 0), 1), 0) == XEXP (const_arg1, 0))
4045 return XEXP (XEXP (y, 0), 0);
4048 /* Likewise if the operands are in the other order. */
4049 if (const_arg0 && GET_CODE (const_arg0) == LABEL_REF)
4051 rtx y
4052 = GET_CODE (folded_arg1) == MINUS ? folded_arg1
4053 : lookup_as_function (folded_arg1, MINUS);
4055 if (y != 0 && GET_CODE (XEXP (y, 1)) == LABEL_REF
4056 && XEXP (XEXP (y, 1), 0) == XEXP (const_arg0, 0))
4057 return XEXP (y, 0);
4059 /* Now try for a CONST of a MINUS like the above. */
4060 if ((y = (GET_CODE (folded_arg1) == CONST ? folded_arg1
4061 : lookup_as_function (folded_arg1, CONST))) != 0
4062 && GET_CODE (XEXP (y, 0)) == MINUS
4063 && GET_CODE (XEXP (XEXP (y, 0), 1)) == LABEL_REF
4064 && XEXP (XEXP (XEXP (y, 0), 1), 0) == XEXP (const_arg0, 0))
4065 return XEXP (XEXP (y, 0), 0);
4068 /* If second operand is a register equivalent to a negative
4069 CONST_INT, see if we can find a register equivalent to the
4070 positive constant. Make a MINUS if so. Don't do this for
4071 a non-negative constant since we might then alternate between
4072 choosing positive and negative constants. Having the positive
4073 constant previously-used is the more common case. Be sure
4074 the resulting constant is non-negative; if const_arg1 were
4075 the smallest negative number this would overflow: depending
4076 on the mode, this would either just be the same value (and
4077 hence not save anything) or be incorrect. */
4078 if (const_arg1 != 0 && GET_CODE (const_arg1) == CONST_INT
4079 && INTVAL (const_arg1) < 0
4080 /* This used to test
4082 -INTVAL (const_arg1) >= 0
4084 But The Sun V5.0 compilers mis-compiled that test. So
4085 instead we test for the problematic value in a more direct
4086 manner and hope the Sun compilers get it correct. */
4087 && INTVAL (const_arg1) !=
4088 ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1))
4089 && REG_P (folded_arg1))
4091 rtx new_const = GEN_INT (-INTVAL (const_arg1));
4092 struct table_elt *p
4093 = lookup (new_const, SAFE_HASH (new_const, mode), mode);
4095 if (p)
4096 for (p = p->first_same_value; p; p = p->next_same_value)
4097 if (REG_P (p->exp))
4098 return simplify_gen_binary (MINUS, mode, folded_arg0,
4099 canon_reg (p->exp, NULL_RTX));
4101 goto from_plus;
4103 case MINUS:
4104 /* If we have (MINUS Y C), see if Y is known to be (PLUS Z C2).
4105 If so, produce (PLUS Z C2-C). */
4106 if (const_arg1 != 0 && GET_CODE (const_arg1) == CONST_INT)
4108 rtx y = lookup_as_function (XEXP (x, 0), PLUS);
4109 if (y && GET_CODE (XEXP (y, 1)) == CONST_INT)
4110 return fold_rtx (plus_constant (copy_rtx (y),
4111 -INTVAL (const_arg1)),
4112 NULL_RTX);
4115 /* Fall through. */
4117 from_plus:
4118 case SMIN: case SMAX: case UMIN: case UMAX:
4119 case IOR: case AND: case XOR:
4120 case MULT:
4121 case ASHIFT: case LSHIFTRT: case ASHIFTRT:
4122 /* If we have (<op> <reg> <const_int>) for an associative OP and REG
4123 is known to be of similar form, we may be able to replace the
4124 operation with a combined operation. This may eliminate the
4125 intermediate operation if every use is simplified in this way.
4126 Note that the similar optimization done by combine.c only works
4127 if the intermediate operation's result has only one reference. */
4129 if (REG_P (folded_arg0)
4130 && const_arg1 && GET_CODE (const_arg1) == CONST_INT)
4132 int is_shift
4133 = (code == ASHIFT || code == ASHIFTRT || code == LSHIFTRT);
4134 rtx y = lookup_as_function (folded_arg0, code);
4135 rtx inner_const;
4136 enum rtx_code associate_code;
4137 rtx new_const;
4139 if (y == 0
4140 || 0 == (inner_const
4141 = equiv_constant (fold_rtx (XEXP (y, 1), 0)))
4142 || GET_CODE (inner_const) != CONST_INT
4143 /* If we have compiled a statement like
4144 "if (x == (x & mask1))", and now are looking at
4145 "x & mask2", we will have a case where the first operand
4146 of Y is the same as our first operand. Unless we detect
4147 this case, an infinite loop will result. */
4148 || XEXP (y, 0) == folded_arg0)
4149 break;
4151 /* Don't associate these operations if they are a PLUS with the
4152 same constant and it is a power of two. These might be doable
4153 with a pre- or post-increment. Similarly for two subtracts of
4154 identical powers of two with post decrement. */
4156 if (code == PLUS && const_arg1 == inner_const
4157 && ((HAVE_PRE_INCREMENT
4158 && exact_log2 (INTVAL (const_arg1)) >= 0)
4159 || (HAVE_POST_INCREMENT
4160 && exact_log2 (INTVAL (const_arg1)) >= 0)
4161 || (HAVE_PRE_DECREMENT
4162 && exact_log2 (- INTVAL (const_arg1)) >= 0)
4163 || (HAVE_POST_DECREMENT
4164 && exact_log2 (- INTVAL (const_arg1)) >= 0)))
4165 break;
4167 /* Compute the code used to compose the constants. For example,
4168 A-C1-C2 is A-(C1 + C2), so if CODE == MINUS, we want PLUS. */
4170 associate_code = (is_shift || code == MINUS ? PLUS : code);
4172 new_const = simplify_binary_operation (associate_code, mode,
4173 const_arg1, inner_const);
4175 if (new_const == 0)
4176 break;
4178 /* If we are associating shift operations, don't let this
4179 produce a shift of the size of the object or larger.
4180 This could occur when we follow a sign-extend by a right
4181 shift on a machine that does a sign-extend as a pair
4182 of shifts. */
4184 if (is_shift && GET_CODE (new_const) == CONST_INT
4185 && INTVAL (new_const) >= GET_MODE_BITSIZE (mode))
4187 /* As an exception, we can turn an ASHIFTRT of this
4188 form into a shift of the number of bits - 1. */
4189 if (code == ASHIFTRT)
4190 new_const = GEN_INT (GET_MODE_BITSIZE (mode) - 1);
4191 else
4192 break;
4195 y = copy_rtx (XEXP (y, 0));
4197 /* If Y contains our first operand (the most common way this
4198 can happen is if Y is a MEM), we would do into an infinite
4199 loop if we tried to fold it. So don't in that case. */
4201 if (! reg_mentioned_p (folded_arg0, y))
4202 y = fold_rtx (y, insn);
4204 return simplify_gen_binary (code, mode, y, new_const);
4206 break;
4208 case DIV: case UDIV:
4209 /* ??? The associative optimization performed immediately above is
4210 also possible for DIV and UDIV using associate_code of MULT.
4211 However, we would need extra code to verify that the
4212 multiplication does not overflow, that is, there is no overflow
4213 in the calculation of new_const. */
4214 break;
4216 default:
4217 break;
4220 new = simplify_binary_operation (code, mode,
4221 const_arg0 ? const_arg0 : folded_arg0,
4222 const_arg1 ? const_arg1 : folded_arg1);
4223 break;
4225 case RTX_OBJ:
4226 /* (lo_sum (high X) X) is simply X. */
4227 if (code == LO_SUM && const_arg0 != 0
4228 && GET_CODE (const_arg0) == HIGH
4229 && rtx_equal_p (XEXP (const_arg0, 0), const_arg1))
4230 return const_arg1;
4231 break;
4233 case RTX_TERNARY:
4234 case RTX_BITFIELD_OPS:
4235 new = simplify_ternary_operation (code, mode, mode_arg0,
4236 const_arg0 ? const_arg0 : folded_arg0,
4237 const_arg1 ? const_arg1 : folded_arg1,
4238 const_arg2 ? const_arg2 : XEXP (x, 2));
4239 break;
4241 default:
4242 break;
4245 return new ? new : x;
4248 /* Return a constant value currently equivalent to X.
4249 Return 0 if we don't know one. */
4251 static rtx
4252 equiv_constant (rtx x)
4254 if (REG_P (x)
4255 && REGNO_QTY_VALID_P (REGNO (x)))
4257 int x_q = REG_QTY (REGNO (x));
4258 struct qty_table_elem *x_ent = &qty_table[x_q];
4260 if (x_ent->const_rtx)
4261 x = gen_lowpart (GET_MODE (x), x_ent->const_rtx);
4264 if (x == 0 || CONSTANT_P (x))
4265 return x;
4267 /* If X is a MEM, try to fold it outside the context of any insn to see if
4268 it might be equivalent to a constant. That handles the case where it
4269 is a constant-pool reference. Then try to look it up in the hash table
4270 in case it is something whose value we have seen before. */
4272 if (MEM_P (x))
4274 struct table_elt *elt;
4276 x = fold_rtx (x, NULL_RTX);
4277 if (CONSTANT_P (x))
4278 return x;
4280 elt = lookup (x, SAFE_HASH (x, GET_MODE (x)), GET_MODE (x));
4281 if (elt == 0)
4282 return 0;
4284 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
4285 if (elt->is_const && CONSTANT_P (elt->exp))
4286 return elt->exp;
4289 return 0;
4292 /* Assuming that X is an rtx (e.g., MEM, REG or SUBREG) for a fixed-point
4293 number, return an rtx (MEM, SUBREG, or CONST_INT) that refers to the
4294 least-significant part of X.
4295 MODE specifies how big a part of X to return.
4297 If the requested operation cannot be done, 0 is returned.
4299 This is similar to gen_lowpart_general in emit-rtl.c. */
4302 gen_lowpart_if_possible (enum machine_mode mode, rtx x)
4304 rtx result = gen_lowpart_common (mode, x);
4306 if (result)
4307 return result;
4308 else if (MEM_P (x))
4310 /* This is the only other case we handle. */
4311 int offset = 0;
4312 rtx new;
4314 if (WORDS_BIG_ENDIAN)
4315 offset = (MAX (GET_MODE_SIZE (GET_MODE (x)), UNITS_PER_WORD)
4316 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD));
4317 if (BYTES_BIG_ENDIAN)
4318 /* Adjust the address so that the address-after-the-data is
4319 unchanged. */
4320 offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (mode))
4321 - MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (x))));
4323 new = adjust_address_nv (x, mode, offset);
4324 if (! memory_address_p (mode, XEXP (new, 0)))
4325 return 0;
4327 return new;
4329 else
4330 return 0;
4333 /* Given INSN, a jump insn, PATH_TAKEN indicates if we are following the "taken"
4334 branch. It will be zero if not.
4336 In certain cases, this can cause us to add an equivalence. For example,
4337 if we are following the taken case of
4338 if (i == 2)
4339 we can add the fact that `i' and '2' are now equivalent.
4341 In any case, we can record that this comparison was passed. If the same
4342 comparison is seen later, we will know its value. */
4344 static void
4345 record_jump_equiv (rtx insn, int taken)
4347 int cond_known_true;
4348 rtx op0, op1;
4349 rtx set;
4350 enum machine_mode mode, mode0, mode1;
4351 int reversed_nonequality = 0;
4352 enum rtx_code code;
4354 /* Ensure this is the right kind of insn. */
4355 if (! any_condjump_p (insn))
4356 return;
4357 set = pc_set (insn);
4359 /* See if this jump condition is known true or false. */
4360 if (taken)
4361 cond_known_true = (XEXP (SET_SRC (set), 2) == pc_rtx);
4362 else
4363 cond_known_true = (XEXP (SET_SRC (set), 1) == pc_rtx);
4365 /* Get the type of comparison being done and the operands being compared.
4366 If we had to reverse a non-equality condition, record that fact so we
4367 know that it isn't valid for floating-point. */
4368 code = GET_CODE (XEXP (SET_SRC (set), 0));
4369 op0 = fold_rtx (XEXP (XEXP (SET_SRC (set), 0), 0), insn);
4370 op1 = fold_rtx (XEXP (XEXP (SET_SRC (set), 0), 1), insn);
4372 code = find_comparison_args (code, &op0, &op1, &mode0, &mode1);
4373 if (! cond_known_true)
4375 code = reversed_comparison_code_parts (code, op0, op1, insn);
4377 /* Don't remember if we can't find the inverse. */
4378 if (code == UNKNOWN)
4379 return;
4382 /* The mode is the mode of the non-constant. */
4383 mode = mode0;
4384 if (mode1 != VOIDmode)
4385 mode = mode1;
4387 record_jump_cond (code, mode, op0, op1, reversed_nonequality);
4390 /* Yet another form of subreg creation. In this case, we want something in
4391 MODE, and we should assume OP has MODE iff it is naturally modeless. */
4393 static rtx
4394 record_jump_cond_subreg (enum machine_mode mode, rtx op)
4396 enum machine_mode op_mode = GET_MODE (op);
4397 if (op_mode == mode || op_mode == VOIDmode)
4398 return op;
4399 return lowpart_subreg (mode, op, op_mode);
4402 /* We know that comparison CODE applied to OP0 and OP1 in MODE is true.
4403 REVERSED_NONEQUALITY is nonzero if CODE had to be swapped.
4404 Make any useful entries we can with that information. Called from
4405 above function and called recursively. */
4407 static void
4408 record_jump_cond (enum rtx_code code, enum machine_mode mode, rtx op0,
4409 rtx op1, int reversed_nonequality)
4411 unsigned op0_hash, op1_hash;
4412 int op0_in_memory, op1_in_memory;
4413 struct table_elt *op0_elt, *op1_elt;
4415 /* If OP0 and OP1 are known equal, and either is a paradoxical SUBREG,
4416 we know that they are also equal in the smaller mode (this is also
4417 true for all smaller modes whether or not there is a SUBREG, but
4418 is not worth testing for with no SUBREG). */
4420 /* Note that GET_MODE (op0) may not equal MODE. */
4421 if (code == EQ && GET_CODE (op0) == SUBREG
4422 && (GET_MODE_SIZE (GET_MODE (op0))
4423 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
4425 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
4426 rtx tem = record_jump_cond_subreg (inner_mode, op1);
4427 if (tem)
4428 record_jump_cond (code, mode, SUBREG_REG (op0), tem,
4429 reversed_nonequality);
4432 if (code == EQ && GET_CODE (op1) == SUBREG
4433 && (GET_MODE_SIZE (GET_MODE (op1))
4434 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
4436 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
4437 rtx tem = record_jump_cond_subreg (inner_mode, op0);
4438 if (tem)
4439 record_jump_cond (code, mode, SUBREG_REG (op1), tem,
4440 reversed_nonequality);
4443 /* Similarly, if this is an NE comparison, and either is a SUBREG
4444 making a smaller mode, we know the whole thing is also NE. */
4446 /* Note that GET_MODE (op0) may not equal MODE;
4447 if we test MODE instead, we can get an infinite recursion
4448 alternating between two modes each wider than MODE. */
4450 if (code == NE && GET_CODE (op0) == SUBREG
4451 && subreg_lowpart_p (op0)
4452 && (GET_MODE_SIZE (GET_MODE (op0))
4453 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
4455 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
4456 rtx tem = record_jump_cond_subreg (inner_mode, op1);
4457 if (tem)
4458 record_jump_cond (code, mode, SUBREG_REG (op0), tem,
4459 reversed_nonequality);
4462 if (code == NE && GET_CODE (op1) == SUBREG
4463 && subreg_lowpart_p (op1)
4464 && (GET_MODE_SIZE (GET_MODE (op1))
4465 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
4467 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
4468 rtx tem = record_jump_cond_subreg (inner_mode, op0);
4469 if (tem)
4470 record_jump_cond (code, mode, SUBREG_REG (op1), tem,
4471 reversed_nonequality);
4474 /* Hash both operands. */
4476 do_not_record = 0;
4477 hash_arg_in_memory = 0;
4478 op0_hash = HASH (op0, mode);
4479 op0_in_memory = hash_arg_in_memory;
4481 if (do_not_record)
4482 return;
4484 do_not_record = 0;
4485 hash_arg_in_memory = 0;
4486 op1_hash = HASH (op1, mode);
4487 op1_in_memory = hash_arg_in_memory;
4489 if (do_not_record)
4490 return;
4492 /* Look up both operands. */
4493 op0_elt = lookup (op0, op0_hash, mode);
4494 op1_elt = lookup (op1, op1_hash, mode);
4496 /* If both operands are already equivalent or if they are not in the
4497 table but are identical, do nothing. */
4498 if ((op0_elt != 0 && op1_elt != 0
4499 && op0_elt->first_same_value == op1_elt->first_same_value)
4500 || op0 == op1 || rtx_equal_p (op0, op1))
4501 return;
4503 /* If we aren't setting two things equal all we can do is save this
4504 comparison. Similarly if this is floating-point. In the latter
4505 case, OP1 might be zero and both -0.0 and 0.0 are equal to it.
4506 If we record the equality, we might inadvertently delete code
4507 whose intent was to change -0 to +0. */
4509 if (code != EQ || FLOAT_MODE_P (GET_MODE (op0)))
4511 struct qty_table_elem *ent;
4512 int qty;
4514 /* If we reversed a floating-point comparison, if OP0 is not a
4515 register, or if OP1 is neither a register or constant, we can't
4516 do anything. */
4518 if (!REG_P (op1))
4519 op1 = equiv_constant (op1);
4521 if ((reversed_nonequality && FLOAT_MODE_P (mode))
4522 || !REG_P (op0) || op1 == 0)
4523 return;
4525 /* Put OP0 in the hash table if it isn't already. This gives it a
4526 new quantity number. */
4527 if (op0_elt == 0)
4529 if (insert_regs (op0, NULL, 0))
4531 rehash_using_reg (op0);
4532 op0_hash = HASH (op0, mode);
4534 /* If OP0 is contained in OP1, this changes its hash code
4535 as well. Faster to rehash than to check, except
4536 for the simple case of a constant. */
4537 if (! CONSTANT_P (op1))
4538 op1_hash = HASH (op1,mode);
4541 op0_elt = insert (op0, NULL, op0_hash, mode);
4542 op0_elt->in_memory = op0_in_memory;
4545 qty = REG_QTY (REGNO (op0));
4546 ent = &qty_table[qty];
4548 ent->comparison_code = code;
4549 if (REG_P (op1))
4551 /* Look it up again--in case op0 and op1 are the same. */
4552 op1_elt = lookup (op1, op1_hash, mode);
4554 /* Put OP1 in the hash table so it gets a new quantity number. */
4555 if (op1_elt == 0)
4557 if (insert_regs (op1, NULL, 0))
4559 rehash_using_reg (op1);
4560 op1_hash = HASH (op1, mode);
4563 op1_elt = insert (op1, NULL, op1_hash, mode);
4564 op1_elt->in_memory = op1_in_memory;
4567 ent->comparison_const = NULL_RTX;
4568 ent->comparison_qty = REG_QTY (REGNO (op1));
4570 else
4572 ent->comparison_const = op1;
4573 ent->comparison_qty = -1;
4576 return;
4579 /* If either side is still missing an equivalence, make it now,
4580 then merge the equivalences. */
4582 if (op0_elt == 0)
4584 if (insert_regs (op0, NULL, 0))
4586 rehash_using_reg (op0);
4587 op0_hash = HASH (op0, mode);
4590 op0_elt = insert (op0, NULL, op0_hash, mode);
4591 op0_elt->in_memory = op0_in_memory;
4594 if (op1_elt == 0)
4596 if (insert_regs (op1, NULL, 0))
4598 rehash_using_reg (op1);
4599 op1_hash = HASH (op1, mode);
4602 op1_elt = insert (op1, NULL, op1_hash, mode);
4603 op1_elt->in_memory = op1_in_memory;
4606 merge_equiv_classes (op0_elt, op1_elt);
4609 /* CSE processing for one instruction.
4610 First simplify sources and addresses of all assignments
4611 in the instruction, using previously-computed equivalents values.
4612 Then install the new sources and destinations in the table
4613 of available values.
4615 If LIBCALL_INSN is nonzero, don't record any equivalence made in
4616 the insn. It means that INSN is inside libcall block. In this
4617 case LIBCALL_INSN is the corresponding insn with REG_LIBCALL. */
4619 /* Data on one SET contained in the instruction. */
4621 struct set
4623 /* The SET rtx itself. */
4624 rtx rtl;
4625 /* The SET_SRC of the rtx (the original value, if it is changing). */
4626 rtx src;
4627 /* The hash-table element for the SET_SRC of the SET. */
4628 struct table_elt *src_elt;
4629 /* Hash value for the SET_SRC. */
4630 unsigned src_hash;
4631 /* Hash value for the SET_DEST. */
4632 unsigned dest_hash;
4633 /* The SET_DEST, with SUBREG, etc., stripped. */
4634 rtx inner_dest;
4635 /* Nonzero if the SET_SRC is in memory. */
4636 char src_in_memory;
4637 /* Nonzero if the SET_SRC contains something
4638 whose value cannot be predicted and understood. */
4639 char src_volatile;
4640 /* Original machine mode, in case it becomes a CONST_INT.
4641 The size of this field should match the size of the mode
4642 field of struct rtx_def (see rtl.h). */
4643 ENUM_BITFIELD(machine_mode) mode : 8;
4644 /* A constant equivalent for SET_SRC, if any. */
4645 rtx src_const;
4646 /* Original SET_SRC value used for libcall notes. */
4647 rtx orig_src;
4648 /* Hash value of constant equivalent for SET_SRC. */
4649 unsigned src_const_hash;
4650 /* Table entry for constant equivalent for SET_SRC, if any. */
4651 struct table_elt *src_const_elt;
4654 static void
4655 cse_insn (rtx insn, rtx libcall_insn)
4657 rtx x = PATTERN (insn);
4658 int i;
4659 rtx tem;
4660 int n_sets = 0;
4662 #ifdef HAVE_cc0
4663 /* Records what this insn does to set CC0. */
4664 rtx this_insn_cc0 = 0;
4665 enum machine_mode this_insn_cc0_mode = VOIDmode;
4666 #endif
4668 rtx src_eqv = 0;
4669 struct table_elt *src_eqv_elt = 0;
4670 int src_eqv_volatile = 0;
4671 int src_eqv_in_memory = 0;
4672 unsigned src_eqv_hash = 0;
4674 struct set *sets = (struct set *) 0;
4676 this_insn = insn;
4678 /* Find all the SETs and CLOBBERs in this instruction.
4679 Record all the SETs in the array `set' and count them.
4680 Also determine whether there is a CLOBBER that invalidates
4681 all memory references, or all references at varying addresses. */
4683 if (CALL_P (insn))
4685 for (tem = CALL_INSN_FUNCTION_USAGE (insn); tem; tem = XEXP (tem, 1))
4687 if (GET_CODE (XEXP (tem, 0)) == CLOBBER)
4688 invalidate (SET_DEST (XEXP (tem, 0)), VOIDmode);
4689 XEXP (tem, 0) = canon_reg (XEXP (tem, 0), insn);
4693 if (GET_CODE (x) == SET)
4695 sets = alloca (sizeof (struct set));
4696 sets[0].rtl = x;
4698 /* Ignore SETs that are unconditional jumps.
4699 They never need cse processing, so this does not hurt.
4700 The reason is not efficiency but rather
4701 so that we can test at the end for instructions
4702 that have been simplified to unconditional jumps
4703 and not be misled by unchanged instructions
4704 that were unconditional jumps to begin with. */
4705 if (SET_DEST (x) == pc_rtx
4706 && GET_CODE (SET_SRC (x)) == LABEL_REF)
4709 /* Don't count call-insns, (set (reg 0) (call ...)), as a set.
4710 The hard function value register is used only once, to copy to
4711 someplace else, so it isn't worth cse'ing (and on 80386 is unsafe)!
4712 Ensure we invalidate the destination register. On the 80386 no
4713 other code would invalidate it since it is a fixed_reg.
4714 We need not check the return of apply_change_group; see canon_reg. */
4716 else if (GET_CODE (SET_SRC (x)) == CALL)
4718 canon_reg (SET_SRC (x), insn);
4719 apply_change_group ();
4720 fold_rtx (SET_SRC (x), insn);
4721 invalidate (SET_DEST (x), VOIDmode);
4723 else
4724 n_sets = 1;
4726 else if (GET_CODE (x) == PARALLEL)
4728 int lim = XVECLEN (x, 0);
4730 sets = alloca (lim * sizeof (struct set));
4732 /* Find all regs explicitly clobbered in this insn,
4733 and ensure they are not replaced with any other regs
4734 elsewhere in this insn.
4735 When a reg that is clobbered is also used for input,
4736 we should presume that that is for a reason,
4737 and we should not substitute some other register
4738 which is not supposed to be clobbered.
4739 Therefore, this loop cannot be merged into the one below
4740 because a CALL may precede a CLOBBER and refer to the
4741 value clobbered. We must not let a canonicalization do
4742 anything in that case. */
4743 for (i = 0; i < lim; i++)
4745 rtx y = XVECEXP (x, 0, i);
4746 if (GET_CODE (y) == CLOBBER)
4748 rtx clobbered = XEXP (y, 0);
4750 if (REG_P (clobbered)
4751 || GET_CODE (clobbered) == SUBREG)
4752 invalidate (clobbered, VOIDmode);
4753 else if (GET_CODE (clobbered) == STRICT_LOW_PART
4754 || GET_CODE (clobbered) == ZERO_EXTRACT)
4755 invalidate (XEXP (clobbered, 0), GET_MODE (clobbered));
4759 for (i = 0; i < lim; i++)
4761 rtx y = XVECEXP (x, 0, i);
4762 if (GET_CODE (y) == SET)
4764 /* As above, we ignore unconditional jumps and call-insns and
4765 ignore the result of apply_change_group. */
4766 if (GET_CODE (SET_SRC (y)) == CALL)
4768 canon_reg (SET_SRC (y), insn);
4769 apply_change_group ();
4770 fold_rtx (SET_SRC (y), insn);
4771 invalidate (SET_DEST (y), VOIDmode);
4773 else if (SET_DEST (y) == pc_rtx
4774 && GET_CODE (SET_SRC (y)) == LABEL_REF)
4776 else
4777 sets[n_sets++].rtl = y;
4779 else if (GET_CODE (y) == CLOBBER)
4781 /* If we clobber memory, canon the address.
4782 This does nothing when a register is clobbered
4783 because we have already invalidated the reg. */
4784 if (MEM_P (XEXP (y, 0)))
4785 canon_reg (XEXP (y, 0), NULL_RTX);
4787 else if (GET_CODE (y) == USE
4788 && ! (REG_P (XEXP (y, 0))
4789 && REGNO (XEXP (y, 0)) < FIRST_PSEUDO_REGISTER))
4790 canon_reg (y, NULL_RTX);
4791 else if (GET_CODE (y) == CALL)
4793 /* The result of apply_change_group can be ignored; see
4794 canon_reg. */
4795 canon_reg (y, insn);
4796 apply_change_group ();
4797 fold_rtx (y, insn);
4801 else if (GET_CODE (x) == CLOBBER)
4803 if (MEM_P (XEXP (x, 0)))
4804 canon_reg (XEXP (x, 0), NULL_RTX);
4807 /* Canonicalize a USE of a pseudo register or memory location. */
4808 else if (GET_CODE (x) == USE
4809 && ! (REG_P (XEXP (x, 0))
4810 && REGNO (XEXP (x, 0)) < FIRST_PSEUDO_REGISTER))
4811 canon_reg (XEXP (x, 0), NULL_RTX);
4812 else if (GET_CODE (x) == CALL)
4814 /* The result of apply_change_group can be ignored; see canon_reg. */
4815 canon_reg (x, insn);
4816 apply_change_group ();
4817 fold_rtx (x, insn);
4820 /* Store the equivalent value in SRC_EQV, if different, or if the DEST
4821 is a STRICT_LOW_PART. The latter condition is necessary because SRC_EQV
4822 is handled specially for this case, and if it isn't set, then there will
4823 be no equivalence for the destination. */
4824 if (n_sets == 1 && REG_NOTES (insn) != 0
4825 && (tem = find_reg_note (insn, REG_EQUAL, NULL_RTX)) != 0
4826 && (! rtx_equal_p (XEXP (tem, 0), SET_SRC (sets[0].rtl))
4827 || GET_CODE (SET_DEST (sets[0].rtl)) == STRICT_LOW_PART))
4829 src_eqv = fold_rtx (canon_reg (XEXP (tem, 0), NULL_RTX), insn);
4830 XEXP (tem, 0) = src_eqv;
4833 /* Canonicalize sources and addresses of destinations.
4834 We do this in a separate pass to avoid problems when a MATCH_DUP is
4835 present in the insn pattern. In that case, we want to ensure that
4836 we don't break the duplicate nature of the pattern. So we will replace
4837 both operands at the same time. Otherwise, we would fail to find an
4838 equivalent substitution in the loop calling validate_change below.
4840 We used to suppress canonicalization of DEST if it appears in SRC,
4841 but we don't do this any more. */
4843 for (i = 0; i < n_sets; i++)
4845 rtx dest = SET_DEST (sets[i].rtl);
4846 rtx src = SET_SRC (sets[i].rtl);
4847 rtx new = canon_reg (src, insn);
4848 int insn_code;
4850 sets[i].orig_src = src;
4851 if ((REG_P (new) && REG_P (src)
4852 && ((REGNO (new) < FIRST_PSEUDO_REGISTER)
4853 != (REGNO (src) < FIRST_PSEUDO_REGISTER)))
4854 || (insn_code = recog_memoized (insn)) < 0
4855 || insn_data[insn_code].n_dups > 0)
4856 validate_change (insn, &SET_SRC (sets[i].rtl), new, 1);
4857 else
4858 SET_SRC (sets[i].rtl) = new;
4860 if (GET_CODE (dest) == ZERO_EXTRACT)
4862 validate_change (insn, &XEXP (dest, 1),
4863 canon_reg (XEXP (dest, 1), insn), 1);
4864 validate_change (insn, &XEXP (dest, 2),
4865 canon_reg (XEXP (dest, 2), insn), 1);
4868 while (GET_CODE (dest) == SUBREG
4869 || GET_CODE (dest) == ZERO_EXTRACT
4870 || GET_CODE (dest) == STRICT_LOW_PART)
4871 dest = XEXP (dest, 0);
4873 if (MEM_P (dest))
4874 canon_reg (dest, insn);
4877 /* Now that we have done all the replacements, we can apply the change
4878 group and see if they all work. Note that this will cause some
4879 canonicalizations that would have worked individually not to be applied
4880 because some other canonicalization didn't work, but this should not
4881 occur often.
4883 The result of apply_change_group can be ignored; see canon_reg. */
4885 apply_change_group ();
4887 /* Set sets[i].src_elt to the class each source belongs to.
4888 Detect assignments from or to volatile things
4889 and set set[i] to zero so they will be ignored
4890 in the rest of this function.
4892 Nothing in this loop changes the hash table or the register chains. */
4894 for (i = 0; i < n_sets; i++)
4896 rtx src, dest;
4897 rtx src_folded;
4898 struct table_elt *elt = 0, *p;
4899 enum machine_mode mode;
4900 rtx src_eqv_here;
4901 rtx src_const = 0;
4902 rtx src_related = 0;
4903 struct table_elt *src_const_elt = 0;
4904 int src_cost = MAX_COST;
4905 int src_eqv_cost = MAX_COST;
4906 int src_folded_cost = MAX_COST;
4907 int src_related_cost = MAX_COST;
4908 int src_elt_cost = MAX_COST;
4909 int src_regcost = MAX_COST;
4910 int src_eqv_regcost = MAX_COST;
4911 int src_folded_regcost = MAX_COST;
4912 int src_related_regcost = MAX_COST;
4913 int src_elt_regcost = MAX_COST;
4914 /* Set nonzero if we need to call force_const_mem on with the
4915 contents of src_folded before using it. */
4916 int src_folded_force_flag = 0;
4918 dest = SET_DEST (sets[i].rtl);
4919 src = SET_SRC (sets[i].rtl);
4921 /* If SRC is a constant that has no machine mode,
4922 hash it with the destination's machine mode.
4923 This way we can keep different modes separate. */
4925 mode = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
4926 sets[i].mode = mode;
4928 if (src_eqv)
4930 enum machine_mode eqvmode = mode;
4931 if (GET_CODE (dest) == STRICT_LOW_PART)
4932 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
4933 do_not_record = 0;
4934 hash_arg_in_memory = 0;
4935 src_eqv_hash = HASH (src_eqv, eqvmode);
4937 /* Find the equivalence class for the equivalent expression. */
4939 if (!do_not_record)
4940 src_eqv_elt = lookup (src_eqv, src_eqv_hash, eqvmode);
4942 src_eqv_volatile = do_not_record;
4943 src_eqv_in_memory = hash_arg_in_memory;
4946 /* If this is a STRICT_LOW_PART assignment, src_eqv corresponds to the
4947 value of the INNER register, not the destination. So it is not
4948 a valid substitution for the source. But save it for later. */
4949 if (GET_CODE (dest) == STRICT_LOW_PART)
4950 src_eqv_here = 0;
4951 else
4952 src_eqv_here = src_eqv;
4954 /* Simplify and foldable subexpressions in SRC. Then get the fully-
4955 simplified result, which may not necessarily be valid. */
4956 src_folded = fold_rtx (src, insn);
4958 #if 0
4959 /* ??? This caused bad code to be generated for the m68k port with -O2.
4960 Suppose src is (CONST_INT -1), and that after truncation src_folded
4961 is (CONST_INT 3). Suppose src_folded is then used for src_const.
4962 At the end we will add src and src_const to the same equivalence
4963 class. We now have 3 and -1 on the same equivalence class. This
4964 causes later instructions to be mis-optimized. */
4965 /* If storing a constant in a bitfield, pre-truncate the constant
4966 so we will be able to record it later. */
4967 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT)
4969 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
4971 if (GET_CODE (src) == CONST_INT
4972 && GET_CODE (width) == CONST_INT
4973 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
4974 && (INTVAL (src) & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
4975 src_folded
4976 = GEN_INT (INTVAL (src) & (((HOST_WIDE_INT) 1
4977 << INTVAL (width)) - 1));
4979 #endif
4981 /* Compute SRC's hash code, and also notice if it
4982 should not be recorded at all. In that case,
4983 prevent any further processing of this assignment. */
4984 do_not_record = 0;
4985 hash_arg_in_memory = 0;
4987 sets[i].src = src;
4988 sets[i].src_hash = HASH (src, mode);
4989 sets[i].src_volatile = do_not_record;
4990 sets[i].src_in_memory = hash_arg_in_memory;
4992 /* If SRC is a MEM, there is a REG_EQUIV note for SRC, and DEST is
4993 a pseudo, do not record SRC. Using SRC as a replacement for
4994 anything else will be incorrect in that situation. Note that
4995 this usually occurs only for stack slots, in which case all the
4996 RTL would be referring to SRC, so we don't lose any optimization
4997 opportunities by not having SRC in the hash table. */
4999 if (MEM_P (src)
5000 && find_reg_note (insn, REG_EQUIV, NULL_RTX) != 0
5001 && REG_P (dest)
5002 && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
5003 sets[i].src_volatile = 1;
5005 #if 0
5006 /* It is no longer clear why we used to do this, but it doesn't
5007 appear to still be needed. So let's try without it since this
5008 code hurts cse'ing widened ops. */
5009 /* If source is a paradoxical subreg (such as QI treated as an SI),
5010 treat it as volatile. It may do the work of an SI in one context
5011 where the extra bits are not being used, but cannot replace an SI
5012 in general. */
5013 if (GET_CODE (src) == SUBREG
5014 && (GET_MODE_SIZE (GET_MODE (src))
5015 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))))
5016 sets[i].src_volatile = 1;
5017 #endif
5019 /* Locate all possible equivalent forms for SRC. Try to replace
5020 SRC in the insn with each cheaper equivalent.
5022 We have the following types of equivalents: SRC itself, a folded
5023 version, a value given in a REG_EQUAL note, or a value related
5024 to a constant.
5026 Each of these equivalents may be part of an additional class
5027 of equivalents (if more than one is in the table, they must be in
5028 the same class; we check for this).
5030 If the source is volatile, we don't do any table lookups.
5032 We note any constant equivalent for possible later use in a
5033 REG_NOTE. */
5035 if (!sets[i].src_volatile)
5036 elt = lookup (src, sets[i].src_hash, mode);
5038 sets[i].src_elt = elt;
5040 if (elt && src_eqv_here && src_eqv_elt)
5042 if (elt->first_same_value != src_eqv_elt->first_same_value)
5044 /* The REG_EQUAL is indicating that two formerly distinct
5045 classes are now equivalent. So merge them. */
5046 merge_equiv_classes (elt, src_eqv_elt);
5047 src_eqv_hash = HASH (src_eqv, elt->mode);
5048 src_eqv_elt = lookup (src_eqv, src_eqv_hash, elt->mode);
5051 src_eqv_here = 0;
5054 else if (src_eqv_elt)
5055 elt = src_eqv_elt;
5057 /* Try to find a constant somewhere and record it in `src_const'.
5058 Record its table element, if any, in `src_const_elt'. Look in
5059 any known equivalences first. (If the constant is not in the
5060 table, also set `sets[i].src_const_hash'). */
5061 if (elt)
5062 for (p = elt->first_same_value; p; p = p->next_same_value)
5063 if (p->is_const)
5065 src_const = p->exp;
5066 src_const_elt = elt;
5067 break;
5070 if (src_const == 0
5071 && (CONSTANT_P (src_folded)
5072 /* Consider (minus (label_ref L1) (label_ref L2)) as
5073 "constant" here so we will record it. This allows us
5074 to fold switch statements when an ADDR_DIFF_VEC is used. */
5075 || (GET_CODE (src_folded) == MINUS
5076 && GET_CODE (XEXP (src_folded, 0)) == LABEL_REF
5077 && GET_CODE (XEXP (src_folded, 1)) == LABEL_REF)))
5078 src_const = src_folded, src_const_elt = elt;
5079 else if (src_const == 0 && src_eqv_here && CONSTANT_P (src_eqv_here))
5080 src_const = src_eqv_here, src_const_elt = src_eqv_elt;
5082 /* If we don't know if the constant is in the table, get its
5083 hash code and look it up. */
5084 if (src_const && src_const_elt == 0)
5086 sets[i].src_const_hash = HASH (src_const, mode);
5087 src_const_elt = lookup (src_const, sets[i].src_const_hash, mode);
5090 sets[i].src_const = src_const;
5091 sets[i].src_const_elt = src_const_elt;
5093 /* If the constant and our source are both in the table, mark them as
5094 equivalent. Otherwise, if a constant is in the table but the source
5095 isn't, set ELT to it. */
5096 if (src_const_elt && elt
5097 && src_const_elt->first_same_value != elt->first_same_value)
5098 merge_equiv_classes (elt, src_const_elt);
5099 else if (src_const_elt && elt == 0)
5100 elt = src_const_elt;
5102 /* See if there is a register linearly related to a constant
5103 equivalent of SRC. */
5104 if (src_const
5105 && (GET_CODE (src_const) == CONST
5106 || (src_const_elt && src_const_elt->related_value != 0)))
5108 src_related = use_related_value (src_const, src_const_elt);
5109 if (src_related)
5111 struct table_elt *src_related_elt
5112 = lookup (src_related, HASH (src_related, mode), mode);
5113 if (src_related_elt && elt)
5115 if (elt->first_same_value
5116 != src_related_elt->first_same_value)
5117 /* This can occur when we previously saw a CONST
5118 involving a SYMBOL_REF and then see the SYMBOL_REF
5119 twice. Merge the involved classes. */
5120 merge_equiv_classes (elt, src_related_elt);
5122 src_related = 0;
5123 src_related_elt = 0;
5125 else if (src_related_elt && elt == 0)
5126 elt = src_related_elt;
5130 /* See if we have a CONST_INT that is already in a register in a
5131 wider mode. */
5133 if (src_const && src_related == 0 && GET_CODE (src_const) == CONST_INT
5134 && GET_MODE_CLASS (mode) == MODE_INT
5135 && GET_MODE_BITSIZE (mode) < BITS_PER_WORD)
5137 enum machine_mode wider_mode;
5139 for (wider_mode = GET_MODE_WIDER_MODE (mode);
5140 GET_MODE_BITSIZE (wider_mode) <= BITS_PER_WORD
5141 && src_related == 0;
5142 wider_mode = GET_MODE_WIDER_MODE (wider_mode))
5144 struct table_elt *const_elt
5145 = lookup (src_const, HASH (src_const, wider_mode), wider_mode);
5147 if (const_elt == 0)
5148 continue;
5150 for (const_elt = const_elt->first_same_value;
5151 const_elt; const_elt = const_elt->next_same_value)
5152 if (REG_P (const_elt->exp))
5154 src_related = gen_lowpart (mode,
5155 const_elt->exp);
5156 break;
5161 /* Another possibility is that we have an AND with a constant in
5162 a mode narrower than a word. If so, it might have been generated
5163 as part of an "if" which would narrow the AND. If we already
5164 have done the AND in a wider mode, we can use a SUBREG of that
5165 value. */
5167 if (flag_expensive_optimizations && ! src_related
5168 && GET_CODE (src) == AND && GET_CODE (XEXP (src, 1)) == CONST_INT
5169 && GET_MODE_SIZE (mode) < UNITS_PER_WORD)
5171 enum machine_mode tmode;
5172 rtx new_and = gen_rtx_AND (VOIDmode, NULL_RTX, XEXP (src, 1));
5174 for (tmode = GET_MODE_WIDER_MODE (mode);
5175 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
5176 tmode = GET_MODE_WIDER_MODE (tmode))
5178 rtx inner = gen_lowpart (tmode, XEXP (src, 0));
5179 struct table_elt *larger_elt;
5181 if (inner)
5183 PUT_MODE (new_and, tmode);
5184 XEXP (new_and, 0) = inner;
5185 larger_elt = lookup (new_and, HASH (new_and, tmode), tmode);
5186 if (larger_elt == 0)
5187 continue;
5189 for (larger_elt = larger_elt->first_same_value;
5190 larger_elt; larger_elt = larger_elt->next_same_value)
5191 if (REG_P (larger_elt->exp))
5193 src_related
5194 = gen_lowpart (mode, larger_elt->exp);
5195 break;
5198 if (src_related)
5199 break;
5204 #ifdef LOAD_EXTEND_OP
5205 /* See if a MEM has already been loaded with a widening operation;
5206 if it has, we can use a subreg of that. Many CISC machines
5207 also have such operations, but this is only likely to be
5208 beneficial on these machines. */
5210 if (flag_expensive_optimizations && src_related == 0
5211 && (GET_MODE_SIZE (mode) < UNITS_PER_WORD)
5212 && GET_MODE_CLASS (mode) == MODE_INT
5213 && MEM_P (src) && ! do_not_record
5214 && LOAD_EXTEND_OP (mode) != UNKNOWN)
5216 struct rtx_def memory_extend_buf;
5217 rtx memory_extend_rtx = &memory_extend_buf;
5218 enum machine_mode tmode;
5220 /* Set what we are trying to extend and the operation it might
5221 have been extended with. */
5222 memset (memory_extend_rtx, 0, sizeof(*memory_extend_rtx));
5223 PUT_CODE (memory_extend_rtx, LOAD_EXTEND_OP (mode));
5224 XEXP (memory_extend_rtx, 0) = src;
5226 for (tmode = GET_MODE_WIDER_MODE (mode);
5227 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
5228 tmode = GET_MODE_WIDER_MODE (tmode))
5230 struct table_elt *larger_elt;
5232 PUT_MODE (memory_extend_rtx, tmode);
5233 larger_elt = lookup (memory_extend_rtx,
5234 HASH (memory_extend_rtx, tmode), tmode);
5235 if (larger_elt == 0)
5236 continue;
5238 for (larger_elt = larger_elt->first_same_value;
5239 larger_elt; larger_elt = larger_elt->next_same_value)
5240 if (REG_P (larger_elt->exp))
5242 src_related = gen_lowpart (mode,
5243 larger_elt->exp);
5244 break;
5247 if (src_related)
5248 break;
5251 #endif /* LOAD_EXTEND_OP */
5253 if (src == src_folded)
5254 src_folded = 0;
5256 /* At this point, ELT, if nonzero, points to a class of expressions
5257 equivalent to the source of this SET and SRC, SRC_EQV, SRC_FOLDED,
5258 and SRC_RELATED, if nonzero, each contain additional equivalent
5259 expressions. Prune these latter expressions by deleting expressions
5260 already in the equivalence class.
5262 Check for an equivalent identical to the destination. If found,
5263 this is the preferred equivalent since it will likely lead to
5264 elimination of the insn. Indicate this by placing it in
5265 `src_related'. */
5267 if (elt)
5268 elt = elt->first_same_value;
5269 for (p = elt; p; p = p->next_same_value)
5271 enum rtx_code code = GET_CODE (p->exp);
5273 /* If the expression is not valid, ignore it. Then we do not
5274 have to check for validity below. In most cases, we can use
5275 `rtx_equal_p', since canonicalization has already been done. */
5276 if (code != REG && ! exp_equiv_p (p->exp, p->exp, 1, false))
5277 continue;
5279 /* Also skip paradoxical subregs, unless that's what we're
5280 looking for. */
5281 if (code == SUBREG
5282 && (GET_MODE_SIZE (GET_MODE (p->exp))
5283 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (p->exp))))
5284 && ! (src != 0
5285 && GET_CODE (src) == SUBREG
5286 && GET_MODE (src) == GET_MODE (p->exp)
5287 && (GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))
5288 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (p->exp))))))
5289 continue;
5291 if (src && GET_CODE (src) == code && rtx_equal_p (src, p->exp))
5292 src = 0;
5293 else if (src_folded && GET_CODE (src_folded) == code
5294 && rtx_equal_p (src_folded, p->exp))
5295 src_folded = 0;
5296 else if (src_eqv_here && GET_CODE (src_eqv_here) == code
5297 && rtx_equal_p (src_eqv_here, p->exp))
5298 src_eqv_here = 0;
5299 else if (src_related && GET_CODE (src_related) == code
5300 && rtx_equal_p (src_related, p->exp))
5301 src_related = 0;
5303 /* This is the same as the destination of the insns, we want
5304 to prefer it. Copy it to src_related. The code below will
5305 then give it a negative cost. */
5306 if (GET_CODE (dest) == code && rtx_equal_p (p->exp, dest))
5307 src_related = dest;
5310 /* Find the cheapest valid equivalent, trying all the available
5311 possibilities. Prefer items not in the hash table to ones
5312 that are when they are equal cost. Note that we can never
5313 worsen an insn as the current contents will also succeed.
5314 If we find an equivalent identical to the destination, use it as best,
5315 since this insn will probably be eliminated in that case. */
5316 if (src)
5318 if (rtx_equal_p (src, dest))
5319 src_cost = src_regcost = -1;
5320 else
5322 src_cost = COST (src);
5323 src_regcost = approx_reg_cost (src);
5327 if (src_eqv_here)
5329 if (rtx_equal_p (src_eqv_here, dest))
5330 src_eqv_cost = src_eqv_regcost = -1;
5331 else
5333 src_eqv_cost = COST (src_eqv_here);
5334 src_eqv_regcost = approx_reg_cost (src_eqv_here);
5338 if (src_folded)
5340 if (rtx_equal_p (src_folded, dest))
5341 src_folded_cost = src_folded_regcost = -1;
5342 else
5344 src_folded_cost = COST (src_folded);
5345 src_folded_regcost = approx_reg_cost (src_folded);
5349 if (src_related)
5351 if (rtx_equal_p (src_related, dest))
5352 src_related_cost = src_related_regcost = -1;
5353 else
5355 src_related_cost = COST (src_related);
5356 src_related_regcost = approx_reg_cost (src_related);
5360 /* If this was an indirect jump insn, a known label will really be
5361 cheaper even though it looks more expensive. */
5362 if (dest == pc_rtx && src_const && GET_CODE (src_const) == LABEL_REF)
5363 src_folded = src_const, src_folded_cost = src_folded_regcost = -1;
5365 /* Terminate loop when replacement made. This must terminate since
5366 the current contents will be tested and will always be valid. */
5367 while (1)
5369 rtx trial;
5371 /* Skip invalid entries. */
5372 while (elt && !REG_P (elt->exp)
5373 && ! exp_equiv_p (elt->exp, elt->exp, 1, false))
5374 elt = elt->next_same_value;
5376 /* A paradoxical subreg would be bad here: it'll be the right
5377 size, but later may be adjusted so that the upper bits aren't
5378 what we want. So reject it. */
5379 if (elt != 0
5380 && GET_CODE (elt->exp) == SUBREG
5381 && (GET_MODE_SIZE (GET_MODE (elt->exp))
5382 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (elt->exp))))
5383 /* It is okay, though, if the rtx we're trying to match
5384 will ignore any of the bits we can't predict. */
5385 && ! (src != 0
5386 && GET_CODE (src) == SUBREG
5387 && GET_MODE (src) == GET_MODE (elt->exp)
5388 && (GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))
5389 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (elt->exp))))))
5391 elt = elt->next_same_value;
5392 continue;
5395 if (elt)
5397 src_elt_cost = elt->cost;
5398 src_elt_regcost = elt->regcost;
5401 /* Find cheapest and skip it for the next time. For items
5402 of equal cost, use this order:
5403 src_folded, src, src_eqv, src_related and hash table entry. */
5404 if (src_folded
5405 && preferable (src_folded_cost, src_folded_regcost,
5406 src_cost, src_regcost) <= 0
5407 && preferable (src_folded_cost, src_folded_regcost,
5408 src_eqv_cost, src_eqv_regcost) <= 0
5409 && preferable (src_folded_cost, src_folded_regcost,
5410 src_related_cost, src_related_regcost) <= 0
5411 && preferable (src_folded_cost, src_folded_regcost,
5412 src_elt_cost, src_elt_regcost) <= 0)
5414 trial = src_folded, src_folded_cost = MAX_COST;
5415 if (src_folded_force_flag)
5417 rtx forced = force_const_mem (mode, trial);
5418 if (forced)
5419 trial = forced;
5422 else if (src
5423 && preferable (src_cost, src_regcost,
5424 src_eqv_cost, src_eqv_regcost) <= 0
5425 && preferable (src_cost, src_regcost,
5426 src_related_cost, src_related_regcost) <= 0
5427 && preferable (src_cost, src_regcost,
5428 src_elt_cost, src_elt_regcost) <= 0)
5429 trial = src, src_cost = MAX_COST;
5430 else if (src_eqv_here
5431 && preferable (src_eqv_cost, src_eqv_regcost,
5432 src_related_cost, src_related_regcost) <= 0
5433 && preferable (src_eqv_cost, src_eqv_regcost,
5434 src_elt_cost, src_elt_regcost) <= 0)
5435 trial = copy_rtx (src_eqv_here), src_eqv_cost = MAX_COST;
5436 else if (src_related
5437 && preferable (src_related_cost, src_related_regcost,
5438 src_elt_cost, src_elt_regcost) <= 0)
5439 trial = copy_rtx (src_related), src_related_cost = MAX_COST;
5440 else
5442 trial = copy_rtx (elt->exp);
5443 elt = elt->next_same_value;
5444 src_elt_cost = MAX_COST;
5447 /* We don't normally have an insn matching (set (pc) (pc)), so
5448 check for this separately here. We will delete such an
5449 insn below.
5451 For other cases such as a table jump or conditional jump
5452 where we know the ultimate target, go ahead and replace the
5453 operand. While that may not make a valid insn, we will
5454 reemit the jump below (and also insert any necessary
5455 barriers). */
5456 if (n_sets == 1 && dest == pc_rtx
5457 && (trial == pc_rtx
5458 || (GET_CODE (trial) == LABEL_REF
5459 && ! condjump_p (insn))))
5461 /* Don't substitute non-local labels, this confuses CFG. */
5462 if (GET_CODE (trial) == LABEL_REF
5463 && LABEL_REF_NONLOCAL_P (trial))
5464 continue;
5466 SET_SRC (sets[i].rtl) = trial;
5467 cse_jumps_altered = 1;
5468 break;
5471 /* Look for a substitution that makes a valid insn. */
5472 else if (validate_change (insn, &SET_SRC (sets[i].rtl), trial, 0))
5474 rtx new = canon_reg (SET_SRC (sets[i].rtl), insn);
5476 /* If we just made a substitution inside a libcall, then we
5477 need to make the same substitution in any notes attached
5478 to the RETVAL insn. */
5479 if (libcall_insn
5480 && (REG_P (sets[i].orig_src)
5481 || GET_CODE (sets[i].orig_src) == SUBREG
5482 || MEM_P (sets[i].orig_src)))
5484 rtx note = find_reg_equal_equiv_note (libcall_insn);
5485 if (note != 0)
5486 XEXP (note, 0) = simplify_replace_rtx (XEXP (note, 0),
5487 sets[i].orig_src,
5488 copy_rtx (new));
5491 /* The result of apply_change_group can be ignored; see
5492 canon_reg. */
5494 validate_change (insn, &SET_SRC (sets[i].rtl), new, 1);
5495 apply_change_group ();
5496 break;
5499 /* If we previously found constant pool entries for
5500 constants and this is a constant, try making a
5501 pool entry. Put it in src_folded unless we already have done
5502 this since that is where it likely came from. */
5504 else if (constant_pool_entries_cost
5505 && CONSTANT_P (trial)
5506 /* Reject cases that will abort in decode_rtx_const.
5507 On the alpha when simplifying a switch, we get
5508 (const (truncate (minus (label_ref) (label_ref)))). */
5509 && ! (GET_CODE (trial) == CONST
5510 && GET_CODE (XEXP (trial, 0)) == TRUNCATE)
5511 /* Likewise on IA-64, except without the truncate. */
5512 && ! (GET_CODE (trial) == CONST
5513 && GET_CODE (XEXP (trial, 0)) == MINUS
5514 && GET_CODE (XEXP (XEXP (trial, 0), 0)) == LABEL_REF
5515 && GET_CODE (XEXP (XEXP (trial, 0), 1)) == LABEL_REF)
5516 && (src_folded == 0
5517 || (!MEM_P (src_folded)
5518 && ! src_folded_force_flag))
5519 && GET_MODE_CLASS (mode) != MODE_CC
5520 && mode != VOIDmode)
5522 src_folded_force_flag = 1;
5523 src_folded = trial;
5524 src_folded_cost = constant_pool_entries_cost;
5525 src_folded_regcost = constant_pool_entries_regcost;
5529 src = SET_SRC (sets[i].rtl);
5531 /* In general, it is good to have a SET with SET_SRC == SET_DEST.
5532 However, there is an important exception: If both are registers
5533 that are not the head of their equivalence class, replace SET_SRC
5534 with the head of the class. If we do not do this, we will have
5535 both registers live over a portion of the basic block. This way,
5536 their lifetimes will likely abut instead of overlapping. */
5537 if (REG_P (dest)
5538 && REGNO_QTY_VALID_P (REGNO (dest)))
5540 int dest_q = REG_QTY (REGNO (dest));
5541 struct qty_table_elem *dest_ent = &qty_table[dest_q];
5543 if (dest_ent->mode == GET_MODE (dest)
5544 && dest_ent->first_reg != REGNO (dest)
5545 && REG_P (src) && REGNO (src) == REGNO (dest)
5546 /* Don't do this if the original insn had a hard reg as
5547 SET_SRC or SET_DEST. */
5548 && (!REG_P (sets[i].src)
5549 || REGNO (sets[i].src) >= FIRST_PSEUDO_REGISTER)
5550 && (!REG_P (dest) || REGNO (dest) >= FIRST_PSEUDO_REGISTER))
5551 /* We can't call canon_reg here because it won't do anything if
5552 SRC is a hard register. */
5554 int src_q = REG_QTY (REGNO (src));
5555 struct qty_table_elem *src_ent = &qty_table[src_q];
5556 int first = src_ent->first_reg;
5557 rtx new_src
5558 = (first >= FIRST_PSEUDO_REGISTER
5559 ? regno_reg_rtx[first] : gen_rtx_REG (GET_MODE (src), first));
5561 /* We must use validate-change even for this, because this
5562 might be a special no-op instruction, suitable only to
5563 tag notes onto. */
5564 if (validate_change (insn, &SET_SRC (sets[i].rtl), new_src, 0))
5566 src = new_src;
5567 /* If we had a constant that is cheaper than what we are now
5568 setting SRC to, use that constant. We ignored it when we
5569 thought we could make this into a no-op. */
5570 if (src_const && COST (src_const) < COST (src)
5571 && validate_change (insn, &SET_SRC (sets[i].rtl),
5572 src_const, 0))
5573 src = src_const;
5578 /* If we made a change, recompute SRC values. */
5579 if (src != sets[i].src)
5581 cse_altered = 1;
5582 do_not_record = 0;
5583 hash_arg_in_memory = 0;
5584 sets[i].src = src;
5585 sets[i].src_hash = HASH (src, mode);
5586 sets[i].src_volatile = do_not_record;
5587 sets[i].src_in_memory = hash_arg_in_memory;
5588 sets[i].src_elt = lookup (src, sets[i].src_hash, mode);
5591 /* If this is a single SET, we are setting a register, and we have an
5592 equivalent constant, we want to add a REG_NOTE. We don't want
5593 to write a REG_EQUAL note for a constant pseudo since verifying that
5594 that pseudo hasn't been eliminated is a pain. Such a note also
5595 won't help anything.
5597 Avoid a REG_EQUAL note for (CONST (MINUS (LABEL_REF) (LABEL_REF)))
5598 which can be created for a reference to a compile time computable
5599 entry in a jump table. */
5601 if (n_sets == 1 && src_const && REG_P (dest)
5602 && !REG_P (src_const)
5603 && ! (GET_CODE (src_const) == CONST
5604 && GET_CODE (XEXP (src_const, 0)) == MINUS
5605 && GET_CODE (XEXP (XEXP (src_const, 0), 0)) == LABEL_REF
5606 && GET_CODE (XEXP (XEXP (src_const, 0), 1)) == LABEL_REF))
5608 /* We only want a REG_EQUAL note if src_const != src. */
5609 if (! rtx_equal_p (src, src_const))
5611 /* Make sure that the rtx is not shared. */
5612 src_const = copy_rtx (src_const);
5614 /* Record the actual constant value in a REG_EQUAL note,
5615 making a new one if one does not already exist. */
5616 set_unique_reg_note (insn, REG_EQUAL, src_const);
5620 /* Now deal with the destination. */
5621 do_not_record = 0;
5623 /* Look within any ZERO_EXTRACT to the MEM or REG within it. */
5624 while (GET_CODE (dest) == SUBREG
5625 || GET_CODE (dest) == ZERO_EXTRACT
5626 || GET_CODE (dest) == STRICT_LOW_PART)
5627 dest = XEXP (dest, 0);
5629 sets[i].inner_dest = dest;
5631 if (MEM_P (dest))
5633 #ifdef PUSH_ROUNDING
5634 /* Stack pushes invalidate the stack pointer. */
5635 rtx addr = XEXP (dest, 0);
5636 if (GET_RTX_CLASS (GET_CODE (addr)) == RTX_AUTOINC
5637 && XEXP (addr, 0) == stack_pointer_rtx)
5638 invalidate (stack_pointer_rtx, Pmode);
5639 #endif
5640 dest = fold_rtx (dest, insn);
5643 /* Compute the hash code of the destination now,
5644 before the effects of this instruction are recorded,
5645 since the register values used in the address computation
5646 are those before this instruction. */
5647 sets[i].dest_hash = HASH (dest, mode);
5649 /* Don't enter a bit-field in the hash table
5650 because the value in it after the store
5651 may not equal what was stored, due to truncation. */
5653 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT)
5655 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
5657 if (src_const != 0 && GET_CODE (src_const) == CONST_INT
5658 && GET_CODE (width) == CONST_INT
5659 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
5660 && ! (INTVAL (src_const)
5661 & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
5662 /* Exception: if the value is constant,
5663 and it won't be truncated, record it. */
5665 else
5667 /* This is chosen so that the destination will be invalidated
5668 but no new value will be recorded.
5669 We must invalidate because sometimes constant
5670 values can be recorded for bitfields. */
5671 sets[i].src_elt = 0;
5672 sets[i].src_volatile = 1;
5673 src_eqv = 0;
5674 src_eqv_elt = 0;
5678 /* If only one set in a JUMP_INSN and it is now a no-op, we can delete
5679 the insn. */
5680 else if (n_sets == 1 && dest == pc_rtx && src == pc_rtx)
5682 /* One less use of the label this insn used to jump to. */
5683 delete_insn (insn);
5684 cse_jumps_altered = 1;
5685 /* No more processing for this set. */
5686 sets[i].rtl = 0;
5689 /* If this SET is now setting PC to a label, we know it used to
5690 be a conditional or computed branch. */
5691 else if (dest == pc_rtx && GET_CODE (src) == LABEL_REF
5692 && !LABEL_REF_NONLOCAL_P (src))
5694 /* Now emit a BARRIER after the unconditional jump. */
5695 if (NEXT_INSN (insn) == 0
5696 || !BARRIER_P (NEXT_INSN (insn)))
5697 emit_barrier_after (insn);
5699 /* We reemit the jump in as many cases as possible just in
5700 case the form of an unconditional jump is significantly
5701 different than a computed jump or conditional jump.
5703 If this insn has multiple sets, then reemitting the
5704 jump is nontrivial. So instead we just force rerecognition
5705 and hope for the best. */
5706 if (n_sets == 1)
5708 rtx new, note;
5710 new = emit_jump_insn_after (gen_jump (XEXP (src, 0)), insn);
5711 JUMP_LABEL (new) = XEXP (src, 0);
5712 LABEL_NUSES (XEXP (src, 0))++;
5714 /* Make sure to copy over REG_NON_LOCAL_GOTO. */
5715 note = find_reg_note (insn, REG_NON_LOCAL_GOTO, 0);
5716 if (note)
5718 XEXP (note, 1) = NULL_RTX;
5719 REG_NOTES (new) = note;
5722 delete_insn (insn);
5723 insn = new;
5725 /* Now emit a BARRIER after the unconditional jump. */
5726 if (NEXT_INSN (insn) == 0
5727 || !BARRIER_P (NEXT_INSN (insn)))
5728 emit_barrier_after (insn);
5730 else
5731 INSN_CODE (insn) = -1;
5733 /* Do not bother deleting any unreachable code,
5734 let jump/flow do that. */
5736 cse_jumps_altered = 1;
5737 sets[i].rtl = 0;
5740 /* If destination is volatile, invalidate it and then do no further
5741 processing for this assignment. */
5743 else if (do_not_record)
5745 if (REG_P (dest) || GET_CODE (dest) == SUBREG)
5746 invalidate (dest, VOIDmode);
5747 else if (MEM_P (dest))
5748 invalidate (dest, VOIDmode);
5749 else if (GET_CODE (dest) == STRICT_LOW_PART
5750 || GET_CODE (dest) == ZERO_EXTRACT)
5751 invalidate (XEXP (dest, 0), GET_MODE (dest));
5752 sets[i].rtl = 0;
5755 if (sets[i].rtl != 0 && dest != SET_DEST (sets[i].rtl))
5756 sets[i].dest_hash = HASH (SET_DEST (sets[i].rtl), mode);
5758 #ifdef HAVE_cc0
5759 /* If setting CC0, record what it was set to, or a constant, if it
5760 is equivalent to a constant. If it is being set to a floating-point
5761 value, make a COMPARE with the appropriate constant of 0. If we
5762 don't do this, later code can interpret this as a test against
5763 const0_rtx, which can cause problems if we try to put it into an
5764 insn as a floating-point operand. */
5765 if (dest == cc0_rtx)
5767 this_insn_cc0 = src_const && mode != VOIDmode ? src_const : src;
5768 this_insn_cc0_mode = mode;
5769 if (FLOAT_MODE_P (mode))
5770 this_insn_cc0 = gen_rtx_COMPARE (VOIDmode, this_insn_cc0,
5771 CONST0_RTX (mode));
5773 #endif
5776 /* Now enter all non-volatile source expressions in the hash table
5777 if they are not already present.
5778 Record their equivalence classes in src_elt.
5779 This way we can insert the corresponding destinations into
5780 the same classes even if the actual sources are no longer in them
5781 (having been invalidated). */
5783 if (src_eqv && src_eqv_elt == 0 && sets[0].rtl != 0 && ! src_eqv_volatile
5784 && ! rtx_equal_p (src_eqv, SET_DEST (sets[0].rtl)))
5786 struct table_elt *elt;
5787 struct table_elt *classp = sets[0].src_elt;
5788 rtx dest = SET_DEST (sets[0].rtl);
5789 enum machine_mode eqvmode = GET_MODE (dest);
5791 if (GET_CODE (dest) == STRICT_LOW_PART)
5793 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
5794 classp = 0;
5796 if (insert_regs (src_eqv, classp, 0))
5798 rehash_using_reg (src_eqv);
5799 src_eqv_hash = HASH (src_eqv, eqvmode);
5801 elt = insert (src_eqv, classp, src_eqv_hash, eqvmode);
5802 elt->in_memory = src_eqv_in_memory;
5803 src_eqv_elt = elt;
5805 /* Check to see if src_eqv_elt is the same as a set source which
5806 does not yet have an elt, and if so set the elt of the set source
5807 to src_eqv_elt. */
5808 for (i = 0; i < n_sets; i++)
5809 if (sets[i].rtl && sets[i].src_elt == 0
5810 && rtx_equal_p (SET_SRC (sets[i].rtl), src_eqv))
5811 sets[i].src_elt = src_eqv_elt;
5814 for (i = 0; i < n_sets; i++)
5815 if (sets[i].rtl && ! sets[i].src_volatile
5816 && ! rtx_equal_p (SET_SRC (sets[i].rtl), SET_DEST (sets[i].rtl)))
5818 if (GET_CODE (SET_DEST (sets[i].rtl)) == STRICT_LOW_PART)
5820 /* REG_EQUAL in setting a STRICT_LOW_PART
5821 gives an equivalent for the entire destination register,
5822 not just for the subreg being stored in now.
5823 This is a more interesting equivalence, so we arrange later
5824 to treat the entire reg as the destination. */
5825 sets[i].src_elt = src_eqv_elt;
5826 sets[i].src_hash = src_eqv_hash;
5828 else
5830 /* Insert source and constant equivalent into hash table, if not
5831 already present. */
5832 struct table_elt *classp = src_eqv_elt;
5833 rtx src = sets[i].src;
5834 rtx dest = SET_DEST (sets[i].rtl);
5835 enum machine_mode mode
5836 = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
5838 /* It's possible that we have a source value known to be
5839 constant but don't have a REG_EQUAL note on the insn.
5840 Lack of a note will mean src_eqv_elt will be NULL. This
5841 can happen where we've generated a SUBREG to access a
5842 CONST_INT that is already in a register in a wider mode.
5843 Ensure that the source expression is put in the proper
5844 constant class. */
5845 if (!classp)
5846 classp = sets[i].src_const_elt;
5848 if (sets[i].src_elt == 0)
5850 /* Don't put a hard register source into the table if this is
5851 the last insn of a libcall. In this case, we only need
5852 to put src_eqv_elt in src_elt. */
5853 if (! find_reg_note (insn, REG_RETVAL, NULL_RTX))
5855 struct table_elt *elt;
5857 /* Note that these insert_regs calls cannot remove
5858 any of the src_elt's, because they would have failed to
5859 match if not still valid. */
5860 if (insert_regs (src, classp, 0))
5862 rehash_using_reg (src);
5863 sets[i].src_hash = HASH (src, mode);
5865 elt = insert (src, classp, sets[i].src_hash, mode);
5866 elt->in_memory = sets[i].src_in_memory;
5867 sets[i].src_elt = classp = elt;
5869 else
5870 sets[i].src_elt = classp;
5872 if (sets[i].src_const && sets[i].src_const_elt == 0
5873 && src != sets[i].src_const
5874 && ! rtx_equal_p (sets[i].src_const, src))
5875 sets[i].src_elt = insert (sets[i].src_const, classp,
5876 sets[i].src_const_hash, mode);
5879 else if (sets[i].src_elt == 0)
5880 /* If we did not insert the source into the hash table (e.g., it was
5881 volatile), note the equivalence class for the REG_EQUAL value, if any,
5882 so that the destination goes into that class. */
5883 sets[i].src_elt = src_eqv_elt;
5885 invalidate_from_clobbers (x);
5887 /* Some registers are invalidated by subroutine calls. Memory is
5888 invalidated by non-constant calls. */
5890 if (CALL_P (insn))
5892 if (! CONST_OR_PURE_CALL_P (insn))
5893 invalidate_memory ();
5894 invalidate_for_call ();
5897 /* Now invalidate everything set by this instruction.
5898 If a SUBREG or other funny destination is being set,
5899 sets[i].rtl is still nonzero, so here we invalidate the reg
5900 a part of which is being set. */
5902 for (i = 0; i < n_sets; i++)
5903 if (sets[i].rtl)
5905 /* We can't use the inner dest, because the mode associated with
5906 a ZERO_EXTRACT is significant. */
5907 rtx dest = SET_DEST (sets[i].rtl);
5909 /* Needed for registers to remove the register from its
5910 previous quantity's chain.
5911 Needed for memory if this is a nonvarying address, unless
5912 we have just done an invalidate_memory that covers even those. */
5913 if (REG_P (dest) || GET_CODE (dest) == SUBREG)
5914 invalidate (dest, VOIDmode);
5915 else if (MEM_P (dest))
5916 invalidate (dest, VOIDmode);
5917 else if (GET_CODE (dest) == STRICT_LOW_PART
5918 || GET_CODE (dest) == ZERO_EXTRACT)
5919 invalidate (XEXP (dest, 0), GET_MODE (dest));
5922 /* A volatile ASM invalidates everything. */
5923 if (NONJUMP_INSN_P (insn)
5924 && GET_CODE (PATTERN (insn)) == ASM_OPERANDS
5925 && MEM_VOLATILE_P (PATTERN (insn)))
5926 flush_hash_table ();
5928 /* Make sure registers mentioned in destinations
5929 are safe for use in an expression to be inserted.
5930 This removes from the hash table
5931 any invalid entry that refers to one of these registers.
5933 We don't care about the return value from mention_regs because
5934 we are going to hash the SET_DEST values unconditionally. */
5936 for (i = 0; i < n_sets; i++)
5938 if (sets[i].rtl)
5940 rtx x = SET_DEST (sets[i].rtl);
5942 if (!REG_P (x))
5943 mention_regs (x);
5944 else
5946 /* We used to rely on all references to a register becoming
5947 inaccessible when a register changes to a new quantity,
5948 since that changes the hash code. However, that is not
5949 safe, since after HASH_SIZE new quantities we get a
5950 hash 'collision' of a register with its own invalid
5951 entries. And since SUBREGs have been changed not to
5952 change their hash code with the hash code of the register,
5953 it wouldn't work any longer at all. So we have to check
5954 for any invalid references lying around now.
5955 This code is similar to the REG case in mention_regs,
5956 but it knows that reg_tick has been incremented, and
5957 it leaves reg_in_table as -1 . */
5958 unsigned int regno = REGNO (x);
5959 unsigned int endregno
5960 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
5961 : hard_regno_nregs[regno][GET_MODE (x)]);
5962 unsigned int i;
5964 for (i = regno; i < endregno; i++)
5966 if (REG_IN_TABLE (i) >= 0)
5968 remove_invalid_refs (i);
5969 REG_IN_TABLE (i) = -1;
5976 /* We may have just removed some of the src_elt's from the hash table.
5977 So replace each one with the current head of the same class. */
5979 for (i = 0; i < n_sets; i++)
5980 if (sets[i].rtl)
5982 if (sets[i].src_elt && sets[i].src_elt->first_same_value == 0)
5983 /* If elt was removed, find current head of same class,
5984 or 0 if nothing remains of that class. */
5986 struct table_elt *elt = sets[i].src_elt;
5988 while (elt && elt->prev_same_value)
5989 elt = elt->prev_same_value;
5991 while (elt && elt->first_same_value == 0)
5992 elt = elt->next_same_value;
5993 sets[i].src_elt = elt ? elt->first_same_value : 0;
5997 /* Now insert the destinations into their equivalence classes. */
5999 for (i = 0; i < n_sets; i++)
6000 if (sets[i].rtl)
6002 rtx dest = SET_DEST (sets[i].rtl);
6003 struct table_elt *elt;
6005 /* Don't record value if we are not supposed to risk allocating
6006 floating-point values in registers that might be wider than
6007 memory. */
6008 if ((flag_float_store
6009 && MEM_P (dest)
6010 && FLOAT_MODE_P (GET_MODE (dest)))
6011 /* Don't record BLKmode values, because we don't know the
6012 size of it, and can't be sure that other BLKmode values
6013 have the same or smaller size. */
6014 || GET_MODE (dest) == BLKmode
6015 /* Don't record values of destinations set inside a libcall block
6016 since we might delete the libcall. Things should have been set
6017 up so we won't want to reuse such a value, but we play it safe
6018 here. */
6019 || libcall_insn
6020 /* If we didn't put a REG_EQUAL value or a source into the hash
6021 table, there is no point is recording DEST. */
6022 || sets[i].src_elt == 0
6023 /* If DEST is a paradoxical SUBREG and SRC is a ZERO_EXTEND
6024 or SIGN_EXTEND, don't record DEST since it can cause
6025 some tracking to be wrong.
6027 ??? Think about this more later. */
6028 || (GET_CODE (dest) == SUBREG
6029 && (GET_MODE_SIZE (GET_MODE (dest))
6030 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))))
6031 && (GET_CODE (sets[i].src) == SIGN_EXTEND
6032 || GET_CODE (sets[i].src) == ZERO_EXTEND)))
6033 continue;
6035 /* STRICT_LOW_PART isn't part of the value BEING set,
6036 and neither is the SUBREG inside it.
6037 Note that in this case SETS[I].SRC_ELT is really SRC_EQV_ELT. */
6038 if (GET_CODE (dest) == STRICT_LOW_PART)
6039 dest = SUBREG_REG (XEXP (dest, 0));
6041 if (REG_P (dest) || GET_CODE (dest) == SUBREG)
6042 /* Registers must also be inserted into chains for quantities. */
6043 if (insert_regs (dest, sets[i].src_elt, 1))
6045 /* If `insert_regs' changes something, the hash code must be
6046 recalculated. */
6047 rehash_using_reg (dest);
6048 sets[i].dest_hash = HASH (dest, GET_MODE (dest));
6051 elt = insert (dest, sets[i].src_elt,
6052 sets[i].dest_hash, GET_MODE (dest));
6054 elt->in_memory = (MEM_P (sets[i].inner_dest)
6055 && !MEM_READONLY_P (sets[i].inner_dest));
6057 /* If we have (set (subreg:m1 (reg:m2 foo) 0) (bar:m1)), M1 is no
6058 narrower than M2, and both M1 and M2 are the same number of words,
6059 we are also doing (set (reg:m2 foo) (subreg:m2 (bar:m1) 0)) so
6060 make that equivalence as well.
6062 However, BAR may have equivalences for which gen_lowpart
6063 will produce a simpler value than gen_lowpart applied to
6064 BAR (e.g., if BAR was ZERO_EXTENDed from M2), so we will scan all
6065 BAR's equivalences. If we don't get a simplified form, make
6066 the SUBREG. It will not be used in an equivalence, but will
6067 cause two similar assignments to be detected.
6069 Note the loop below will find SUBREG_REG (DEST) since we have
6070 already entered SRC and DEST of the SET in the table. */
6072 if (GET_CODE (dest) == SUBREG
6073 && (((GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))) - 1)
6074 / UNITS_PER_WORD)
6075 == (GET_MODE_SIZE (GET_MODE (dest)) - 1) / UNITS_PER_WORD)
6076 && (GET_MODE_SIZE (GET_MODE (dest))
6077 >= GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))))
6078 && sets[i].src_elt != 0)
6080 enum machine_mode new_mode = GET_MODE (SUBREG_REG (dest));
6081 struct table_elt *elt, *classp = 0;
6083 for (elt = sets[i].src_elt->first_same_value; elt;
6084 elt = elt->next_same_value)
6086 rtx new_src = 0;
6087 unsigned src_hash;
6088 struct table_elt *src_elt;
6089 int byte = 0;
6091 /* Ignore invalid entries. */
6092 if (!REG_P (elt->exp)
6093 && ! exp_equiv_p (elt->exp, elt->exp, 1, false))
6094 continue;
6096 /* We may have already been playing subreg games. If the
6097 mode is already correct for the destination, use it. */
6098 if (GET_MODE (elt->exp) == new_mode)
6099 new_src = elt->exp;
6100 else
6102 /* Calculate big endian correction for the SUBREG_BYTE.
6103 We have already checked that M1 (GET_MODE (dest))
6104 is not narrower than M2 (new_mode). */
6105 if (BYTES_BIG_ENDIAN)
6106 byte = (GET_MODE_SIZE (GET_MODE (dest))
6107 - GET_MODE_SIZE (new_mode));
6109 new_src = simplify_gen_subreg (new_mode, elt->exp,
6110 GET_MODE (dest), byte);
6113 /* The call to simplify_gen_subreg fails if the value
6114 is VOIDmode, yet we can't do any simplification, e.g.
6115 for EXPR_LISTs denoting function call results.
6116 It is invalid to construct a SUBREG with a VOIDmode
6117 SUBREG_REG, hence a zero new_src means we can't do
6118 this substitution. */
6119 if (! new_src)
6120 continue;
6122 src_hash = HASH (new_src, new_mode);
6123 src_elt = lookup (new_src, src_hash, new_mode);
6125 /* Put the new source in the hash table is if isn't
6126 already. */
6127 if (src_elt == 0)
6129 if (insert_regs (new_src, classp, 0))
6131 rehash_using_reg (new_src);
6132 src_hash = HASH (new_src, new_mode);
6134 src_elt = insert (new_src, classp, src_hash, new_mode);
6135 src_elt->in_memory = elt->in_memory;
6137 else if (classp && classp != src_elt->first_same_value)
6138 /* Show that two things that we've seen before are
6139 actually the same. */
6140 merge_equiv_classes (src_elt, classp);
6142 classp = src_elt->first_same_value;
6143 /* Ignore invalid entries. */
6144 while (classp
6145 && !REG_P (classp->exp)
6146 && ! exp_equiv_p (classp->exp, classp->exp, 1, false))
6147 classp = classp->next_same_value;
6152 /* Special handling for (set REG0 REG1) where REG0 is the
6153 "cheapest", cheaper than REG1. After cse, REG1 will probably not
6154 be used in the sequel, so (if easily done) change this insn to
6155 (set REG1 REG0) and replace REG1 with REG0 in the previous insn
6156 that computed their value. Then REG1 will become a dead store
6157 and won't cloud the situation for later optimizations.
6159 Do not make this change if REG1 is a hard register, because it will
6160 then be used in the sequel and we may be changing a two-operand insn
6161 into a three-operand insn.
6163 Also do not do this if we are operating on a copy of INSN.
6165 Also don't do this if INSN ends a libcall; this would cause an unrelated
6166 register to be set in the middle of a libcall, and we then get bad code
6167 if the libcall is deleted. */
6169 if (n_sets == 1 && sets[0].rtl && REG_P (SET_DEST (sets[0].rtl))
6170 && NEXT_INSN (PREV_INSN (insn)) == insn
6171 && REG_P (SET_SRC (sets[0].rtl))
6172 && REGNO (SET_SRC (sets[0].rtl)) >= FIRST_PSEUDO_REGISTER
6173 && REGNO_QTY_VALID_P (REGNO (SET_SRC (sets[0].rtl))))
6175 int src_q = REG_QTY (REGNO (SET_SRC (sets[0].rtl)));
6176 struct qty_table_elem *src_ent = &qty_table[src_q];
6178 if ((src_ent->first_reg == REGNO (SET_DEST (sets[0].rtl)))
6179 && ! find_reg_note (insn, REG_RETVAL, NULL_RTX))
6181 rtx prev = insn;
6182 /* Scan for the previous nonnote insn, but stop at a basic
6183 block boundary. */
6186 prev = PREV_INSN (prev);
6188 while (prev && NOTE_P (prev)
6189 && NOTE_LINE_NUMBER (prev) != NOTE_INSN_BASIC_BLOCK);
6191 /* Do not swap the registers around if the previous instruction
6192 attaches a REG_EQUIV note to REG1.
6194 ??? It's not entirely clear whether we can transfer a REG_EQUIV
6195 from the pseudo that originally shadowed an incoming argument
6196 to another register. Some uses of REG_EQUIV might rely on it
6197 being attached to REG1 rather than REG2.
6199 This section previously turned the REG_EQUIV into a REG_EQUAL
6200 note. We cannot do that because REG_EQUIV may provide an
6201 uninitialized stack slot when REG_PARM_STACK_SPACE is used. */
6203 if (prev != 0 && NONJUMP_INSN_P (prev)
6204 && GET_CODE (PATTERN (prev)) == SET
6205 && SET_DEST (PATTERN (prev)) == SET_SRC (sets[0].rtl)
6206 && ! find_reg_note (prev, REG_EQUIV, NULL_RTX))
6208 rtx dest = SET_DEST (sets[0].rtl);
6209 rtx src = SET_SRC (sets[0].rtl);
6210 rtx note;
6212 validate_change (prev, &SET_DEST (PATTERN (prev)), dest, 1);
6213 validate_change (insn, &SET_DEST (sets[0].rtl), src, 1);
6214 validate_change (insn, &SET_SRC (sets[0].rtl), dest, 1);
6215 apply_change_group ();
6217 /* If INSN has a REG_EQUAL note, and this note mentions
6218 REG0, then we must delete it, because the value in
6219 REG0 has changed. If the note's value is REG1, we must
6220 also delete it because that is now this insn's dest. */
6221 note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
6222 if (note != 0
6223 && (reg_mentioned_p (dest, XEXP (note, 0))
6224 || rtx_equal_p (src, XEXP (note, 0))))
6225 remove_note (insn, note);
6230 /* If this is a conditional jump insn, record any known equivalences due to
6231 the condition being tested. */
6233 if (JUMP_P (insn)
6234 && n_sets == 1 && GET_CODE (x) == SET
6235 && GET_CODE (SET_SRC (x)) == IF_THEN_ELSE)
6236 record_jump_equiv (insn, 0);
6238 #ifdef HAVE_cc0
6239 /* If the previous insn set CC0 and this insn no longer references CC0,
6240 delete the previous insn. Here we use the fact that nothing expects CC0
6241 to be valid over an insn, which is true until the final pass. */
6242 if (prev_insn && NONJUMP_INSN_P (prev_insn)
6243 && (tem = single_set (prev_insn)) != 0
6244 && SET_DEST (tem) == cc0_rtx
6245 && ! reg_mentioned_p (cc0_rtx, x))
6246 delete_insn (prev_insn);
6248 prev_insn_cc0 = this_insn_cc0;
6249 prev_insn_cc0_mode = this_insn_cc0_mode;
6250 prev_insn = insn;
6251 #endif
6254 /* Remove from the hash table all expressions that reference memory. */
6256 static void
6257 invalidate_memory (void)
6259 int i;
6260 struct table_elt *p, *next;
6262 for (i = 0; i < HASH_SIZE; i++)
6263 for (p = table[i]; p; p = next)
6265 next = p->next_same_hash;
6266 if (p->in_memory)
6267 remove_from_table (p, i);
6271 /* If ADDR is an address that implicitly affects the stack pointer, return
6272 1 and update the register tables to show the effect. Else, return 0. */
6274 static int
6275 addr_affects_sp_p (rtx addr)
6277 if (GET_RTX_CLASS (GET_CODE (addr)) == RTX_AUTOINC
6278 && REG_P (XEXP (addr, 0))
6279 && REGNO (XEXP (addr, 0)) == STACK_POINTER_REGNUM)
6281 if (REG_TICK (STACK_POINTER_REGNUM) >= 0)
6283 REG_TICK (STACK_POINTER_REGNUM)++;
6284 /* Is it possible to use a subreg of SP? */
6285 SUBREG_TICKED (STACK_POINTER_REGNUM) = -1;
6288 /* This should be *very* rare. */
6289 if (TEST_HARD_REG_BIT (hard_regs_in_table, STACK_POINTER_REGNUM))
6290 invalidate (stack_pointer_rtx, VOIDmode);
6292 return 1;
6295 return 0;
6298 /* Perform invalidation on the basis of everything about an insn
6299 except for invalidating the actual places that are SET in it.
6300 This includes the places CLOBBERed, and anything that might
6301 alias with something that is SET or CLOBBERed.
6303 X is the pattern of the insn. */
6305 static void
6306 invalidate_from_clobbers (rtx x)
6308 if (GET_CODE (x) == CLOBBER)
6310 rtx ref = XEXP (x, 0);
6311 if (ref)
6313 if (REG_P (ref) || GET_CODE (ref) == SUBREG
6314 || MEM_P (ref))
6315 invalidate (ref, VOIDmode);
6316 else if (GET_CODE (ref) == STRICT_LOW_PART
6317 || GET_CODE (ref) == ZERO_EXTRACT)
6318 invalidate (XEXP (ref, 0), GET_MODE (ref));
6321 else if (GET_CODE (x) == PARALLEL)
6323 int i;
6324 for (i = XVECLEN (x, 0) - 1; i >= 0; i--)
6326 rtx y = XVECEXP (x, 0, i);
6327 if (GET_CODE (y) == CLOBBER)
6329 rtx ref = XEXP (y, 0);
6330 if (REG_P (ref) || GET_CODE (ref) == SUBREG
6331 || MEM_P (ref))
6332 invalidate (ref, VOIDmode);
6333 else if (GET_CODE (ref) == STRICT_LOW_PART
6334 || GET_CODE (ref) == ZERO_EXTRACT)
6335 invalidate (XEXP (ref, 0), GET_MODE (ref));
6341 /* Process X, part of the REG_NOTES of an insn. Look at any REG_EQUAL notes
6342 and replace any registers in them with either an equivalent constant
6343 or the canonical form of the register. If we are inside an address,
6344 only do this if the address remains valid.
6346 OBJECT is 0 except when within a MEM in which case it is the MEM.
6348 Return the replacement for X. */
6350 static rtx
6351 cse_process_notes (rtx x, rtx object)
6353 enum rtx_code code = GET_CODE (x);
6354 const char *fmt = GET_RTX_FORMAT (code);
6355 int i;
6357 switch (code)
6359 case CONST_INT:
6360 case CONST:
6361 case SYMBOL_REF:
6362 case LABEL_REF:
6363 case CONST_DOUBLE:
6364 case CONST_VECTOR:
6365 case PC:
6366 case CC0:
6367 case LO_SUM:
6368 return x;
6370 case MEM:
6371 validate_change (x, &XEXP (x, 0),
6372 cse_process_notes (XEXP (x, 0), x), 0);
6373 return x;
6375 case EXPR_LIST:
6376 case INSN_LIST:
6377 if (REG_NOTE_KIND (x) == REG_EQUAL)
6378 XEXP (x, 0) = cse_process_notes (XEXP (x, 0), NULL_RTX);
6379 if (XEXP (x, 1))
6380 XEXP (x, 1) = cse_process_notes (XEXP (x, 1), NULL_RTX);
6381 return x;
6383 case SIGN_EXTEND:
6384 case ZERO_EXTEND:
6385 case SUBREG:
6387 rtx new = cse_process_notes (XEXP (x, 0), object);
6388 /* We don't substitute VOIDmode constants into these rtx,
6389 since they would impede folding. */
6390 if (GET_MODE (new) != VOIDmode)
6391 validate_change (object, &XEXP (x, 0), new, 0);
6392 return x;
6395 case REG:
6396 i = REG_QTY (REGNO (x));
6398 /* Return a constant or a constant register. */
6399 if (REGNO_QTY_VALID_P (REGNO (x)))
6401 struct qty_table_elem *ent = &qty_table[i];
6403 if (ent->const_rtx != NULL_RTX
6404 && (CONSTANT_P (ent->const_rtx)
6405 || REG_P (ent->const_rtx)))
6407 rtx new = gen_lowpart (GET_MODE (x), ent->const_rtx);
6408 if (new)
6409 return new;
6413 /* Otherwise, canonicalize this register. */
6414 return canon_reg (x, NULL_RTX);
6416 default:
6417 break;
6420 for (i = 0; i < GET_RTX_LENGTH (code); i++)
6421 if (fmt[i] == 'e')
6422 validate_change (object, &XEXP (x, i),
6423 cse_process_notes (XEXP (x, i), object), 0);
6425 return x;
6428 /* Process one SET of an insn that was skipped. We ignore CLOBBERs
6429 since they are done elsewhere. This function is called via note_stores. */
6431 static void
6432 invalidate_skipped_set (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
6434 enum rtx_code code = GET_CODE (dest);
6436 if (code == MEM
6437 && ! addr_affects_sp_p (dest) /* If this is not a stack push ... */
6438 /* There are times when an address can appear varying and be a PLUS
6439 during this scan when it would be a fixed address were we to know
6440 the proper equivalences. So invalidate all memory if there is
6441 a BLKmode or nonscalar memory reference or a reference to a
6442 variable address. */
6443 && (MEM_IN_STRUCT_P (dest) || GET_MODE (dest) == BLKmode
6444 || cse_rtx_varies_p (XEXP (dest, 0), 0)))
6446 invalidate_memory ();
6447 return;
6450 if (GET_CODE (set) == CLOBBER
6451 || CC0_P (dest)
6452 || dest == pc_rtx)
6453 return;
6455 if (code == STRICT_LOW_PART || code == ZERO_EXTRACT)
6456 invalidate (XEXP (dest, 0), GET_MODE (dest));
6457 else if (code == REG || code == SUBREG || code == MEM)
6458 invalidate (dest, VOIDmode);
6461 /* Invalidate all insns from START up to the end of the function or the
6462 next label. This called when we wish to CSE around a block that is
6463 conditionally executed. */
6465 static void
6466 invalidate_skipped_block (rtx start)
6468 rtx insn;
6470 for (insn = start; insn && !LABEL_P (insn);
6471 insn = NEXT_INSN (insn))
6473 if (! INSN_P (insn))
6474 continue;
6476 if (CALL_P (insn))
6478 if (! CONST_OR_PURE_CALL_P (insn))
6479 invalidate_memory ();
6480 invalidate_for_call ();
6483 invalidate_from_clobbers (PATTERN (insn));
6484 note_stores (PATTERN (insn), invalidate_skipped_set, NULL);
6488 /* Find the end of INSN's basic block and return its range,
6489 the total number of SETs in all the insns of the block, the last insn of the
6490 block, and the branch path.
6492 The branch path indicates which branches should be followed. If a nonzero
6493 path size is specified, the block should be rescanned and a different set
6494 of branches will be taken. The branch path is only used if
6495 FLAG_CSE_FOLLOW_JUMPS or FLAG_CSE_SKIP_BLOCKS is nonzero.
6497 DATA is a pointer to a struct cse_basic_block_data, defined below, that is
6498 used to describe the block. It is filled in with the information about
6499 the current block. The incoming structure's branch path, if any, is used
6500 to construct the output branch path. */
6502 static void
6503 cse_end_of_basic_block (rtx insn, struct cse_basic_block_data *data,
6504 int follow_jumps, int skip_blocks)
6506 rtx p = insn, q;
6507 int nsets = 0;
6508 int low_cuid = INSN_CUID (insn), high_cuid = INSN_CUID (insn);
6509 rtx next = INSN_P (insn) ? insn : next_real_insn (insn);
6510 int path_size = data->path_size;
6511 int path_entry = 0;
6512 int i;
6514 /* Update the previous branch path, if any. If the last branch was
6515 previously PATH_TAKEN, mark it PATH_NOT_TAKEN.
6516 If it was previously PATH_NOT_TAKEN,
6517 shorten the path by one and look at the previous branch. We know that
6518 at least one branch must have been taken if PATH_SIZE is nonzero. */
6519 while (path_size > 0)
6521 if (data->path[path_size - 1].status != PATH_NOT_TAKEN)
6523 data->path[path_size - 1].status = PATH_NOT_TAKEN;
6524 break;
6526 else
6527 path_size--;
6530 /* If the first instruction is marked with QImode, that means we've
6531 already processed this block. Our caller will look at DATA->LAST
6532 to figure out where to go next. We want to return the next block
6533 in the instruction stream, not some branched-to block somewhere
6534 else. We accomplish this by pretending our called forbid us to
6535 follow jumps, or skip blocks. */
6536 if (GET_MODE (insn) == QImode)
6537 follow_jumps = skip_blocks = 0;
6539 /* Scan to end of this basic block. */
6540 while (p && !LABEL_P (p))
6542 /* Don't cse over a call to setjmp; on some machines (eg VAX)
6543 the regs restored by the longjmp come from
6544 a later time than the setjmp. */
6545 if (PREV_INSN (p) && CALL_P (PREV_INSN (p))
6546 && find_reg_note (PREV_INSN (p), REG_SETJMP, NULL))
6547 break;
6549 /* A PARALLEL can have lots of SETs in it,
6550 especially if it is really an ASM_OPERANDS. */
6551 if (INSN_P (p) && GET_CODE (PATTERN (p)) == PARALLEL)
6552 nsets += XVECLEN (PATTERN (p), 0);
6553 else if (!NOTE_P (p))
6554 nsets += 1;
6556 /* Ignore insns made by CSE; they cannot affect the boundaries of
6557 the basic block. */
6559 if (INSN_UID (p) <= max_uid && INSN_CUID (p) > high_cuid)
6560 high_cuid = INSN_CUID (p);
6561 if (INSN_UID (p) <= max_uid && INSN_CUID (p) < low_cuid)
6562 low_cuid = INSN_CUID (p);
6564 /* See if this insn is in our branch path. If it is and we are to
6565 take it, do so. */
6566 if (path_entry < path_size && data->path[path_entry].branch == p)
6568 if (data->path[path_entry].status != PATH_NOT_TAKEN)
6569 p = JUMP_LABEL (p);
6571 /* Point to next entry in path, if any. */
6572 path_entry++;
6575 /* If this is a conditional jump, we can follow it if -fcse-follow-jumps
6576 was specified, we haven't reached our maximum path length, there are
6577 insns following the target of the jump, this is the only use of the
6578 jump label, and the target label is preceded by a BARRIER.
6580 Alternatively, we can follow the jump if it branches around a
6581 block of code and there are no other branches into the block.
6582 In this case invalidate_skipped_block will be called to invalidate any
6583 registers set in the block when following the jump. */
6585 else if ((follow_jumps || skip_blocks) && path_size < PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH) - 1
6586 && JUMP_P (p)
6587 && GET_CODE (PATTERN (p)) == SET
6588 && GET_CODE (SET_SRC (PATTERN (p))) == IF_THEN_ELSE
6589 && JUMP_LABEL (p) != 0
6590 && LABEL_NUSES (JUMP_LABEL (p)) == 1
6591 && NEXT_INSN (JUMP_LABEL (p)) != 0)
6593 for (q = PREV_INSN (JUMP_LABEL (p)); q; q = PREV_INSN (q))
6594 if ((!NOTE_P (q)
6595 || NOTE_LINE_NUMBER (q) == NOTE_INSN_LOOP_END
6596 || (PREV_INSN (q) && CALL_P (PREV_INSN (q))
6597 && find_reg_note (PREV_INSN (q), REG_SETJMP, NULL)))
6598 && (!LABEL_P (q) || LABEL_NUSES (q) != 0))
6599 break;
6601 /* If we ran into a BARRIER, this code is an extension of the
6602 basic block when the branch is taken. */
6603 if (follow_jumps && q != 0 && BARRIER_P (q))
6605 /* Don't allow ourself to keep walking around an
6606 always-executed loop. */
6607 if (next_real_insn (q) == next)
6609 p = NEXT_INSN (p);
6610 continue;
6613 /* Similarly, don't put a branch in our path more than once. */
6614 for (i = 0; i < path_entry; i++)
6615 if (data->path[i].branch == p)
6616 break;
6618 if (i != path_entry)
6619 break;
6621 data->path[path_entry].branch = p;
6622 data->path[path_entry++].status = PATH_TAKEN;
6624 /* This branch now ends our path. It was possible that we
6625 didn't see this branch the last time around (when the
6626 insn in front of the target was a JUMP_INSN that was
6627 turned into a no-op). */
6628 path_size = path_entry;
6630 p = JUMP_LABEL (p);
6631 /* Mark block so we won't scan it again later. */
6632 PUT_MODE (NEXT_INSN (p), QImode);
6634 /* Detect a branch around a block of code. */
6635 else if (skip_blocks && q != 0 && !LABEL_P (q))
6637 rtx tmp;
6639 if (next_real_insn (q) == next)
6641 p = NEXT_INSN (p);
6642 continue;
6645 for (i = 0; i < path_entry; i++)
6646 if (data->path[i].branch == p)
6647 break;
6649 if (i != path_entry)
6650 break;
6652 /* This is no_labels_between_p (p, q) with an added check for
6653 reaching the end of a function (in case Q precedes P). */
6654 for (tmp = NEXT_INSN (p); tmp && tmp != q; tmp = NEXT_INSN (tmp))
6655 if (LABEL_P (tmp))
6656 break;
6658 if (tmp == q)
6660 data->path[path_entry].branch = p;
6661 data->path[path_entry++].status = PATH_AROUND;
6663 path_size = path_entry;
6665 p = JUMP_LABEL (p);
6666 /* Mark block so we won't scan it again later. */
6667 PUT_MODE (NEXT_INSN (p), QImode);
6671 p = NEXT_INSN (p);
6674 data->low_cuid = low_cuid;
6675 data->high_cuid = high_cuid;
6676 data->nsets = nsets;
6677 data->last = p;
6679 /* If all jumps in the path are not taken, set our path length to zero
6680 so a rescan won't be done. */
6681 for (i = path_size - 1; i >= 0; i--)
6682 if (data->path[i].status != PATH_NOT_TAKEN)
6683 break;
6685 if (i == -1)
6686 data->path_size = 0;
6687 else
6688 data->path_size = path_size;
6690 /* End the current branch path. */
6691 data->path[path_size].branch = 0;
6694 /* Perform cse on the instructions of a function.
6695 F is the first instruction.
6696 NREGS is one plus the highest pseudo-reg number used in the instruction.
6698 Returns 1 if jump_optimize should be redone due to simplifications
6699 in conditional jump instructions. */
6702 cse_main (rtx f, int nregs, FILE *file)
6704 struct cse_basic_block_data val;
6705 rtx insn = f;
6706 int i;
6708 val.path = xmalloc (sizeof (struct branch_path)
6709 * PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH));
6711 cse_jumps_altered = 0;
6712 recorded_label_ref = 0;
6713 constant_pool_entries_cost = 0;
6714 constant_pool_entries_regcost = 0;
6715 val.path_size = 0;
6716 rtl_hooks = cse_rtl_hooks;
6718 init_recog ();
6719 init_alias_analysis ();
6721 reg_eqv_table = xmalloc (nregs * sizeof (struct reg_eqv_elem));
6723 /* Reset the counter indicating how many elements have been made
6724 thus far. */
6725 n_elements_made = 0;
6727 /* Find the largest uid. */
6729 max_uid = get_max_uid ();
6730 uid_cuid = xcalloc (max_uid + 1, sizeof (int));
6732 /* Compute the mapping from uids to cuids.
6733 CUIDs are numbers assigned to insns, like uids,
6734 except that cuids increase monotonically through the code.
6735 Don't assign cuids to line-number NOTEs, so that the distance in cuids
6736 between two insns is not affected by -g. */
6738 for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
6740 if (!NOTE_P (insn)
6741 || NOTE_LINE_NUMBER (insn) < 0)
6742 INSN_CUID (insn) = ++i;
6743 else
6744 /* Give a line number note the same cuid as preceding insn. */
6745 INSN_CUID (insn) = i;
6748 /* Loop over basic blocks.
6749 Compute the maximum number of qty's needed for each basic block
6750 (which is 2 for each SET). */
6751 insn = f;
6752 while (insn)
6754 cse_altered = 0;
6755 cse_end_of_basic_block (insn, &val, flag_cse_follow_jumps,
6756 flag_cse_skip_blocks);
6758 /* If this basic block was already processed or has no sets, skip it. */
6759 if (val.nsets == 0 || GET_MODE (insn) == QImode)
6761 PUT_MODE (insn, VOIDmode);
6762 insn = (val.last ? NEXT_INSN (val.last) : 0);
6763 val.path_size = 0;
6764 continue;
6767 cse_basic_block_start = val.low_cuid;
6768 cse_basic_block_end = val.high_cuid;
6769 max_qty = val.nsets * 2;
6771 if (file)
6772 fnotice (file, ";; Processing block from %d to %d, %d sets.\n",
6773 INSN_UID (insn), val.last ? INSN_UID (val.last) : 0,
6774 val.nsets);
6776 /* Make MAX_QTY bigger to give us room to optimize
6777 past the end of this basic block, if that should prove useful. */
6778 if (max_qty < 500)
6779 max_qty = 500;
6781 /* If this basic block is being extended by following certain jumps,
6782 (see `cse_end_of_basic_block'), we reprocess the code from the start.
6783 Otherwise, we start after this basic block. */
6784 if (val.path_size > 0)
6785 cse_basic_block (insn, val.last, val.path);
6786 else
6788 int old_cse_jumps_altered = cse_jumps_altered;
6789 rtx temp;
6791 /* When cse changes a conditional jump to an unconditional
6792 jump, we want to reprocess the block, since it will give
6793 us a new branch path to investigate. */
6794 cse_jumps_altered = 0;
6795 temp = cse_basic_block (insn, val.last, val.path);
6796 if (cse_jumps_altered == 0
6797 || (flag_cse_follow_jumps == 0 && flag_cse_skip_blocks == 0))
6798 insn = temp;
6800 cse_jumps_altered |= old_cse_jumps_altered;
6803 if (cse_altered)
6804 ggc_collect ();
6806 #ifdef USE_C_ALLOCA
6807 alloca (0);
6808 #endif
6811 if (max_elements_made < n_elements_made)
6812 max_elements_made = n_elements_made;
6814 /* Clean up. */
6815 end_alias_analysis ();
6816 free (uid_cuid);
6817 free (reg_eqv_table);
6818 free (val.path);
6819 rtl_hooks = general_rtl_hooks;
6821 return cse_jumps_altered || recorded_label_ref;
6824 /* Process a single basic block. FROM and TO and the limits of the basic
6825 block. NEXT_BRANCH points to the branch path when following jumps or
6826 a null path when not following jumps. */
6828 static rtx
6829 cse_basic_block (rtx from, rtx to, struct branch_path *next_branch)
6831 rtx insn;
6832 int to_usage = 0;
6833 rtx libcall_insn = NULL_RTX;
6834 int num_insns = 0;
6835 int no_conflict = 0;
6837 /* Allocate the space needed by qty_table. */
6838 qty_table = xmalloc (max_qty * sizeof (struct qty_table_elem));
6840 new_basic_block ();
6842 /* TO might be a label. If so, protect it from being deleted. */
6843 if (to != 0 && LABEL_P (to))
6844 ++LABEL_NUSES (to);
6846 for (insn = from; insn != to; insn = NEXT_INSN (insn))
6848 enum rtx_code code = GET_CODE (insn);
6850 /* If we have processed 1,000 insns, flush the hash table to
6851 avoid extreme quadratic behavior. We must not include NOTEs
6852 in the count since there may be more of them when generating
6853 debugging information. If we clear the table at different
6854 times, code generated with -g -O might be different than code
6855 generated with -O but not -g.
6857 ??? This is a real kludge and needs to be done some other way.
6858 Perhaps for 2.9. */
6859 if (code != NOTE && num_insns++ > 1000)
6861 flush_hash_table ();
6862 num_insns = 0;
6865 /* See if this is a branch that is part of the path. If so, and it is
6866 to be taken, do so. */
6867 if (next_branch->branch == insn)
6869 enum taken status = next_branch++->status;
6870 if (status != PATH_NOT_TAKEN)
6872 if (status == PATH_TAKEN)
6873 record_jump_equiv (insn, 1);
6874 else
6875 invalidate_skipped_block (NEXT_INSN (insn));
6877 /* Set the last insn as the jump insn; it doesn't affect cc0.
6878 Then follow this branch. */
6879 #ifdef HAVE_cc0
6880 prev_insn_cc0 = 0;
6881 prev_insn = insn;
6882 #endif
6883 insn = JUMP_LABEL (insn);
6884 continue;
6888 if (GET_MODE (insn) == QImode)
6889 PUT_MODE (insn, VOIDmode);
6891 if (GET_RTX_CLASS (code) == RTX_INSN)
6893 rtx p;
6895 /* Process notes first so we have all notes in canonical forms when
6896 looking for duplicate operations. */
6898 if (REG_NOTES (insn))
6899 REG_NOTES (insn) = cse_process_notes (REG_NOTES (insn), NULL_RTX);
6901 /* Track when we are inside in LIBCALL block. Inside such a block,
6902 we do not want to record destinations. The last insn of a
6903 LIBCALL block is not considered to be part of the block, since
6904 its destination is the result of the block and hence should be
6905 recorded. */
6907 if (REG_NOTES (insn) != 0)
6909 if ((p = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
6910 libcall_insn = XEXP (p, 0);
6911 else if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
6913 /* Keep libcall_insn for the last SET insn of a no-conflict
6914 block to prevent changing the destination. */
6915 if (! no_conflict)
6916 libcall_insn = 0;
6917 else
6918 no_conflict = -1;
6920 else if (find_reg_note (insn, REG_NO_CONFLICT, NULL_RTX))
6921 no_conflict = 1;
6924 cse_insn (insn, libcall_insn);
6926 if (no_conflict == -1)
6928 libcall_insn = 0;
6929 no_conflict = 0;
6932 /* If we haven't already found an insn where we added a LABEL_REF,
6933 check this one. */
6934 if (NONJUMP_INSN_P (insn) && ! recorded_label_ref
6935 && for_each_rtx (&PATTERN (insn), check_for_label_ref,
6936 (void *) insn))
6937 recorded_label_ref = 1;
6940 /* If INSN is now an unconditional jump, skip to the end of our
6941 basic block by pretending that we just did the last insn in the
6942 basic block. If we are jumping to the end of our block, show
6943 that we can have one usage of TO. */
6945 if (any_uncondjump_p (insn))
6947 if (to == 0)
6949 free (qty_table);
6950 return 0;
6953 if (JUMP_LABEL (insn) == to)
6954 to_usage = 1;
6956 /* Maybe TO was deleted because the jump is unconditional.
6957 If so, there is nothing left in this basic block. */
6958 /* ??? Perhaps it would be smarter to set TO
6959 to whatever follows this insn,
6960 and pretend the basic block had always ended here. */
6961 if (INSN_DELETED_P (to))
6962 break;
6964 insn = PREV_INSN (to);
6967 /* See if it is ok to keep on going past the label
6968 which used to end our basic block. Remember that we incremented
6969 the count of that label, so we decrement it here. If we made
6970 a jump unconditional, TO_USAGE will be one; in that case, we don't
6971 want to count the use in that jump. */
6973 if (to != 0 && NEXT_INSN (insn) == to
6974 && LABEL_P (to) && --LABEL_NUSES (to) == to_usage)
6976 struct cse_basic_block_data val;
6977 rtx prev;
6979 insn = NEXT_INSN (to);
6981 /* If TO was the last insn in the function, we are done. */
6982 if (insn == 0)
6984 free (qty_table);
6985 return 0;
6988 /* If TO was preceded by a BARRIER we are done with this block
6989 because it has no continuation. */
6990 prev = prev_nonnote_insn (to);
6991 if (prev && BARRIER_P (prev))
6993 free (qty_table);
6994 return insn;
6997 /* Find the end of the following block. Note that we won't be
6998 following branches in this case. */
6999 to_usage = 0;
7000 val.path_size = 0;
7001 val.path = xmalloc (sizeof (struct branch_path)
7002 * PARAM_VALUE (PARAM_MAX_CSE_PATH_LENGTH));
7003 cse_end_of_basic_block (insn, &val, 0, 0);
7004 free (val.path);
7006 /* If the tables we allocated have enough space left
7007 to handle all the SETs in the next basic block,
7008 continue through it. Otherwise, return,
7009 and that block will be scanned individually. */
7010 if (val.nsets * 2 + next_qty > max_qty)
7011 break;
7013 cse_basic_block_start = val.low_cuid;
7014 cse_basic_block_end = val.high_cuid;
7015 to = val.last;
7017 /* Prevent TO from being deleted if it is a label. */
7018 if (to != 0 && LABEL_P (to))
7019 ++LABEL_NUSES (to);
7021 /* Back up so we process the first insn in the extension. */
7022 insn = PREV_INSN (insn);
7026 gcc_assert (next_qty <= max_qty);
7028 free (qty_table);
7030 return to ? NEXT_INSN (to) : 0;
7033 /* Called via for_each_rtx to see if an insn is using a LABEL_REF for which
7034 there isn't a REG_LABEL note. Return one if so. DATA is the insn. */
7036 static int
7037 check_for_label_ref (rtx *rtl, void *data)
7039 rtx insn = (rtx) data;
7041 /* If this insn uses a LABEL_REF and there isn't a REG_LABEL note for it,
7042 we must rerun jump since it needs to place the note. If this is a
7043 LABEL_REF for a CODE_LABEL that isn't in the insn chain, don't do this
7044 since no REG_LABEL will be added. */
7045 return (GET_CODE (*rtl) == LABEL_REF
7046 && ! LABEL_REF_NONLOCAL_P (*rtl)
7047 && LABEL_P (XEXP (*rtl, 0))
7048 && INSN_UID (XEXP (*rtl, 0)) != 0
7049 && ! find_reg_note (insn, REG_LABEL, XEXP (*rtl, 0)));
7052 /* Count the number of times registers are used (not set) in X.
7053 COUNTS is an array in which we accumulate the count, INCR is how much
7054 we count each register usage. */
7056 static void
7057 count_reg_usage (rtx x, int *counts, int incr)
7059 enum rtx_code code;
7060 rtx note;
7061 const char *fmt;
7062 int i, j;
7064 if (x == 0)
7065 return;
7067 switch (code = GET_CODE (x))
7069 case REG:
7070 counts[REGNO (x)] += incr;
7071 return;
7073 case PC:
7074 case CC0:
7075 case CONST:
7076 case CONST_INT:
7077 case CONST_DOUBLE:
7078 case CONST_VECTOR:
7079 case SYMBOL_REF:
7080 case LABEL_REF:
7081 return;
7083 case CLOBBER:
7084 /* If we are clobbering a MEM, mark any registers inside the address
7085 as being used. */
7086 if (MEM_P (XEXP (x, 0)))
7087 count_reg_usage (XEXP (XEXP (x, 0), 0), counts, incr);
7088 return;
7090 case SET:
7091 /* Unless we are setting a REG, count everything in SET_DEST. */
7092 if (!REG_P (SET_DEST (x)))
7093 count_reg_usage (SET_DEST (x), counts, incr);
7094 count_reg_usage (SET_SRC (x), counts, incr);
7095 return;
7097 case CALL_INSN:
7098 count_reg_usage (CALL_INSN_FUNCTION_USAGE (x), counts, incr);
7099 /* Fall through. */
7101 case INSN:
7102 case JUMP_INSN:
7103 count_reg_usage (PATTERN (x), counts, incr);
7105 /* Things used in a REG_EQUAL note aren't dead since loop may try to
7106 use them. */
7108 note = find_reg_equal_equiv_note (x);
7109 if (note)
7111 rtx eqv = XEXP (note, 0);
7113 if (GET_CODE (eqv) == EXPR_LIST)
7114 /* This REG_EQUAL note describes the result of a function call.
7115 Process all the arguments. */
7118 count_reg_usage (XEXP (eqv, 0), counts, incr);
7119 eqv = XEXP (eqv, 1);
7121 while (eqv && GET_CODE (eqv) == EXPR_LIST);
7122 else
7123 count_reg_usage (eqv, counts, incr);
7125 return;
7127 case EXPR_LIST:
7128 if (REG_NOTE_KIND (x) == REG_EQUAL
7129 || (REG_NOTE_KIND (x) != REG_NONNEG && GET_CODE (XEXP (x,0)) == USE)
7130 /* FUNCTION_USAGE expression lists may include (CLOBBER (mem /u)),
7131 involving registers in the address. */
7132 || GET_CODE (XEXP (x, 0)) == CLOBBER)
7133 count_reg_usage (XEXP (x, 0), counts, incr);
7135 count_reg_usage (XEXP (x, 1), counts, incr);
7136 return;
7138 case ASM_OPERANDS:
7139 /* Iterate over just the inputs, not the constraints as well. */
7140 for (i = ASM_OPERANDS_INPUT_LENGTH (x) - 1; i >= 0; i--)
7141 count_reg_usage (ASM_OPERANDS_INPUT (x, i), counts, incr);
7142 return;
7144 case INSN_LIST:
7145 gcc_unreachable ();
7147 default:
7148 break;
7151 fmt = GET_RTX_FORMAT (code);
7152 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
7154 if (fmt[i] == 'e')
7155 count_reg_usage (XEXP (x, i), counts, incr);
7156 else if (fmt[i] == 'E')
7157 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
7158 count_reg_usage (XVECEXP (x, i, j), counts, incr);
7162 /* Return true if set is live. */
7163 static bool
7164 set_live_p (rtx set, rtx insn ATTRIBUTE_UNUSED, /* Only used with HAVE_cc0. */
7165 int *counts)
7167 #ifdef HAVE_cc0
7168 rtx tem;
7169 #endif
7171 if (set_noop_p (set))
7174 #ifdef HAVE_cc0
7175 else if (GET_CODE (SET_DEST (set)) == CC0
7176 && !side_effects_p (SET_SRC (set))
7177 && ((tem = next_nonnote_insn (insn)) == 0
7178 || !INSN_P (tem)
7179 || !reg_referenced_p (cc0_rtx, PATTERN (tem))))
7180 return false;
7181 #endif
7182 else if (!REG_P (SET_DEST (set))
7183 || REGNO (SET_DEST (set)) < FIRST_PSEUDO_REGISTER
7184 || counts[REGNO (SET_DEST (set))] != 0
7185 || side_effects_p (SET_SRC (set)))
7186 return true;
7187 return false;
7190 /* Return true if insn is live. */
7192 static bool
7193 insn_live_p (rtx insn, int *counts)
7195 int i;
7196 if (flag_non_call_exceptions && may_trap_p (PATTERN (insn)))
7197 return true;
7198 else if (GET_CODE (PATTERN (insn)) == SET)
7199 return set_live_p (PATTERN (insn), insn, counts);
7200 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
7202 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
7204 rtx elt = XVECEXP (PATTERN (insn), 0, i);
7206 if (GET_CODE (elt) == SET)
7208 if (set_live_p (elt, insn, counts))
7209 return true;
7211 else if (GET_CODE (elt) != CLOBBER && GET_CODE (elt) != USE)
7212 return true;
7214 return false;
7216 else
7217 return true;
7220 /* Return true if libcall is dead as a whole. */
7222 static bool
7223 dead_libcall_p (rtx insn, int *counts)
7225 rtx note, set, new;
7227 /* See if there's a REG_EQUAL note on this insn and try to
7228 replace the source with the REG_EQUAL expression.
7230 We assume that insns with REG_RETVALs can only be reg->reg
7231 copies at this point. */
7232 note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
7233 if (!note)
7234 return false;
7236 set = single_set (insn);
7237 if (!set)
7238 return false;
7240 new = simplify_rtx (XEXP (note, 0));
7241 if (!new)
7242 new = XEXP (note, 0);
7244 /* While changing insn, we must update the counts accordingly. */
7245 count_reg_usage (insn, counts, -1);
7247 if (validate_change (insn, &SET_SRC (set), new, 0))
7249 count_reg_usage (insn, counts, 1);
7250 remove_note (insn, find_reg_note (insn, REG_RETVAL, NULL_RTX));
7251 remove_note (insn, note);
7252 return true;
7255 if (CONSTANT_P (new))
7257 new = force_const_mem (GET_MODE (SET_DEST (set)), new);
7258 if (new && validate_change (insn, &SET_SRC (set), new, 0))
7260 count_reg_usage (insn, counts, 1);
7261 remove_note (insn, find_reg_note (insn, REG_RETVAL, NULL_RTX));
7262 remove_note (insn, note);
7263 return true;
7267 count_reg_usage (insn, counts, 1);
7268 return false;
7271 /* Scan all the insns and delete any that are dead; i.e., they store a register
7272 that is never used or they copy a register to itself.
7274 This is used to remove insns made obviously dead by cse, loop or other
7275 optimizations. It improves the heuristics in loop since it won't try to
7276 move dead invariants out of loops or make givs for dead quantities. The
7277 remaining passes of the compilation are also sped up. */
7280 delete_trivially_dead_insns (rtx insns, int nreg)
7282 int *counts;
7283 rtx insn, prev;
7284 int in_libcall = 0, dead_libcall = 0;
7285 int ndead = 0, nlastdead, niterations = 0;
7287 timevar_push (TV_DELETE_TRIVIALLY_DEAD);
7288 /* First count the number of times each register is used. */
7289 counts = xcalloc (nreg, sizeof (int));
7290 for (insn = next_real_insn (insns); insn; insn = next_real_insn (insn))
7291 count_reg_usage (insn, counts, 1);
7295 nlastdead = ndead;
7296 niterations++;
7297 /* Go from the last insn to the first and delete insns that only set unused
7298 registers or copy a register to itself. As we delete an insn, remove
7299 usage counts for registers it uses.
7301 The first jump optimization pass may leave a real insn as the last
7302 insn in the function. We must not skip that insn or we may end
7303 up deleting code that is not really dead. */
7304 insn = get_last_insn ();
7305 if (! INSN_P (insn))
7306 insn = prev_real_insn (insn);
7308 for (; insn; insn = prev)
7310 int live_insn = 0;
7312 prev = prev_real_insn (insn);
7314 /* Don't delete any insns that are part of a libcall block unless
7315 we can delete the whole libcall block.
7317 Flow or loop might get confused if we did that. Remember
7318 that we are scanning backwards. */
7319 if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
7321 in_libcall = 1;
7322 live_insn = 1;
7323 dead_libcall = dead_libcall_p (insn, counts);
7325 else if (in_libcall)
7326 live_insn = ! dead_libcall;
7327 else
7328 live_insn = insn_live_p (insn, counts);
7330 /* If this is a dead insn, delete it and show registers in it aren't
7331 being used. */
7333 if (! live_insn)
7335 count_reg_usage (insn, counts, -1);
7336 delete_insn_and_edges (insn);
7337 ndead++;
7340 if (find_reg_note (insn, REG_LIBCALL, NULL_RTX))
7342 in_libcall = 0;
7343 dead_libcall = 0;
7347 while (ndead != nlastdead);
7349 if (dump_file && ndead)
7350 fprintf (dump_file, "Deleted %i trivially dead insns; %i iterations\n",
7351 ndead, niterations);
7352 /* Clean up. */
7353 free (counts);
7354 timevar_pop (TV_DELETE_TRIVIALLY_DEAD);
7355 return ndead;
7358 /* This function is called via for_each_rtx. The argument, NEWREG, is
7359 a condition code register with the desired mode. If we are looking
7360 at the same register in a different mode, replace it with
7361 NEWREG. */
7363 static int
7364 cse_change_cc_mode (rtx *loc, void *data)
7366 struct change_cc_mode_args* args = (struct change_cc_mode_args*)data;
7368 if (*loc
7369 && REG_P (*loc)
7370 && REGNO (*loc) == REGNO (args->newreg)
7371 && GET_MODE (*loc) != GET_MODE (args->newreg))
7373 validate_change (args->insn, loc, args->newreg, 1);
7375 return -1;
7377 return 0;
7380 /* Change the mode of any reference to the register REGNO (NEWREG) to
7381 GET_MODE (NEWREG) in INSN. */
7383 static void
7384 cse_change_cc_mode_insn (rtx insn, rtx newreg)
7386 struct change_cc_mode_args args;
7387 int success;
7389 if (!INSN_P (insn))
7390 return;
7392 args.insn = insn;
7393 args.newreg = newreg;
7395 for_each_rtx (&PATTERN (insn), cse_change_cc_mode, &args);
7396 for_each_rtx (&REG_NOTES (insn), cse_change_cc_mode, &args);
7398 /* If the following assertion was triggered, there is most probably
7399 something wrong with the cc_modes_compatible back end function.
7400 CC modes only can be considered compatible if the insn - with the mode
7401 replaced by any of the compatible modes - can still be recognized. */
7402 success = apply_change_group ();
7403 gcc_assert (success);
7406 /* Change the mode of any reference to the register REGNO (NEWREG) to
7407 GET_MODE (NEWREG), starting at START. Stop before END. Stop at
7408 any instruction which modifies NEWREG. */
7410 static void
7411 cse_change_cc_mode_insns (rtx start, rtx end, rtx newreg)
7413 rtx insn;
7415 for (insn = start; insn != end; insn = NEXT_INSN (insn))
7417 if (! INSN_P (insn))
7418 continue;
7420 if (reg_set_p (newreg, insn))
7421 return;
7423 cse_change_cc_mode_insn (insn, newreg);
7427 /* BB is a basic block which finishes with CC_REG as a condition code
7428 register which is set to CC_SRC. Look through the successors of BB
7429 to find blocks which have a single predecessor (i.e., this one),
7430 and look through those blocks for an assignment to CC_REG which is
7431 equivalent to CC_SRC. CAN_CHANGE_MODE indicates whether we are
7432 permitted to change the mode of CC_SRC to a compatible mode. This
7433 returns VOIDmode if no equivalent assignments were found.
7434 Otherwise it returns the mode which CC_SRC should wind up with.
7436 The main complexity in this function is handling the mode issues.
7437 We may have more than one duplicate which we can eliminate, and we
7438 try to find a mode which will work for multiple duplicates. */
7440 static enum machine_mode
7441 cse_cc_succs (basic_block bb, rtx cc_reg, rtx cc_src, bool can_change_mode)
7443 bool found_equiv;
7444 enum machine_mode mode;
7445 unsigned int insn_count;
7446 edge e;
7447 rtx insns[2];
7448 enum machine_mode modes[2];
7449 rtx last_insns[2];
7450 unsigned int i;
7451 rtx newreg;
7452 edge_iterator ei;
7454 /* We expect to have two successors. Look at both before picking
7455 the final mode for the comparison. If we have more successors
7456 (i.e., some sort of table jump, although that seems unlikely),
7457 then we require all beyond the first two to use the same
7458 mode. */
7460 found_equiv = false;
7461 mode = GET_MODE (cc_src);
7462 insn_count = 0;
7463 FOR_EACH_EDGE (e, ei, bb->succs)
7465 rtx insn;
7466 rtx end;
7468 if (e->flags & EDGE_COMPLEX)
7469 continue;
7471 if (EDGE_COUNT (e->dest->preds) != 1
7472 || e->dest == EXIT_BLOCK_PTR)
7473 continue;
7475 end = NEXT_INSN (BB_END (e->dest));
7476 for (insn = BB_HEAD (e->dest); insn != end; insn = NEXT_INSN (insn))
7478 rtx set;
7480 if (! INSN_P (insn))
7481 continue;
7483 /* If CC_SRC is modified, we have to stop looking for
7484 something which uses it. */
7485 if (modified_in_p (cc_src, insn))
7486 break;
7488 /* Check whether INSN sets CC_REG to CC_SRC. */
7489 set = single_set (insn);
7490 if (set
7491 && REG_P (SET_DEST (set))
7492 && REGNO (SET_DEST (set)) == REGNO (cc_reg))
7494 bool found;
7495 enum machine_mode set_mode;
7496 enum machine_mode comp_mode;
7498 found = false;
7499 set_mode = GET_MODE (SET_SRC (set));
7500 comp_mode = set_mode;
7501 if (rtx_equal_p (cc_src, SET_SRC (set)))
7502 found = true;
7503 else if (GET_CODE (cc_src) == COMPARE
7504 && GET_CODE (SET_SRC (set)) == COMPARE
7505 && mode != set_mode
7506 && rtx_equal_p (XEXP (cc_src, 0),
7507 XEXP (SET_SRC (set), 0))
7508 && rtx_equal_p (XEXP (cc_src, 1),
7509 XEXP (SET_SRC (set), 1)))
7512 comp_mode = targetm.cc_modes_compatible (mode, set_mode);
7513 if (comp_mode != VOIDmode
7514 && (can_change_mode || comp_mode == mode))
7515 found = true;
7518 if (found)
7520 found_equiv = true;
7521 if (insn_count < ARRAY_SIZE (insns))
7523 insns[insn_count] = insn;
7524 modes[insn_count] = set_mode;
7525 last_insns[insn_count] = end;
7526 ++insn_count;
7528 if (mode != comp_mode)
7530 gcc_assert (can_change_mode);
7531 mode = comp_mode;
7533 /* The modified insn will be re-recognized later. */
7534 PUT_MODE (cc_src, mode);
7537 else
7539 if (set_mode != mode)
7541 /* We found a matching expression in the
7542 wrong mode, but we don't have room to
7543 store it in the array. Punt. This case
7544 should be rare. */
7545 break;
7547 /* INSN sets CC_REG to a value equal to CC_SRC
7548 with the right mode. We can simply delete
7549 it. */
7550 delete_insn (insn);
7553 /* We found an instruction to delete. Keep looking,
7554 in the hopes of finding a three-way jump. */
7555 continue;
7558 /* We found an instruction which sets the condition
7559 code, so don't look any farther. */
7560 break;
7563 /* If INSN sets CC_REG in some other way, don't look any
7564 farther. */
7565 if (reg_set_p (cc_reg, insn))
7566 break;
7569 /* If we fell off the bottom of the block, we can keep looking
7570 through successors. We pass CAN_CHANGE_MODE as false because
7571 we aren't prepared to handle compatibility between the
7572 further blocks and this block. */
7573 if (insn == end)
7575 enum machine_mode submode;
7577 submode = cse_cc_succs (e->dest, cc_reg, cc_src, false);
7578 if (submode != VOIDmode)
7580 gcc_assert (submode == mode);
7581 found_equiv = true;
7582 can_change_mode = false;
7587 if (! found_equiv)
7588 return VOIDmode;
7590 /* Now INSN_COUNT is the number of instructions we found which set
7591 CC_REG to a value equivalent to CC_SRC. The instructions are in
7592 INSNS. The modes used by those instructions are in MODES. */
7594 newreg = NULL_RTX;
7595 for (i = 0; i < insn_count; ++i)
7597 if (modes[i] != mode)
7599 /* We need to change the mode of CC_REG in INSNS[i] and
7600 subsequent instructions. */
7601 if (! newreg)
7603 if (GET_MODE (cc_reg) == mode)
7604 newreg = cc_reg;
7605 else
7606 newreg = gen_rtx_REG (mode, REGNO (cc_reg));
7608 cse_change_cc_mode_insns (NEXT_INSN (insns[i]), last_insns[i],
7609 newreg);
7612 delete_insn (insns[i]);
7615 return mode;
7618 /* If we have a fixed condition code register (or two), walk through
7619 the instructions and try to eliminate duplicate assignments. */
7621 void
7622 cse_condition_code_reg (void)
7624 unsigned int cc_regno_1;
7625 unsigned int cc_regno_2;
7626 rtx cc_reg_1;
7627 rtx cc_reg_2;
7628 basic_block bb;
7630 if (! targetm.fixed_condition_code_regs (&cc_regno_1, &cc_regno_2))
7631 return;
7633 cc_reg_1 = gen_rtx_REG (CCmode, cc_regno_1);
7634 if (cc_regno_2 != INVALID_REGNUM)
7635 cc_reg_2 = gen_rtx_REG (CCmode, cc_regno_2);
7636 else
7637 cc_reg_2 = NULL_RTX;
7639 FOR_EACH_BB (bb)
7641 rtx last_insn;
7642 rtx cc_reg;
7643 rtx insn;
7644 rtx cc_src_insn;
7645 rtx cc_src;
7646 enum machine_mode mode;
7647 enum machine_mode orig_mode;
7649 /* Look for blocks which end with a conditional jump based on a
7650 condition code register. Then look for the instruction which
7651 sets the condition code register. Then look through the
7652 successor blocks for instructions which set the condition
7653 code register to the same value. There are other possible
7654 uses of the condition code register, but these are by far the
7655 most common and the ones which we are most likely to be able
7656 to optimize. */
7658 last_insn = BB_END (bb);
7659 if (!JUMP_P (last_insn))
7660 continue;
7662 if (reg_referenced_p (cc_reg_1, PATTERN (last_insn)))
7663 cc_reg = cc_reg_1;
7664 else if (cc_reg_2 && reg_referenced_p (cc_reg_2, PATTERN (last_insn)))
7665 cc_reg = cc_reg_2;
7666 else
7667 continue;
7669 cc_src_insn = NULL_RTX;
7670 cc_src = NULL_RTX;
7671 for (insn = PREV_INSN (last_insn);
7672 insn && insn != PREV_INSN (BB_HEAD (bb));
7673 insn = PREV_INSN (insn))
7675 rtx set;
7677 if (! INSN_P (insn))
7678 continue;
7679 set = single_set (insn);
7680 if (set
7681 && REG_P (SET_DEST (set))
7682 && REGNO (SET_DEST (set)) == REGNO (cc_reg))
7684 cc_src_insn = insn;
7685 cc_src = SET_SRC (set);
7686 break;
7688 else if (reg_set_p (cc_reg, insn))
7689 break;
7692 if (! cc_src_insn)
7693 continue;
7695 if (modified_between_p (cc_src, cc_src_insn, NEXT_INSN (last_insn)))
7696 continue;
7698 /* Now CC_REG is a condition code register used for a
7699 conditional jump at the end of the block, and CC_SRC, in
7700 CC_SRC_INSN, is the value to which that condition code
7701 register is set, and CC_SRC is still meaningful at the end of
7702 the basic block. */
7704 orig_mode = GET_MODE (cc_src);
7705 mode = cse_cc_succs (bb, cc_reg, cc_src, true);
7706 if (mode != VOIDmode)
7708 gcc_assert (mode == GET_MODE (cc_src));
7709 if (mode != orig_mode)
7711 rtx newreg = gen_rtx_REG (mode, REGNO (cc_reg));
7713 cse_change_cc_mode_insn (cc_src_insn, newreg);
7715 /* Do the same in the following insns that use the
7716 current value of CC_REG within BB. */
7717 cse_change_cc_mode_insns (NEXT_INSN (cc_src_insn),
7718 NEXT_INSN (last_insn),
7719 newreg);