* emit-rtl.c (gen_lowpart_common): Suppress last change if __complex__.
[official-gcc.git] / gcc / combine.c
blob2fd6246e2ef394a90515b66b0491aa69d828b746
1 /* Optimize by combining instructions for GNU compiler.
2 Copyright (C) 1987, 88, 92-96, 1997 Free Software Foundation, Inc.
4 This file is part of GNU CC.
6 GNU CC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2, or (at your option)
9 any later version.
11 GNU CC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GNU CC; see the file COPYING. If not, write to
18 the Free Software Foundation, 59 Temple Place - Suite 330,
19 Boston, MA 02111-1307, USA. */
22 /* This module is essentially the "combiner" phase of the U. of Arizona
23 Portable Optimizer, but redone to work on our list-structured
24 representation for RTL instead of their string representation.
26 The LOG_LINKS of each insn identify the most recent assignment
27 to each REG used in the insn. It is a list of previous insns,
28 each of which contains a SET for a REG that is used in this insn
29 and not used or set in between. LOG_LINKs never cross basic blocks.
30 They were set up by the preceding pass (lifetime analysis).
32 We try to combine each pair of insns joined by a logical link.
33 We also try to combine triples of insns A, B and C when
34 C has a link back to B and B has a link back to A.
36 LOG_LINKS does not have links for use of the CC0. They don't
37 need to, because the insn that sets the CC0 is always immediately
38 before the insn that tests it. So we always regard a branch
39 insn as having a logical link to the preceding insn. The same is true
40 for an insn explicitly using CC0.
42 We check (with use_crosses_set_p) to avoid combining in such a way
43 as to move a computation to a place where its value would be different.
45 Combination is done by mathematically substituting the previous
46 insn(s) values for the regs they set into the expressions in
47 the later insns that refer to these regs. If the result is a valid insn
48 for our target machine, according to the machine description,
49 we install it, delete the earlier insns, and update the data flow
50 information (LOG_LINKS and REG_NOTES) for what we did.
52 There are a few exceptions where the dataflow information created by
53 flow.c aren't completely updated:
55 - reg_live_length is not updated
56 - reg_n_refs is not adjusted in the rare case when a register is
57 no longer required in a computation
58 - there are extremely rare cases (see distribute_regnotes) when a
59 REG_DEAD note is lost
60 - a LOG_LINKS entry that refers to an insn with multiple SETs may be
61 removed because there is no way to know which register it was
62 linking
64 To simplify substitution, we combine only when the earlier insn(s)
65 consist of only a single assignment. To simplify updating afterward,
66 we never combine when a subroutine call appears in the middle.
68 Since we do not represent assignments to CC0 explicitly except when that
69 is all an insn does, there is no LOG_LINKS entry in an insn that uses
70 the condition code for the insn that set the condition code.
71 Fortunately, these two insns must be consecutive.
72 Therefore, every JUMP_INSN is taken to have an implicit logical link
73 to the preceding insn. This is not quite right, since non-jumps can
74 also use the condition code; but in practice such insns would not
75 combine anyway. */
77 #include "config.h"
78 #ifdef __STDC__
79 #include <stdarg.h>
80 #else
81 #include <varargs.h>
82 #endif
84 /* Must precede rtl.h for FFS. */
85 #include <stdio.h>
87 #include "rtl.h"
88 #include "flags.h"
89 #include "regs.h"
90 #include "hard-reg-set.h"
91 #include "expr.h"
92 #include "basic-block.h"
93 #include "insn-config.h"
94 #include "insn-flags.h"
95 #include "insn-codes.h"
96 #include "insn-attr.h"
97 #include "recog.h"
98 #include "real.h"
100 /* It is not safe to use ordinary gen_lowpart in combine.
101 Use gen_lowpart_for_combine instead. See comments there. */
102 #define gen_lowpart dont_use_gen_lowpart_you_dummy
104 /* Number of attempts to combine instructions in this function. */
106 static int combine_attempts;
108 /* Number of attempts that got as far as substitution in this function. */
110 static int combine_merges;
112 /* Number of instructions combined with added SETs in this function. */
114 static int combine_extras;
116 /* Number of instructions combined in this function. */
118 static int combine_successes;
120 /* Totals over entire compilation. */
122 static int total_attempts, total_merges, total_extras, total_successes;
124 /* Define a default value for REVERSIBLE_CC_MODE.
125 We can never assume that a condition code mode is safe to reverse unless
126 the md tells us so. */
127 #ifndef REVERSIBLE_CC_MODE
128 #define REVERSIBLE_CC_MODE(MODE) 0
129 #endif
131 /* Vector mapping INSN_UIDs to cuids.
132 The cuids are like uids but increase monotonically always.
133 Combine always uses cuids so that it can compare them.
134 But actually renumbering the uids, which we used to do,
135 proves to be a bad idea because it makes it hard to compare
136 the dumps produced by earlier passes with those from later passes. */
138 static int *uid_cuid;
139 static int max_uid_cuid;
141 /* Get the cuid of an insn. */
143 #define INSN_CUID(INSN) \
144 (INSN_UID (INSN) > max_uid_cuid ? insn_cuid (INSN) : uid_cuid[INSN_UID (INSN)])
146 /* Maximum register number, which is the size of the tables below. */
148 static int combine_max_regno;
150 /* Record last point of death of (hard or pseudo) register n. */
152 static rtx *reg_last_death;
154 /* Record last point of modification of (hard or pseudo) register n. */
156 static rtx *reg_last_set;
158 /* Record the cuid of the last insn that invalidated memory
159 (anything that writes memory, and subroutine calls, but not pushes). */
161 static int mem_last_set;
163 /* Record the cuid of the last CALL_INSN
164 so we can tell whether a potential combination crosses any calls. */
166 static int last_call_cuid;
168 /* When `subst' is called, this is the insn that is being modified
169 (by combining in a previous insn). The PATTERN of this insn
170 is still the old pattern partially modified and it should not be
171 looked at, but this may be used to examine the successors of the insn
172 to judge whether a simplification is valid. */
174 static rtx subst_insn;
176 /* This is an insn that belongs before subst_insn, but is not currently
177 on the insn chain. */
179 static rtx subst_prev_insn;
181 /* This is the lowest CUID that `subst' is currently dealing with.
182 get_last_value will not return a value if the register was set at or
183 after this CUID. If not for this mechanism, we could get confused if
184 I2 or I1 in try_combine were an insn that used the old value of a register
185 to obtain a new value. In that case, we might erroneously get the
186 new value of the register when we wanted the old one. */
188 static int subst_low_cuid;
190 /* This contains any hard registers that are used in newpat; reg_dead_at_p
191 must consider all these registers to be always live. */
193 static HARD_REG_SET newpat_used_regs;
195 /* This is an insn to which a LOG_LINKS entry has been added. If this
196 insn is the earlier than I2 or I3, combine should rescan starting at
197 that location. */
199 static rtx added_links_insn;
201 /* Basic block number of the block in which we are performing combines. */
202 static int this_basic_block;
204 /* The next group of arrays allows the recording of the last value assigned
205 to (hard or pseudo) register n. We use this information to see if a
206 operation being processed is redundant given a prior operation performed
207 on the register. For example, an `and' with a constant is redundant if
208 all the zero bits are already known to be turned off.
210 We use an approach similar to that used by cse, but change it in the
211 following ways:
213 (1) We do not want to reinitialize at each label.
214 (2) It is useful, but not critical, to know the actual value assigned
215 to a register. Often just its form is helpful.
217 Therefore, we maintain the following arrays:
219 reg_last_set_value the last value assigned
220 reg_last_set_label records the value of label_tick when the
221 register was assigned
222 reg_last_set_table_tick records the value of label_tick when a
223 value using the register is assigned
224 reg_last_set_invalid set to non-zero when it is not valid
225 to use the value of this register in some
226 register's value
228 To understand the usage of these tables, it is important to understand
229 the distinction between the value in reg_last_set_value being valid
230 and the register being validly contained in some other expression in the
231 table.
233 Entry I in reg_last_set_value is valid if it is non-zero, and either
234 reg_n_sets[i] is 1 or reg_last_set_label[i] == label_tick.
236 Register I may validly appear in any expression returned for the value
237 of another register if reg_n_sets[i] is 1. It may also appear in the
238 value for register J if reg_last_set_label[i] < reg_last_set_label[j] or
239 reg_last_set_invalid[j] is zero.
241 If an expression is found in the table containing a register which may
242 not validly appear in an expression, the register is replaced by
243 something that won't match, (clobber (const_int 0)).
245 reg_last_set_invalid[i] is set non-zero when register I is being assigned
246 to and reg_last_set_table_tick[i] == label_tick. */
248 /* Record last value assigned to (hard or pseudo) register n. */
250 static rtx *reg_last_set_value;
252 /* Record the value of label_tick when the value for register n is placed in
253 reg_last_set_value[n]. */
255 static int *reg_last_set_label;
257 /* Record the value of label_tick when an expression involving register n
258 is placed in reg_last_set_value. */
260 static int *reg_last_set_table_tick;
262 /* Set non-zero if references to register n in expressions should not be
263 used. */
265 static char *reg_last_set_invalid;
267 /* Incremented for each label. */
269 static int label_tick;
271 /* Some registers that are set more than once and used in more than one
272 basic block are nevertheless always set in similar ways. For example,
273 a QImode register may be loaded from memory in two places on a machine
274 where byte loads zero extend.
276 We record in the following array what we know about the nonzero
277 bits of a register, specifically which bits are known to be zero.
279 If an entry is zero, it means that we don't know anything special. */
281 static unsigned HOST_WIDE_INT *reg_nonzero_bits;
283 /* Mode used to compute significance in reg_nonzero_bits. It is the largest
284 integer mode that can fit in HOST_BITS_PER_WIDE_INT. */
286 static enum machine_mode nonzero_bits_mode;
288 /* Nonzero if we know that a register has some leading bits that are always
289 equal to the sign bit. */
291 static char *reg_sign_bit_copies;
293 /* Nonzero when reg_nonzero_bits and reg_sign_bit_copies can be safely used.
294 It is zero while computing them and after combine has completed. This
295 former test prevents propagating values based on previously set values,
296 which can be incorrect if a variable is modified in a loop. */
298 static int nonzero_sign_valid;
300 /* These arrays are maintained in parallel with reg_last_set_value
301 and are used to store the mode in which the register was last set,
302 the bits that were known to be zero when it was last set, and the
303 number of sign bits copies it was known to have when it was last set. */
305 static enum machine_mode *reg_last_set_mode;
306 static unsigned HOST_WIDE_INT *reg_last_set_nonzero_bits;
307 static char *reg_last_set_sign_bit_copies;
309 /* Record one modification to rtl structure
310 to be undone by storing old_contents into *where.
311 is_int is 1 if the contents are an int. */
313 struct undo
315 struct undo *next;
316 int is_int;
317 union {rtx r; int i;} old_contents;
318 union {rtx *r; int *i;} where;
321 /* Record a bunch of changes to be undone, up to MAX_UNDO of them.
322 num_undo says how many are currently recorded.
324 storage is nonzero if we must undo the allocation of new storage.
325 The value of storage is what to pass to obfree.
327 other_insn is nonzero if we have modified some other insn in the process
328 of working on subst_insn. It must be verified too.
330 previous_undos is the value of undobuf.undos when we started processing
331 this substitution. This will prevent gen_rtx_combine from re-used a piece
332 from the previous expression. Doing so can produce circular rtl
333 structures. */
335 struct undobuf
337 char *storage;
338 struct undo *undos;
339 struct undo *frees;
340 struct undo *previous_undos;
341 rtx other_insn;
344 static struct undobuf undobuf;
346 /* Substitute NEWVAL, an rtx expression, into INTO, a place in some
347 insn. The substitution can be undone by undo_all. If INTO is already
348 set to NEWVAL, do not record this change. Because computing NEWVAL might
349 also call SUBST, we have to compute it before we put anything into
350 the undo table. */
352 #define SUBST(INTO, NEWVAL) \
353 do { rtx _new = (NEWVAL); \
354 struct undo *_buf; \
356 if (undobuf.frees) \
357 _buf = undobuf.frees, undobuf.frees = _buf->next; \
358 else \
359 _buf = (struct undo *) xmalloc (sizeof (struct undo)); \
361 _buf->is_int = 0; \
362 _buf->where.r = &INTO; \
363 _buf->old_contents.r = INTO; \
364 INTO = _new; \
365 if (_buf->old_contents.r == INTO) \
366 _buf->next = undobuf.frees, undobuf.frees = _buf; \
367 else \
368 _buf->next = undobuf.undos, undobuf.undos = _buf; \
369 } while (0)
371 /* Similar to SUBST, but NEWVAL is an int expression. Note that substitution
372 for the value of a HOST_WIDE_INT value (including CONST_INT) is
373 not safe. */
375 #define SUBST_INT(INTO, NEWVAL) \
376 do { struct undo *_buf; \
378 if (undobuf.frees) \
379 _buf = undobuf.frees, undobuf.frees = _buf->next; \
380 else \
381 _buf = (struct undo *) xmalloc (sizeof (struct undo)); \
383 _buf->is_int = 1; \
384 _buf->where.i = (int *) &INTO; \
385 _buf->old_contents.i = INTO; \
386 INTO = NEWVAL; \
387 if (_buf->old_contents.i == INTO) \
388 _buf->next = undobuf.frees, undobuf.frees = _buf; \
389 else \
390 _buf->next = undobuf.undos, undobuf.undos = _buf; \
391 } while (0)
393 /* Number of times the pseudo being substituted for
394 was found and replaced. */
396 static int n_occurrences;
398 static void init_reg_last_arrays PROTO((void));
399 static void setup_incoming_promotions PROTO((void));
400 static void set_nonzero_bits_and_sign_copies PROTO((rtx, rtx));
401 static int can_combine_p PROTO((rtx, rtx, rtx, rtx, rtx *, rtx *));
402 static int combinable_i3pat PROTO((rtx, rtx *, rtx, rtx, int, rtx *));
403 static rtx try_combine PROTO((rtx, rtx, rtx));
404 static void undo_all PROTO((void));
405 static rtx *find_split_point PROTO((rtx *, rtx));
406 static rtx subst PROTO((rtx, rtx, rtx, int, int));
407 static rtx simplify_rtx PROTO((rtx, enum machine_mode, int, int));
408 static rtx simplify_if_then_else PROTO((rtx));
409 static rtx simplify_set PROTO((rtx));
410 static rtx simplify_logical PROTO((rtx, int));
411 static rtx expand_compound_operation PROTO((rtx));
412 static rtx expand_field_assignment PROTO((rtx));
413 static rtx make_extraction PROTO((enum machine_mode, rtx, int, rtx, int,
414 int, int, int));
415 static rtx extract_left_shift PROTO((rtx, int));
416 static rtx make_compound_operation PROTO((rtx, enum rtx_code));
417 static int get_pos_from_mask PROTO((unsigned HOST_WIDE_INT, int *));
418 static rtx force_to_mode PROTO((rtx, enum machine_mode,
419 unsigned HOST_WIDE_INT, rtx, int));
420 static rtx if_then_else_cond PROTO((rtx, rtx *, rtx *));
421 static rtx known_cond PROTO((rtx, enum rtx_code, rtx, rtx));
422 static int rtx_equal_for_field_assignment_p PROTO((rtx, rtx));
423 static rtx make_field_assignment PROTO((rtx));
424 static rtx apply_distributive_law PROTO((rtx));
425 static rtx simplify_and_const_int PROTO((rtx, enum machine_mode, rtx,
426 unsigned HOST_WIDE_INT));
427 static unsigned HOST_WIDE_INT nonzero_bits PROTO((rtx, enum machine_mode));
428 static int num_sign_bit_copies PROTO((rtx, enum machine_mode));
429 static int merge_outer_ops PROTO((enum rtx_code *, HOST_WIDE_INT *,
430 enum rtx_code, HOST_WIDE_INT,
431 enum machine_mode, int *));
432 static rtx simplify_shift_const PROTO((rtx, enum rtx_code, enum machine_mode,
433 rtx, int));
434 static int recog_for_combine PROTO((rtx *, rtx, rtx *, int *));
435 static rtx gen_lowpart_for_combine PROTO((enum machine_mode, rtx));
436 static rtx gen_rtx_combine PVPROTO((enum rtx_code code, enum machine_mode mode,
437 ...));
438 static rtx gen_binary PROTO((enum rtx_code, enum machine_mode,
439 rtx, rtx));
440 static rtx gen_unary PROTO((enum rtx_code, enum machine_mode,
441 enum machine_mode, rtx));
442 static enum rtx_code simplify_comparison PROTO((enum rtx_code, rtx *, rtx *));
443 static int reversible_comparison_p PROTO((rtx));
444 static void update_table_tick PROTO((rtx));
445 static void record_value_for_reg PROTO((rtx, rtx, rtx));
446 static void record_dead_and_set_regs_1 PROTO((rtx, rtx));
447 static void record_dead_and_set_regs PROTO((rtx));
448 static int get_last_value_validate PROTO((rtx *, rtx, int, int));
449 static rtx get_last_value PROTO((rtx));
450 static int use_crosses_set_p PROTO((rtx, int));
451 static void reg_dead_at_p_1 PROTO((rtx, rtx));
452 static int reg_dead_at_p PROTO((rtx, rtx));
453 static void move_deaths PROTO((rtx, rtx, int, rtx, rtx *));
454 static int reg_bitfield_target_p PROTO((rtx, rtx));
455 static void distribute_notes PROTO((rtx, rtx, rtx, rtx, rtx, rtx));
456 static void distribute_links PROTO((rtx));
457 static void mark_used_regs_combine PROTO((rtx));
458 static int insn_cuid PROTO((rtx));
460 /* Main entry point for combiner. F is the first insn of the function.
461 NREGS is the first unused pseudo-reg number. */
463 void
464 combine_instructions (f, nregs)
465 rtx f;
466 int nregs;
468 register rtx insn, next, prev;
469 register int i;
470 register rtx links, nextlinks;
472 combine_attempts = 0;
473 combine_merges = 0;
474 combine_extras = 0;
475 combine_successes = 0;
476 undobuf.undos = undobuf.previous_undos = 0;
478 combine_max_regno = nregs;
480 reg_nonzero_bits
481 = (unsigned HOST_WIDE_INT *) alloca (nregs * sizeof (HOST_WIDE_INT));
482 reg_sign_bit_copies = (char *) alloca (nregs * sizeof (char));
484 bzero ((char *) reg_nonzero_bits, nregs * sizeof (HOST_WIDE_INT));
485 bzero (reg_sign_bit_copies, nregs * sizeof (char));
487 reg_last_death = (rtx *) alloca (nregs * sizeof (rtx));
488 reg_last_set = (rtx *) alloca (nregs * sizeof (rtx));
489 reg_last_set_value = (rtx *) alloca (nregs * sizeof (rtx));
490 reg_last_set_table_tick = (int *) alloca (nregs * sizeof (int));
491 reg_last_set_label = (int *) alloca (nregs * sizeof (int));
492 reg_last_set_invalid = (char *) alloca (nregs * sizeof (char));
493 reg_last_set_mode
494 = (enum machine_mode *) alloca (nregs * sizeof (enum machine_mode));
495 reg_last_set_nonzero_bits
496 = (unsigned HOST_WIDE_INT *) alloca (nregs * sizeof (HOST_WIDE_INT));
497 reg_last_set_sign_bit_copies
498 = (char *) alloca (nregs * sizeof (char));
500 init_reg_last_arrays ();
502 init_recog_no_volatile ();
504 /* Compute maximum uid value so uid_cuid can be allocated. */
506 for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
507 if (INSN_UID (insn) > i)
508 i = INSN_UID (insn);
510 uid_cuid = (int *) alloca ((i + 1) * sizeof (int));
511 max_uid_cuid = i;
513 nonzero_bits_mode = mode_for_size (HOST_BITS_PER_WIDE_INT, MODE_INT, 0);
515 /* Don't use reg_nonzero_bits when computing it. This can cause problems
516 when, for example, we have j <<= 1 in a loop. */
518 nonzero_sign_valid = 0;
520 /* Compute the mapping from uids to cuids.
521 Cuids are numbers assigned to insns, like uids,
522 except that cuids increase monotonically through the code.
524 Scan all SETs and see if we can deduce anything about what
525 bits are known to be zero for some registers and how many copies
526 of the sign bit are known to exist for those registers.
528 Also set any known values so that we can use it while searching
529 for what bits are known to be set. */
531 label_tick = 1;
533 /* We need to initialize it here, because record_dead_and_set_regs may call
534 get_last_value. */
535 subst_prev_insn = NULL_RTX;
537 setup_incoming_promotions ();
539 for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
541 uid_cuid[INSN_UID (insn)] = ++i;
542 subst_low_cuid = i;
543 subst_insn = insn;
545 if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
547 note_stores (PATTERN (insn), set_nonzero_bits_and_sign_copies);
548 record_dead_and_set_regs (insn);
550 #ifdef AUTO_INC_DEC
551 for (links = REG_NOTES (insn); links; links = XEXP (links, 1))
552 if (REG_NOTE_KIND (links) == REG_INC)
553 set_nonzero_bits_and_sign_copies (XEXP (links, 0), NULL_RTX);
554 #endif
557 if (GET_CODE (insn) == CODE_LABEL)
558 label_tick++;
561 nonzero_sign_valid = 1;
563 /* Now scan all the insns in forward order. */
565 this_basic_block = -1;
566 label_tick = 1;
567 last_call_cuid = 0;
568 mem_last_set = 0;
569 init_reg_last_arrays ();
570 setup_incoming_promotions ();
572 for (insn = f; insn; insn = next ? next : NEXT_INSN (insn))
574 next = 0;
576 /* If INSN starts a new basic block, update our basic block number. */
577 if (this_basic_block + 1 < n_basic_blocks
578 && basic_block_head[this_basic_block + 1] == insn)
579 this_basic_block++;
581 if (GET_CODE (insn) == CODE_LABEL)
582 label_tick++;
584 else if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
586 /* Try this insn with each insn it links back to. */
588 for (links = LOG_LINKS (insn); links; links = XEXP (links, 1))
589 if ((next = try_combine (insn, XEXP (links, 0), NULL_RTX)) != 0)
590 goto retry;
592 /* Try each sequence of three linked insns ending with this one. */
594 for (links = LOG_LINKS (insn); links; links = XEXP (links, 1))
595 for (nextlinks = LOG_LINKS (XEXP (links, 0)); nextlinks;
596 nextlinks = XEXP (nextlinks, 1))
597 if ((next = try_combine (insn, XEXP (links, 0),
598 XEXP (nextlinks, 0))) != 0)
599 goto retry;
601 #ifdef HAVE_cc0
602 /* Try to combine a jump insn that uses CC0
603 with a preceding insn that sets CC0, and maybe with its
604 logical predecessor as well.
605 This is how we make decrement-and-branch insns.
606 We need this special code because data flow connections
607 via CC0 do not get entered in LOG_LINKS. */
609 if (GET_CODE (insn) == JUMP_INSN
610 && (prev = prev_nonnote_insn (insn)) != 0
611 && GET_CODE (prev) == INSN
612 && sets_cc0_p (PATTERN (prev)))
614 if ((next = try_combine (insn, prev, NULL_RTX)) != 0)
615 goto retry;
617 for (nextlinks = LOG_LINKS (prev); nextlinks;
618 nextlinks = XEXP (nextlinks, 1))
619 if ((next = try_combine (insn, prev,
620 XEXP (nextlinks, 0))) != 0)
621 goto retry;
624 /* Do the same for an insn that explicitly references CC0. */
625 if (GET_CODE (insn) == INSN
626 && (prev = prev_nonnote_insn (insn)) != 0
627 && GET_CODE (prev) == INSN
628 && sets_cc0_p (PATTERN (prev))
629 && GET_CODE (PATTERN (insn)) == SET
630 && reg_mentioned_p (cc0_rtx, SET_SRC (PATTERN (insn))))
632 if ((next = try_combine (insn, prev, NULL_RTX)) != 0)
633 goto retry;
635 for (nextlinks = LOG_LINKS (prev); nextlinks;
636 nextlinks = XEXP (nextlinks, 1))
637 if ((next = try_combine (insn, prev,
638 XEXP (nextlinks, 0))) != 0)
639 goto retry;
642 /* Finally, see if any of the insns that this insn links to
643 explicitly references CC0. If so, try this insn, that insn,
644 and its predecessor if it sets CC0. */
645 for (links = LOG_LINKS (insn); links; links = XEXP (links, 1))
646 if (GET_CODE (XEXP (links, 0)) == INSN
647 && GET_CODE (PATTERN (XEXP (links, 0))) == SET
648 && reg_mentioned_p (cc0_rtx, SET_SRC (PATTERN (XEXP (links, 0))))
649 && (prev = prev_nonnote_insn (XEXP (links, 0))) != 0
650 && GET_CODE (prev) == INSN
651 && sets_cc0_p (PATTERN (prev))
652 && (next = try_combine (insn, XEXP (links, 0), prev)) != 0)
653 goto retry;
654 #endif
656 /* Try combining an insn with two different insns whose results it
657 uses. */
658 for (links = LOG_LINKS (insn); links; links = XEXP (links, 1))
659 for (nextlinks = XEXP (links, 1); nextlinks;
660 nextlinks = XEXP (nextlinks, 1))
661 if ((next = try_combine (insn, XEXP (links, 0),
662 XEXP (nextlinks, 0))) != 0)
663 goto retry;
665 if (GET_CODE (insn) != NOTE)
666 record_dead_and_set_regs (insn);
668 retry:
673 total_attempts += combine_attempts;
674 total_merges += combine_merges;
675 total_extras += combine_extras;
676 total_successes += combine_successes;
678 nonzero_sign_valid = 0;
681 /* Wipe the reg_last_xxx arrays in preparation for another pass. */
683 static void
684 init_reg_last_arrays ()
686 int nregs = combine_max_regno;
688 bzero ((char *) reg_last_death, nregs * sizeof (rtx));
689 bzero ((char *) reg_last_set, nregs * sizeof (rtx));
690 bzero ((char *) reg_last_set_value, nregs * sizeof (rtx));
691 bzero ((char *) reg_last_set_table_tick, nregs * sizeof (int));
692 bzero ((char *) reg_last_set_label, nregs * sizeof (int));
693 bzero (reg_last_set_invalid, nregs * sizeof (char));
694 bzero ((char *) reg_last_set_mode, nregs * sizeof (enum machine_mode));
695 bzero ((char *) reg_last_set_nonzero_bits, nregs * sizeof (HOST_WIDE_INT));
696 bzero (reg_last_set_sign_bit_copies, nregs * sizeof (char));
699 /* Set up any promoted values for incoming argument registers. */
701 static void
702 setup_incoming_promotions ()
704 #ifdef PROMOTE_FUNCTION_ARGS
705 int regno;
706 rtx reg;
707 enum machine_mode mode;
708 int unsignedp;
709 rtx first = get_insns ();
711 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
712 if (FUNCTION_ARG_REGNO_P (regno)
713 && (reg = promoted_input_arg (regno, &mode, &unsignedp)) != 0)
714 record_value_for_reg (reg, first,
715 gen_rtx (unsignedp ? ZERO_EXTEND : SIGN_EXTEND,
716 GET_MODE (reg),
717 gen_rtx (CLOBBER, mode, const0_rtx)));
718 #endif
721 /* Called via note_stores. If X is a pseudo that is narrower than
722 HOST_BITS_PER_WIDE_INT and is being set, record what bits are known zero.
724 If we are setting only a portion of X and we can't figure out what
725 portion, assume all bits will be used since we don't know what will
726 be happening.
728 Similarly, set how many bits of X are known to be copies of the sign bit
729 at all locations in the function. This is the smallest number implied
730 by any set of X. */
732 static void
733 set_nonzero_bits_and_sign_copies (x, set)
734 rtx x;
735 rtx set;
737 int num;
739 if (GET_CODE (x) == REG
740 && REGNO (x) >= FIRST_PSEUDO_REGISTER
741 /* If this register is undefined at the start of the file, we can't
742 say what its contents were. */
743 && ! REGNO_REG_SET_P (basic_block_live_at_start[0], REGNO (x))
744 && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT)
746 if (set == 0 || GET_CODE (set) == CLOBBER)
748 reg_nonzero_bits[REGNO (x)] = GET_MODE_MASK (GET_MODE (x));
749 reg_sign_bit_copies[REGNO (x)] = 1;
750 return;
753 /* If this is a complex assignment, see if we can convert it into a
754 simple assignment. */
755 set = expand_field_assignment (set);
757 /* If this is a simple assignment, or we have a paradoxical SUBREG,
758 set what we know about X. */
760 if (SET_DEST (set) == x
761 || (GET_CODE (SET_DEST (set)) == SUBREG
762 && (GET_MODE_SIZE (GET_MODE (SET_DEST (set)))
763 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (SET_DEST (set)))))
764 && SUBREG_REG (SET_DEST (set)) == x))
766 rtx src = SET_SRC (set);
768 #ifdef SHORT_IMMEDIATES_SIGN_EXTEND
769 /* If X is narrower than a word and SRC is a non-negative
770 constant that would appear negative in the mode of X,
771 sign-extend it for use in reg_nonzero_bits because some
772 machines (maybe most) will actually do the sign-extension
773 and this is the conservative approach.
775 ??? For 2.5, try to tighten up the MD files in this regard
776 instead of this kludge. */
778 if (GET_MODE_BITSIZE (GET_MODE (x)) < BITS_PER_WORD
779 && GET_CODE (src) == CONST_INT
780 && INTVAL (src) > 0
781 && 0 != (INTVAL (src)
782 & ((HOST_WIDE_INT) 1
783 << (GET_MODE_BITSIZE (GET_MODE (x)) - 1))))
784 src = GEN_INT (INTVAL (src)
785 | ((HOST_WIDE_INT) (-1)
786 << GET_MODE_BITSIZE (GET_MODE (x))));
787 #endif
789 reg_nonzero_bits[REGNO (x)]
790 |= nonzero_bits (src, nonzero_bits_mode);
791 num = num_sign_bit_copies (SET_SRC (set), GET_MODE (x));
792 if (reg_sign_bit_copies[REGNO (x)] == 0
793 || reg_sign_bit_copies[REGNO (x)] > num)
794 reg_sign_bit_copies[REGNO (x)] = num;
796 else
798 reg_nonzero_bits[REGNO (x)] = GET_MODE_MASK (GET_MODE (x));
799 reg_sign_bit_copies[REGNO (x)] = 1;
804 /* See if INSN can be combined into I3. PRED and SUCC are optionally
805 insns that were previously combined into I3 or that will be combined
806 into the merger of INSN and I3.
808 Return 0 if the combination is not allowed for any reason.
810 If the combination is allowed, *PDEST will be set to the single
811 destination of INSN and *PSRC to the single source, and this function
812 will return 1. */
814 static int
815 can_combine_p (insn, i3, pred, succ, pdest, psrc)
816 rtx insn;
817 rtx i3;
818 rtx pred, succ;
819 rtx *pdest, *psrc;
821 int i;
822 rtx set = 0, src, dest;
823 rtx p, link;
824 int all_adjacent = (succ ? (next_active_insn (insn) == succ
825 && next_active_insn (succ) == i3)
826 : next_active_insn (insn) == i3);
828 /* Can combine only if previous insn is a SET of a REG, a SUBREG or CC0.
829 or a PARALLEL consisting of such a SET and CLOBBERs.
831 If INSN has CLOBBER parallel parts, ignore them for our processing.
832 By definition, these happen during the execution of the insn. When it
833 is merged with another insn, all bets are off. If they are, in fact,
834 needed and aren't also supplied in I3, they may be added by
835 recog_for_combine. Otherwise, it won't match.
837 We can also ignore a SET whose SET_DEST is mentioned in a REG_UNUSED
838 note.
840 Get the source and destination of INSN. If more than one, can't
841 combine. */
843 if (GET_CODE (PATTERN (insn)) == SET)
844 set = PATTERN (insn);
845 else if (GET_CODE (PATTERN (insn)) == PARALLEL
846 && GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) == SET)
848 for (i = 0; i < XVECLEN (PATTERN (insn), 0); i++)
850 rtx elt = XVECEXP (PATTERN (insn), 0, i);
852 switch (GET_CODE (elt))
854 /* We can ignore CLOBBERs. */
855 case CLOBBER:
856 break;
858 case SET:
859 /* Ignore SETs whose result isn't used but not those that
860 have side-effects. */
861 if (find_reg_note (insn, REG_UNUSED, SET_DEST (elt))
862 && ! side_effects_p (elt))
863 break;
865 /* If we have already found a SET, this is a second one and
866 so we cannot combine with this insn. */
867 if (set)
868 return 0;
870 set = elt;
871 break;
873 default:
874 /* Anything else means we can't combine. */
875 return 0;
879 if (set == 0
880 /* If SET_SRC is an ASM_OPERANDS we can't throw away these CLOBBERs,
881 so don't do anything with it. */
882 || GET_CODE (SET_SRC (set)) == ASM_OPERANDS)
883 return 0;
885 else
886 return 0;
888 if (set == 0)
889 return 0;
891 set = expand_field_assignment (set);
892 src = SET_SRC (set), dest = SET_DEST (set);
894 /* Don't eliminate a store in the stack pointer. */
895 if (dest == stack_pointer_rtx
896 /* If we couldn't eliminate a field assignment, we can't combine. */
897 || GET_CODE (dest) == ZERO_EXTRACT || GET_CODE (dest) == STRICT_LOW_PART
898 /* Don't combine with an insn that sets a register to itself if it has
899 a REG_EQUAL note. This may be part of a REG_NO_CONFLICT sequence. */
900 || (rtx_equal_p (src, dest) && find_reg_note (insn, REG_EQUAL, NULL_RTX))
901 /* Can't merge a function call. */
902 || GET_CODE (src) == CALL
903 /* Don't eliminate a function call argument. */
904 || (GET_CODE (i3) == CALL_INSN
905 && (find_reg_fusage (i3, USE, dest)
906 || (GET_CODE (dest) == REG
907 && REGNO (dest) < FIRST_PSEUDO_REGISTER
908 && global_regs[REGNO (dest)])))
909 /* Don't substitute into an incremented register. */
910 || FIND_REG_INC_NOTE (i3, dest)
911 || (succ && FIND_REG_INC_NOTE (succ, dest))
912 /* Don't combine the end of a libcall into anything. */
913 || find_reg_note (insn, REG_RETVAL, NULL_RTX)
914 /* Make sure that DEST is not used after SUCC but before I3. */
915 || (succ && ! all_adjacent
916 && reg_used_between_p (dest, succ, i3))
917 /* Make sure that the value that is to be substituted for the register
918 does not use any registers whose values alter in between. However,
919 If the insns are adjacent, a use can't cross a set even though we
920 think it might (this can happen for a sequence of insns each setting
921 the same destination; reg_last_set of that register might point to
922 a NOTE). If INSN has a REG_EQUIV note, the register is always
923 equivalent to the memory so the substitution is valid even if there
924 are intervening stores. Also, don't move a volatile asm or
925 UNSPEC_VOLATILE across any other insns. */
926 || (! all_adjacent
927 && (((GET_CODE (src) != MEM
928 || ! find_reg_note (insn, REG_EQUIV, src))
929 && use_crosses_set_p (src, INSN_CUID (insn)))
930 || (GET_CODE (src) == ASM_OPERANDS && MEM_VOLATILE_P (src))
931 || GET_CODE (src) == UNSPEC_VOLATILE))
932 /* If there is a REG_NO_CONFLICT note for DEST in I3 or SUCC, we get
933 better register allocation by not doing the combine. */
934 || find_reg_note (i3, REG_NO_CONFLICT, dest)
935 || (succ && find_reg_note (succ, REG_NO_CONFLICT, dest))
936 /* Don't combine across a CALL_INSN, because that would possibly
937 change whether the life span of some REGs crosses calls or not,
938 and it is a pain to update that information.
939 Exception: if source is a constant, moving it later can't hurt.
940 Accept that special case, because it helps -fforce-addr a lot. */
941 || (INSN_CUID (insn) < last_call_cuid && ! CONSTANT_P (src)))
942 return 0;
944 /* DEST must either be a REG or CC0. */
945 if (GET_CODE (dest) == REG)
947 /* If register alignment is being enforced for multi-word items in all
948 cases except for parameters, it is possible to have a register copy
949 insn referencing a hard register that is not allowed to contain the
950 mode being copied and which would not be valid as an operand of most
951 insns. Eliminate this problem by not combining with such an insn.
953 Also, on some machines we don't want to extend the life of a hard
954 register.
956 This is the same test done in can_combine except that we don't test
957 if SRC is a CALL operation to permit a hard register with
958 SMALL_REGISTER_CLASSES, and that we have to take all_adjacent
959 into account. */
961 if (GET_CODE (src) == REG
962 && ((REGNO (dest) < FIRST_PSEUDO_REGISTER
963 && ! HARD_REGNO_MODE_OK (REGNO (dest), GET_MODE (dest)))
964 /* Don't extend the life of a hard register unless it is
965 user variable (if we have few registers) or it can't
966 fit into the desired register (meaning something special
967 is going on).
968 Also avoid substituting a return register into I3, because
969 reload can't handle a conflict with constraints of other
970 inputs. */
971 || (REGNO (src) < FIRST_PSEUDO_REGISTER
972 && (! HARD_REGNO_MODE_OK (REGNO (src), GET_MODE (src))
973 #ifdef SMALL_REGISTER_CLASSES
974 || (SMALL_REGISTER_CLASSES
975 && ((! all_adjacent && ! REG_USERVAR_P (src))
976 || (FUNCTION_VALUE_REGNO_P (REGNO (src))
977 && ! REG_USERVAR_P (src))))
978 #endif
979 ))))
980 return 0;
982 else if (GET_CODE (dest) != CC0)
983 return 0;
985 /* Don't substitute for a register intended as a clobberable operand.
986 Similarly, don't substitute an expression containing a register that
987 will be clobbered in I3. */
988 if (GET_CODE (PATTERN (i3)) == PARALLEL)
989 for (i = XVECLEN (PATTERN (i3), 0) - 1; i >= 0; i--)
990 if (GET_CODE (XVECEXP (PATTERN (i3), 0, i)) == CLOBBER
991 && (reg_overlap_mentioned_p (XEXP (XVECEXP (PATTERN (i3), 0, i), 0),
992 src)
993 || rtx_equal_p (XEXP (XVECEXP (PATTERN (i3), 0, i), 0), dest)))
994 return 0;
996 /* If INSN contains anything volatile, or is an `asm' (whether volatile
997 or not), reject, unless nothing volatile comes between it and I3,
998 with the exception of SUCC. */
1000 if (GET_CODE (src) == ASM_OPERANDS || volatile_refs_p (src))
1001 for (p = NEXT_INSN (insn); p != i3; p = NEXT_INSN (p))
1002 if (GET_RTX_CLASS (GET_CODE (p)) == 'i'
1003 && p != succ && volatile_refs_p (PATTERN (p)))
1004 return 0;
1006 /* If INSN is an asm, and DEST is a hard register, reject, since it has
1007 to be an explicit register variable, and was chosen for a reason. */
1009 if (GET_CODE (src) == ASM_OPERANDS
1010 && GET_CODE (dest) == REG && REGNO (dest) < FIRST_PSEUDO_REGISTER)
1011 return 0;
1013 /* If there are any volatile insns between INSN and I3, reject, because
1014 they might affect machine state. */
1016 for (p = NEXT_INSN (insn); p != i3; p = NEXT_INSN (p))
1017 if (GET_RTX_CLASS (GET_CODE (p)) == 'i'
1018 && p != succ && volatile_insn_p (PATTERN (p)))
1019 return 0;
1021 /* If INSN or I2 contains an autoincrement or autodecrement,
1022 make sure that register is not used between there and I3,
1023 and not already used in I3 either.
1024 Also insist that I3 not be a jump; if it were one
1025 and the incremented register were spilled, we would lose. */
1027 #ifdef AUTO_INC_DEC
1028 for (link = REG_NOTES (insn); link; link = XEXP (link, 1))
1029 if (REG_NOTE_KIND (link) == REG_INC
1030 && (GET_CODE (i3) == JUMP_INSN
1031 || reg_used_between_p (XEXP (link, 0), insn, i3)
1032 || reg_overlap_mentioned_p (XEXP (link, 0), PATTERN (i3))))
1033 return 0;
1034 #endif
1036 #ifdef HAVE_cc0
1037 /* Don't combine an insn that follows a CC0-setting insn.
1038 An insn that uses CC0 must not be separated from the one that sets it.
1039 We do, however, allow I2 to follow a CC0-setting insn if that insn
1040 is passed as I1; in that case it will be deleted also.
1041 We also allow combining in this case if all the insns are adjacent
1042 because that would leave the two CC0 insns adjacent as well.
1043 It would be more logical to test whether CC0 occurs inside I1 or I2,
1044 but that would be much slower, and this ought to be equivalent. */
1046 p = prev_nonnote_insn (insn);
1047 if (p && p != pred && GET_CODE (p) == INSN && sets_cc0_p (PATTERN (p))
1048 && ! all_adjacent)
1049 return 0;
1050 #endif
1052 /* If we get here, we have passed all the tests and the combination is
1053 to be allowed. */
1055 *pdest = dest;
1056 *psrc = src;
1058 return 1;
1061 /* LOC is the location within I3 that contains its pattern or the component
1062 of a PARALLEL of the pattern. We validate that it is valid for combining.
1064 One problem is if I3 modifies its output, as opposed to replacing it
1065 entirely, we can't allow the output to contain I2DEST or I1DEST as doing
1066 so would produce an insn that is not equivalent to the original insns.
1068 Consider:
1070 (set (reg:DI 101) (reg:DI 100))
1071 (set (subreg:SI (reg:DI 101) 0) <foo>)
1073 This is NOT equivalent to:
1075 (parallel [(set (subreg:SI (reg:DI 100) 0) <foo>)
1076 (set (reg:DI 101) (reg:DI 100))])
1078 Not only does this modify 100 (in which case it might still be valid
1079 if 100 were dead in I2), it sets 101 to the ORIGINAL value of 100.
1081 We can also run into a problem if I2 sets a register that I1
1082 uses and I1 gets directly substituted into I3 (not via I2). In that
1083 case, we would be getting the wrong value of I2DEST into I3, so we
1084 must reject the combination. This case occurs when I2 and I1 both
1085 feed into I3, rather than when I1 feeds into I2, which feeds into I3.
1086 If I1_NOT_IN_SRC is non-zero, it means that finding I1 in the source
1087 of a SET must prevent combination from occurring.
1089 On machines where SMALL_REGISTER_CLASSES is defined, we don't combine
1090 if the destination of a SET is a hard register that isn't a user
1091 variable.
1093 Before doing the above check, we first try to expand a field assignment
1094 into a set of logical operations.
1096 If PI3_DEST_KILLED is non-zero, it is a pointer to a location in which
1097 we place a register that is both set and used within I3. If more than one
1098 such register is detected, we fail.
1100 Return 1 if the combination is valid, zero otherwise. */
1102 static int
1103 combinable_i3pat (i3, loc, i2dest, i1dest, i1_not_in_src, pi3dest_killed)
1104 rtx i3;
1105 rtx *loc;
1106 rtx i2dest;
1107 rtx i1dest;
1108 int i1_not_in_src;
1109 rtx *pi3dest_killed;
1111 rtx x = *loc;
1113 if (GET_CODE (x) == SET)
1115 rtx set = expand_field_assignment (x);
1116 rtx dest = SET_DEST (set);
1117 rtx src = SET_SRC (set);
1118 rtx inner_dest = dest, inner_src = src;
1120 SUBST (*loc, set);
1122 while (GET_CODE (inner_dest) == STRICT_LOW_PART
1123 || GET_CODE (inner_dest) == SUBREG
1124 || GET_CODE (inner_dest) == ZERO_EXTRACT)
1125 inner_dest = XEXP (inner_dest, 0);
1127 /* We probably don't need this any more now that LIMIT_RELOAD_CLASS
1128 was added. */
1129 #if 0
1130 while (GET_CODE (inner_src) == STRICT_LOW_PART
1131 || GET_CODE (inner_src) == SUBREG
1132 || GET_CODE (inner_src) == ZERO_EXTRACT)
1133 inner_src = XEXP (inner_src, 0);
1135 /* If it is better that two different modes keep two different pseudos,
1136 avoid combining them. This avoids producing the following pattern
1137 on a 386:
1138 (set (subreg:SI (reg/v:QI 21) 0)
1139 (lshiftrt:SI (reg/v:SI 20)
1140 (const_int 24)))
1141 If that were made, reload could not handle the pair of
1142 reg 20/21, since it would try to get any GENERAL_REGS
1143 but some of them don't handle QImode. */
1145 if (rtx_equal_p (inner_src, i2dest)
1146 && GET_CODE (inner_dest) == REG
1147 && ! MODES_TIEABLE_P (GET_MODE (i2dest), GET_MODE (inner_dest)))
1148 return 0;
1149 #endif
1151 /* Check for the case where I3 modifies its output, as
1152 discussed above. */
1153 if ((inner_dest != dest
1154 && (reg_overlap_mentioned_p (i2dest, inner_dest)
1155 || (i1dest && reg_overlap_mentioned_p (i1dest, inner_dest))))
1156 /* This is the same test done in can_combine_p except that we
1157 allow a hard register with SMALL_REGISTER_CLASSES if SRC is a
1158 CALL operation.
1159 Moreover, we can't test all_adjacent; we don't have to, since
1160 this instruction will stay in place, thus we are not considering
1161 to increase the lifetime of INNER_DEST. */
1162 || (GET_CODE (inner_dest) == REG
1163 && REGNO (inner_dest) < FIRST_PSEUDO_REGISTER
1164 && (! HARD_REGNO_MODE_OK (REGNO (inner_dest),
1165 GET_MODE (inner_dest))
1166 #ifdef SMALL_REGISTER_CLASSES
1167 || (SMALL_REGISTER_CLASSES
1168 && GET_CODE (src) != CALL && ! REG_USERVAR_P (inner_dest)
1169 && FUNCTION_VALUE_REGNO_P (REGNO (inner_dest)))
1170 #endif
1172 || (i1_not_in_src && reg_overlap_mentioned_p (i1dest, src)))
1173 return 0;
1175 /* If DEST is used in I3, it is being killed in this insn,
1176 so record that for later.
1177 Never add REG_DEAD notes for the FRAME_POINTER_REGNUM or the
1178 STACK_POINTER_REGNUM, since these are always considered to be
1179 live. Similarly for ARG_POINTER_REGNUM if it is fixed. */
1180 if (pi3dest_killed && GET_CODE (dest) == REG
1181 && reg_referenced_p (dest, PATTERN (i3))
1182 && REGNO (dest) != FRAME_POINTER_REGNUM
1183 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
1184 && REGNO (dest) != HARD_FRAME_POINTER_REGNUM
1185 #endif
1186 #if ARG_POINTER_REGNUM != FRAME_POINTER_REGNUM
1187 && (REGNO (dest) != ARG_POINTER_REGNUM
1188 || ! fixed_regs [REGNO (dest)])
1189 #endif
1190 && REGNO (dest) != STACK_POINTER_REGNUM)
1192 if (*pi3dest_killed)
1193 return 0;
1195 *pi3dest_killed = dest;
1199 else if (GET_CODE (x) == PARALLEL)
1201 int i;
1203 for (i = 0; i < XVECLEN (x, 0); i++)
1204 if (! combinable_i3pat (i3, &XVECEXP (x, 0, i), i2dest, i1dest,
1205 i1_not_in_src, pi3dest_killed))
1206 return 0;
1209 return 1;
1212 /* Try to combine the insns I1 and I2 into I3.
1213 Here I1 and I2 appear earlier than I3.
1214 I1 can be zero; then we combine just I2 into I3.
1216 It we are combining three insns and the resulting insn is not recognized,
1217 try splitting it into two insns. If that happens, I2 and I3 are retained
1218 and I1 is pseudo-deleted by turning it into a NOTE. Otherwise, I1 and I2
1219 are pseudo-deleted.
1221 Return 0 if the combination does not work. Then nothing is changed.
1222 If we did the combination, return the insn at which combine should
1223 resume scanning. */
1225 static rtx
1226 try_combine (i3, i2, i1)
1227 register rtx i3, i2, i1;
1229 /* New patterns for I3 and I3, respectively. */
1230 rtx newpat, newi2pat = 0;
1231 /* Indicates need to preserve SET in I1 or I2 in I3 if it is not dead. */
1232 int added_sets_1, added_sets_2;
1233 /* Total number of SETs to put into I3. */
1234 int total_sets;
1235 /* Nonzero is I2's body now appears in I3. */
1236 int i2_is_used;
1237 /* INSN_CODEs for new I3, new I2, and user of condition code. */
1238 int insn_code_number, i2_code_number, other_code_number;
1239 /* Contains I3 if the destination of I3 is used in its source, which means
1240 that the old life of I3 is being killed. If that usage is placed into
1241 I2 and not in I3, a REG_DEAD note must be made. */
1242 rtx i3dest_killed = 0;
1243 /* SET_DEST and SET_SRC of I2 and I1. */
1244 rtx i2dest, i2src, i1dest = 0, i1src = 0;
1245 /* PATTERN (I2), or a copy of it in certain cases. */
1246 rtx i2pat;
1247 /* Indicates if I2DEST or I1DEST is in I2SRC or I1_SRC. */
1248 int i2dest_in_i2src = 0, i1dest_in_i1src = 0, i2dest_in_i1src = 0;
1249 int i1_feeds_i3 = 0;
1250 /* Notes that must be added to REG_NOTES in I3 and I2. */
1251 rtx new_i3_notes, new_i2_notes;
1252 /* Notes that we substituted I3 into I2 instead of the normal case. */
1253 int i3_subst_into_i2 = 0;
1254 /* Notes that I1, I2 or I3 is a MULT operation. */
1255 int have_mult = 0;
1256 /* Number of clobbers of SCRATCH we had to add. */
1257 int i3_scratches = 0, i2_scratches = 0, other_scratches = 0;
1259 int maxreg;
1260 rtx temp;
1261 register rtx link;
1262 int i;
1264 /* If any of I1, I2, and I3 isn't really an insn, we can't do anything.
1265 This can occur when flow deletes an insn that it has merged into an
1266 auto-increment address. We also can't do anything if I3 has a
1267 REG_LIBCALL note since we don't want to disrupt the contiguity of a
1268 libcall. */
1270 if (GET_RTX_CLASS (GET_CODE (i3)) != 'i'
1271 || GET_RTX_CLASS (GET_CODE (i2)) != 'i'
1272 || (i1 && GET_RTX_CLASS (GET_CODE (i1)) != 'i')
1273 || find_reg_note (i3, REG_LIBCALL, NULL_RTX))
1274 return 0;
1276 combine_attempts++;
1278 undobuf.undos = undobuf.previous_undos = 0;
1279 undobuf.other_insn = 0;
1281 /* Save the current high-water-mark so we can free storage if we didn't
1282 accept this combination. */
1283 undobuf.storage = (char *) oballoc (0);
1285 /* Reset the hard register usage information. */
1286 CLEAR_HARD_REG_SET (newpat_used_regs);
1288 /* If I1 and I2 both feed I3, they can be in any order. To simplify the
1289 code below, set I1 to be the earlier of the two insns. */
1290 if (i1 && INSN_CUID (i1) > INSN_CUID (i2))
1291 temp = i1, i1 = i2, i2 = temp;
1293 added_links_insn = 0;
1295 /* First check for one important special-case that the code below will
1296 not handle. Namely, the case where I1 is zero, I2 has multiple sets,
1297 and I3 is a SET whose SET_SRC is a SET_DEST in I2. In that case,
1298 we may be able to replace that destination with the destination of I3.
1299 This occurs in the common code where we compute both a quotient and
1300 remainder into a structure, in which case we want to do the computation
1301 directly into the structure to avoid register-register copies.
1303 We make very conservative checks below and only try to handle the
1304 most common cases of this. For example, we only handle the case
1305 where I2 and I3 are adjacent to avoid making difficult register
1306 usage tests. */
1308 if (i1 == 0 && GET_CODE (i3) == INSN && GET_CODE (PATTERN (i3)) == SET
1309 && GET_CODE (SET_SRC (PATTERN (i3))) == REG
1310 && REGNO (SET_SRC (PATTERN (i3))) >= FIRST_PSEUDO_REGISTER
1311 #ifdef SMALL_REGISTER_CLASSES
1312 && (! SMALL_REGISTER_CLASSES
1313 || GET_CODE (SET_DEST (PATTERN (i3))) != REG
1314 || REGNO (SET_DEST (PATTERN (i3))) >= FIRST_PSEUDO_REGISTER
1315 || REG_USERVAR_P (SET_DEST (PATTERN (i3))))
1316 #endif
1317 && find_reg_note (i3, REG_DEAD, SET_SRC (PATTERN (i3)))
1318 && GET_CODE (PATTERN (i2)) == PARALLEL
1319 && ! side_effects_p (SET_DEST (PATTERN (i3)))
1320 /* If the dest of I3 is a ZERO_EXTRACT or STRICT_LOW_PART, the code
1321 below would need to check what is inside (and reg_overlap_mentioned_p
1322 doesn't support those codes anyway). Don't allow those destinations;
1323 the resulting insn isn't likely to be recognized anyway. */
1324 && GET_CODE (SET_DEST (PATTERN (i3))) != ZERO_EXTRACT
1325 && GET_CODE (SET_DEST (PATTERN (i3))) != STRICT_LOW_PART
1326 && ! reg_overlap_mentioned_p (SET_SRC (PATTERN (i3)),
1327 SET_DEST (PATTERN (i3)))
1328 && next_real_insn (i2) == i3)
1330 rtx p2 = PATTERN (i2);
1332 /* Make sure that the destination of I3,
1333 which we are going to substitute into one output of I2,
1334 is not used within another output of I2. We must avoid making this:
1335 (parallel [(set (mem (reg 69)) ...)
1336 (set (reg 69) ...)])
1337 which is not well-defined as to order of actions.
1338 (Besides, reload can't handle output reloads for this.)
1340 The problem can also happen if the dest of I3 is a memory ref,
1341 if another dest in I2 is an indirect memory ref. */
1342 for (i = 0; i < XVECLEN (p2, 0); i++)
1343 if ((GET_CODE (XVECEXP (p2, 0, i)) == SET
1344 || GET_CODE (XVECEXP (p2, 0, i)) == CLOBBER)
1345 && reg_overlap_mentioned_p (SET_DEST (PATTERN (i3)),
1346 SET_DEST (XVECEXP (p2, 0, i))))
1347 break;
1349 if (i == XVECLEN (p2, 0))
1350 for (i = 0; i < XVECLEN (p2, 0); i++)
1351 if (SET_DEST (XVECEXP (p2, 0, i)) == SET_SRC (PATTERN (i3)))
1353 combine_merges++;
1355 subst_insn = i3;
1356 subst_low_cuid = INSN_CUID (i2);
1358 added_sets_2 = added_sets_1 = 0;
1359 i2dest = SET_SRC (PATTERN (i3));
1361 /* Replace the dest in I2 with our dest and make the resulting
1362 insn the new pattern for I3. Then skip to where we
1363 validate the pattern. Everything was set up above. */
1364 SUBST (SET_DEST (XVECEXP (p2, 0, i)),
1365 SET_DEST (PATTERN (i3)));
1367 newpat = p2;
1368 i3_subst_into_i2 = 1;
1369 goto validate_replacement;
1373 #ifndef HAVE_cc0
1374 /* If we have no I1 and I2 looks like:
1375 (parallel [(set (reg:CC X) (compare:CC OP (const_int 0)))
1376 (set Y OP)])
1377 make up a dummy I1 that is
1378 (set Y OP)
1379 and change I2 to be
1380 (set (reg:CC X) (compare:CC Y (const_int 0)))
1382 (We can ignore any trailing CLOBBERs.)
1384 This undoes a previous combination and allows us to match a branch-and-
1385 decrement insn. */
1387 if (i1 == 0 && GET_CODE (PATTERN (i2)) == PARALLEL
1388 && XVECLEN (PATTERN (i2), 0) >= 2
1389 && GET_CODE (XVECEXP (PATTERN (i2), 0, 0)) == SET
1390 && (GET_MODE_CLASS (GET_MODE (SET_DEST (XVECEXP (PATTERN (i2), 0, 0))))
1391 == MODE_CC)
1392 && GET_CODE (SET_SRC (XVECEXP (PATTERN (i2), 0, 0))) == COMPARE
1393 && XEXP (SET_SRC (XVECEXP (PATTERN (i2), 0, 0)), 1) == const0_rtx
1394 && GET_CODE (XVECEXP (PATTERN (i2), 0, 1)) == SET
1395 && GET_CODE (SET_DEST (XVECEXP (PATTERN (i2), 0, 1))) == REG
1396 && rtx_equal_p (XEXP (SET_SRC (XVECEXP (PATTERN (i2), 0, 0)), 0),
1397 SET_SRC (XVECEXP (PATTERN (i2), 0, 1))))
1399 for (i = XVECLEN (PATTERN (i2), 0) - 1; i >= 2; i--)
1400 if (GET_CODE (XVECEXP (PATTERN (i2), 0, i)) != CLOBBER)
1401 break;
1403 if (i == 1)
1405 /* We make I1 with the same INSN_UID as I2. This gives it
1406 the same INSN_CUID for value tracking. Our fake I1 will
1407 never appear in the insn stream so giving it the same INSN_UID
1408 as I2 will not cause a problem. */
1410 subst_prev_insn = i1
1411 = gen_rtx (INSN, VOIDmode, INSN_UID (i2), NULL_RTX, i2,
1412 XVECEXP (PATTERN (i2), 0, 1), -1, NULL_RTX, NULL_RTX);
1414 SUBST (PATTERN (i2), XVECEXP (PATTERN (i2), 0, 0));
1415 SUBST (XEXP (SET_SRC (PATTERN (i2)), 0),
1416 SET_DEST (PATTERN (i1)));
1419 #endif
1421 /* Verify that I2 and I1 are valid for combining. */
1422 if (! can_combine_p (i2, i3, i1, NULL_RTX, &i2dest, &i2src)
1423 || (i1 && ! can_combine_p (i1, i3, NULL_RTX, i2, &i1dest, &i1src)))
1425 undo_all ();
1426 return 0;
1429 /* Record whether I2DEST is used in I2SRC and similarly for the other
1430 cases. Knowing this will help in register status updating below. */
1431 i2dest_in_i2src = reg_overlap_mentioned_p (i2dest, i2src);
1432 i1dest_in_i1src = i1 && reg_overlap_mentioned_p (i1dest, i1src);
1433 i2dest_in_i1src = i1 && reg_overlap_mentioned_p (i2dest, i1src);
1435 /* See if I1 directly feeds into I3. It does if I1DEST is not used
1436 in I2SRC. */
1437 i1_feeds_i3 = i1 && ! reg_overlap_mentioned_p (i1dest, i2src);
1439 /* Ensure that I3's pattern can be the destination of combines. */
1440 if (! combinable_i3pat (i3, &PATTERN (i3), i2dest, i1dest,
1441 i1 && i2dest_in_i1src && i1_feeds_i3,
1442 &i3dest_killed))
1444 undo_all ();
1445 return 0;
1448 /* See if any of the insns is a MULT operation. Unless one is, we will
1449 reject a combination that is, since it must be slower. Be conservative
1450 here. */
1451 if (GET_CODE (i2src) == MULT
1452 || (i1 != 0 && GET_CODE (i1src) == MULT)
1453 || (GET_CODE (PATTERN (i3)) == SET
1454 && GET_CODE (SET_SRC (PATTERN (i3))) == MULT))
1455 have_mult = 1;
1457 /* If I3 has an inc, then give up if I1 or I2 uses the reg that is inc'd.
1458 We used to do this EXCEPT in one case: I3 has a post-inc in an
1459 output operand. However, that exception can give rise to insns like
1460 mov r3,(r3)+
1461 which is a famous insn on the PDP-11 where the value of r3 used as the
1462 source was model-dependent. Avoid this sort of thing. */
1464 #if 0
1465 if (!(GET_CODE (PATTERN (i3)) == SET
1466 && GET_CODE (SET_SRC (PATTERN (i3))) == REG
1467 && GET_CODE (SET_DEST (PATTERN (i3))) == MEM
1468 && (GET_CODE (XEXP (SET_DEST (PATTERN (i3)), 0)) == POST_INC
1469 || GET_CODE (XEXP (SET_DEST (PATTERN (i3)), 0)) == POST_DEC)))
1470 /* It's not the exception. */
1471 #endif
1472 #ifdef AUTO_INC_DEC
1473 for (link = REG_NOTES (i3); link; link = XEXP (link, 1))
1474 if (REG_NOTE_KIND (link) == REG_INC
1475 && (reg_overlap_mentioned_p (XEXP (link, 0), PATTERN (i2))
1476 || (i1 != 0
1477 && reg_overlap_mentioned_p (XEXP (link, 0), PATTERN (i1)))))
1479 undo_all ();
1480 return 0;
1482 #endif
1484 /* See if the SETs in I1 or I2 need to be kept around in the merged
1485 instruction: whenever the value set there is still needed past I3.
1486 For the SETs in I2, this is easy: we see if I2DEST dies or is set in I3.
1488 For the SET in I1, we have two cases: If I1 and I2 independently
1489 feed into I3, the set in I1 needs to be kept around if I1DEST dies
1490 or is set in I3. Otherwise (if I1 feeds I2 which feeds I3), the set
1491 in I1 needs to be kept around unless I1DEST dies or is set in either
1492 I2 or I3. We can distinguish these cases by seeing if I2SRC mentions
1493 I1DEST. If so, we know I1 feeds into I2. */
1495 added_sets_2 = ! dead_or_set_p (i3, i2dest);
1497 added_sets_1
1498 = i1 && ! (i1_feeds_i3 ? dead_or_set_p (i3, i1dest)
1499 : (dead_or_set_p (i3, i1dest) || dead_or_set_p (i2, i1dest)));
1501 /* If the set in I2 needs to be kept around, we must make a copy of
1502 PATTERN (I2), so that when we substitute I1SRC for I1DEST in
1503 PATTERN (I2), we are only substituting for the original I1DEST, not into
1504 an already-substituted copy. This also prevents making self-referential
1505 rtx. If I2 is a PARALLEL, we just need the piece that assigns I2SRC to
1506 I2DEST. */
1508 i2pat = (GET_CODE (PATTERN (i2)) == PARALLEL
1509 ? gen_rtx (SET, VOIDmode, i2dest, i2src)
1510 : PATTERN (i2));
1512 if (added_sets_2)
1513 i2pat = copy_rtx (i2pat);
1515 combine_merges++;
1517 /* Substitute in the latest insn for the regs set by the earlier ones. */
1519 maxreg = max_reg_num ();
1521 subst_insn = i3;
1523 /* It is possible that the source of I2 or I1 may be performing an
1524 unneeded operation, such as a ZERO_EXTEND of something that is known
1525 to have the high part zero. Handle that case by letting subst look at
1526 the innermost one of them.
1528 Another way to do this would be to have a function that tries to
1529 simplify a single insn instead of merging two or more insns. We don't
1530 do this because of the potential of infinite loops and because
1531 of the potential extra memory required. However, doing it the way
1532 we are is a bit of a kludge and doesn't catch all cases.
1534 But only do this if -fexpensive-optimizations since it slows things down
1535 and doesn't usually win. */
1537 if (flag_expensive_optimizations)
1539 /* Pass pc_rtx so no substitutions are done, just simplifications.
1540 The cases that we are interested in here do not involve the few
1541 cases were is_replaced is checked. */
1542 if (i1)
1544 subst_low_cuid = INSN_CUID (i1);
1545 i1src = subst (i1src, pc_rtx, pc_rtx, 0, 0);
1547 else
1549 subst_low_cuid = INSN_CUID (i2);
1550 i2src = subst (i2src, pc_rtx, pc_rtx, 0, 0);
1553 undobuf.previous_undos = undobuf.undos;
1556 #ifndef HAVE_cc0
1557 /* Many machines that don't use CC0 have insns that can both perform an
1558 arithmetic operation and set the condition code. These operations will
1559 be represented as a PARALLEL with the first element of the vector
1560 being a COMPARE of an arithmetic operation with the constant zero.
1561 The second element of the vector will set some pseudo to the result
1562 of the same arithmetic operation. If we simplify the COMPARE, we won't
1563 match such a pattern and so will generate an extra insn. Here we test
1564 for this case, where both the comparison and the operation result are
1565 needed, and make the PARALLEL by just replacing I2DEST in I3SRC with
1566 I2SRC. Later we will make the PARALLEL that contains I2. */
1568 if (i1 == 0 && added_sets_2 && GET_CODE (PATTERN (i3)) == SET
1569 && GET_CODE (SET_SRC (PATTERN (i3))) == COMPARE
1570 && XEXP (SET_SRC (PATTERN (i3)), 1) == const0_rtx
1571 && rtx_equal_p (XEXP (SET_SRC (PATTERN (i3)), 0), i2dest))
1573 rtx *cc_use;
1574 enum machine_mode compare_mode;
1576 newpat = PATTERN (i3);
1577 SUBST (XEXP (SET_SRC (newpat), 0), i2src);
1579 i2_is_used = 1;
1581 #ifdef EXTRA_CC_MODES
1582 /* See if a COMPARE with the operand we substituted in should be done
1583 with the mode that is currently being used. If not, do the same
1584 processing we do in `subst' for a SET; namely, if the destination
1585 is used only once, try to replace it with a register of the proper
1586 mode and also replace the COMPARE. */
1587 if (undobuf.other_insn == 0
1588 && (cc_use = find_single_use (SET_DEST (newpat), i3,
1589 &undobuf.other_insn))
1590 && ((compare_mode = SELECT_CC_MODE (GET_CODE (*cc_use),
1591 i2src, const0_rtx))
1592 != GET_MODE (SET_DEST (newpat))))
1594 int regno = REGNO (SET_DEST (newpat));
1595 rtx new_dest = gen_rtx (REG, compare_mode, regno);
1597 if (regno < FIRST_PSEUDO_REGISTER
1598 || (REG_N_SETS (regno) == 1 && ! added_sets_2
1599 && ! REG_USERVAR_P (SET_DEST (newpat))))
1601 if (regno >= FIRST_PSEUDO_REGISTER)
1602 SUBST (regno_reg_rtx[regno], new_dest);
1604 SUBST (SET_DEST (newpat), new_dest);
1605 SUBST (XEXP (*cc_use, 0), new_dest);
1606 SUBST (SET_SRC (newpat),
1607 gen_rtx_combine (COMPARE, compare_mode,
1608 i2src, const0_rtx));
1610 else
1611 undobuf.other_insn = 0;
1613 #endif
1615 else
1616 #endif
1618 n_occurrences = 0; /* `subst' counts here */
1620 /* If I1 feeds into I2 (not into I3) and I1DEST is in I1SRC, we
1621 need to make a unique copy of I2SRC each time we substitute it
1622 to avoid self-referential rtl. */
1624 subst_low_cuid = INSN_CUID (i2);
1625 newpat = subst (PATTERN (i3), i2dest, i2src, 0,
1626 ! i1_feeds_i3 && i1dest_in_i1src);
1627 undobuf.previous_undos = undobuf.undos;
1629 /* Record whether i2's body now appears within i3's body. */
1630 i2_is_used = n_occurrences;
1633 /* If we already got a failure, don't try to do more. Otherwise,
1634 try to substitute in I1 if we have it. */
1636 if (i1 && GET_CODE (newpat) != CLOBBER)
1638 /* Before we can do this substitution, we must redo the test done
1639 above (see detailed comments there) that ensures that I1DEST
1640 isn't mentioned in any SETs in NEWPAT that are field assignments. */
1642 if (! combinable_i3pat (NULL_RTX, &newpat, i1dest, NULL_RTX,
1643 0, NULL_PTR))
1645 undo_all ();
1646 return 0;
1649 n_occurrences = 0;
1650 subst_low_cuid = INSN_CUID (i1);
1651 newpat = subst (newpat, i1dest, i1src, 0, 0);
1652 undobuf.previous_undos = undobuf.undos;
1655 /* Fail if an autoincrement side-effect has been duplicated. Be careful
1656 to count all the ways that I2SRC and I1SRC can be used. */
1657 if ((FIND_REG_INC_NOTE (i2, NULL_RTX) != 0
1658 && i2_is_used + added_sets_2 > 1)
1659 || (i1 != 0 && FIND_REG_INC_NOTE (i1, NULL_RTX) != 0
1660 && (n_occurrences + added_sets_1 + (added_sets_2 && ! i1_feeds_i3)
1661 > 1))
1662 /* Fail if we tried to make a new register (we used to abort, but there's
1663 really no reason to). */
1664 || max_reg_num () != maxreg
1665 /* Fail if we couldn't do something and have a CLOBBER. */
1666 || GET_CODE (newpat) == CLOBBER
1667 /* Fail if this new pattern is a MULT and we didn't have one before
1668 at the outer level. */
1669 || (GET_CODE (newpat) == SET && GET_CODE (SET_SRC (newpat)) == MULT
1670 && ! have_mult))
1672 undo_all ();
1673 return 0;
1676 /* If the actions of the earlier insns must be kept
1677 in addition to substituting them into the latest one,
1678 we must make a new PARALLEL for the latest insn
1679 to hold additional the SETs. */
1681 if (added_sets_1 || added_sets_2)
1683 combine_extras++;
1685 if (GET_CODE (newpat) == PARALLEL)
1687 rtvec old = XVEC (newpat, 0);
1688 total_sets = XVECLEN (newpat, 0) + added_sets_1 + added_sets_2;
1689 newpat = gen_rtx (PARALLEL, VOIDmode, rtvec_alloc (total_sets));
1690 bcopy ((char *) &old->elem[0], (char *) XVEC (newpat, 0)->elem,
1691 sizeof (old->elem[0]) * old->num_elem);
1693 else
1695 rtx old = newpat;
1696 total_sets = 1 + added_sets_1 + added_sets_2;
1697 newpat = gen_rtx (PARALLEL, VOIDmode, rtvec_alloc (total_sets));
1698 XVECEXP (newpat, 0, 0) = old;
1701 if (added_sets_1)
1702 XVECEXP (newpat, 0, --total_sets)
1703 = (GET_CODE (PATTERN (i1)) == PARALLEL
1704 ? gen_rtx (SET, VOIDmode, i1dest, i1src) : PATTERN (i1));
1706 if (added_sets_2)
1708 /* If there is no I1, use I2's body as is. We used to also not do
1709 the subst call below if I2 was substituted into I3,
1710 but that could lose a simplification. */
1711 if (i1 == 0)
1712 XVECEXP (newpat, 0, --total_sets) = i2pat;
1713 else
1714 /* See comment where i2pat is assigned. */
1715 XVECEXP (newpat, 0, --total_sets)
1716 = subst (i2pat, i1dest, i1src, 0, 0);
1720 /* We come here when we are replacing a destination in I2 with the
1721 destination of I3. */
1722 validate_replacement:
1724 /* Note which hard regs this insn has as inputs. */
1725 mark_used_regs_combine (newpat);
1727 /* Is the result of combination a valid instruction? */
1728 insn_code_number
1729 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
1731 /* If the result isn't valid, see if it is a PARALLEL of two SETs where
1732 the second SET's destination is a register that is unused. In that case,
1733 we just need the first SET. This can occur when simplifying a divmod
1734 insn. We *must* test for this case here because the code below that
1735 splits two independent SETs doesn't handle this case correctly when it
1736 updates the register status. Also check the case where the first
1737 SET's destination is unused. That would not cause incorrect code, but
1738 does cause an unneeded insn to remain. */
1740 if (insn_code_number < 0 && GET_CODE (newpat) == PARALLEL
1741 && XVECLEN (newpat, 0) == 2
1742 && GET_CODE (XVECEXP (newpat, 0, 0)) == SET
1743 && GET_CODE (XVECEXP (newpat, 0, 1)) == SET
1744 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) == REG
1745 && find_reg_note (i3, REG_UNUSED, SET_DEST (XVECEXP (newpat, 0, 1)))
1746 && ! side_effects_p (SET_SRC (XVECEXP (newpat, 0, 1)))
1747 && asm_noperands (newpat) < 0)
1749 newpat = XVECEXP (newpat, 0, 0);
1750 insn_code_number
1751 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
1754 else if (insn_code_number < 0 && GET_CODE (newpat) == PARALLEL
1755 && XVECLEN (newpat, 0) == 2
1756 && GET_CODE (XVECEXP (newpat, 0, 0)) == SET
1757 && GET_CODE (XVECEXP (newpat, 0, 1)) == SET
1758 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 0))) == REG
1759 && find_reg_note (i3, REG_UNUSED, SET_DEST (XVECEXP (newpat, 0, 0)))
1760 && ! side_effects_p (SET_SRC (XVECEXP (newpat, 0, 0)))
1761 && asm_noperands (newpat) < 0)
1763 newpat = XVECEXP (newpat, 0, 1);
1764 insn_code_number
1765 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
1768 /* If we were combining three insns and the result is a simple SET
1769 with no ASM_OPERANDS that wasn't recognized, try to split it into two
1770 insns. There are two ways to do this. It can be split using a
1771 machine-specific method (like when you have an addition of a large
1772 constant) or by combine in the function find_split_point. */
1774 if (i1 && insn_code_number < 0 && GET_CODE (newpat) == SET
1775 && asm_noperands (newpat) < 0)
1777 rtx m_split, *split;
1778 rtx ni2dest = i2dest;
1780 /* See if the MD file can split NEWPAT. If it can't, see if letting it
1781 use I2DEST as a scratch register will help. In the latter case,
1782 convert I2DEST to the mode of the source of NEWPAT if we can. */
1784 m_split = split_insns (newpat, i3);
1786 /* We can only use I2DEST as a scratch reg if it doesn't overlap any
1787 inputs of NEWPAT. */
1789 /* ??? If I2DEST is not safe, and I1DEST exists, then it would be
1790 possible to try that as a scratch reg. This would require adding
1791 more code to make it work though. */
1793 if (m_split == 0 && ! reg_overlap_mentioned_p (ni2dest, newpat))
1795 /* If I2DEST is a hard register or the only use of a pseudo,
1796 we can change its mode. */
1797 if (GET_MODE (SET_DEST (newpat)) != GET_MODE (i2dest)
1798 && GET_MODE (SET_DEST (newpat)) != VOIDmode
1799 && GET_CODE (i2dest) == REG
1800 && (REGNO (i2dest) < FIRST_PSEUDO_REGISTER
1801 || (REG_N_SETS (REGNO (i2dest)) == 1 && ! added_sets_2
1802 && ! REG_USERVAR_P (i2dest))))
1803 ni2dest = gen_rtx (REG, GET_MODE (SET_DEST (newpat)),
1804 REGNO (i2dest));
1806 m_split = split_insns (gen_rtx (PARALLEL, VOIDmode,
1807 gen_rtvec (2, newpat,
1808 gen_rtx (CLOBBER,
1809 VOIDmode,
1810 ni2dest))),
1811 i3);
1814 if (m_split && GET_CODE (m_split) == SEQUENCE
1815 && XVECLEN (m_split, 0) == 2
1816 && (next_real_insn (i2) == i3
1817 || ! use_crosses_set_p (PATTERN (XVECEXP (m_split, 0, 0)),
1818 INSN_CUID (i2))))
1820 rtx i2set, i3set;
1821 rtx newi3pat = PATTERN (XVECEXP (m_split, 0, 1));
1822 newi2pat = PATTERN (XVECEXP (m_split, 0, 0));
1824 i3set = single_set (XVECEXP (m_split, 0, 1));
1825 i2set = single_set (XVECEXP (m_split, 0, 0));
1827 /* In case we changed the mode of I2DEST, replace it in the
1828 pseudo-register table here. We can't do it above in case this
1829 code doesn't get executed and we do a split the other way. */
1831 if (REGNO (i2dest) >= FIRST_PSEUDO_REGISTER)
1832 SUBST (regno_reg_rtx[REGNO (i2dest)], ni2dest);
1834 i2_code_number = recog_for_combine (&newi2pat, i2, &new_i2_notes,
1835 &i2_scratches);
1837 /* If I2 or I3 has multiple SETs, we won't know how to track
1838 register status, so don't use these insns. If I2's destination
1839 is used between I2 and I3, we also can't use these insns. */
1841 if (i2_code_number >= 0 && i2set && i3set
1842 && (next_real_insn (i2) == i3
1843 || ! reg_used_between_p (SET_DEST (i2set), i2, i3)))
1844 insn_code_number = recog_for_combine (&newi3pat, i3, &new_i3_notes,
1845 &i3_scratches);
1846 if (insn_code_number >= 0)
1847 newpat = newi3pat;
1849 /* It is possible that both insns now set the destination of I3.
1850 If so, we must show an extra use of it. */
1852 if (insn_code_number >= 0)
1854 rtx new_i3_dest = SET_DEST (i3set);
1855 rtx new_i2_dest = SET_DEST (i2set);
1857 while (GET_CODE (new_i3_dest) == ZERO_EXTRACT
1858 || GET_CODE (new_i3_dest) == STRICT_LOW_PART
1859 || GET_CODE (new_i3_dest) == SUBREG)
1860 new_i3_dest = XEXP (new_i3_dest, 0);
1862 while (GET_CODE (new_i2_dest) == ZERO_EXTRACT
1863 || GET_CODE (new_i2_dest) == STRICT_LOW_PART
1864 || GET_CODE (new_i2_dest) == SUBREG)
1865 new_i2_dest = XEXP (new_i2_dest, 0);
1867 if (GET_CODE (new_i3_dest) == REG
1868 && GET_CODE (new_i2_dest) == REG
1869 && REGNO (new_i3_dest) == REGNO (new_i2_dest))
1870 REG_N_SETS (REGNO (new_i2_dest))++;
1874 /* If we can split it and use I2DEST, go ahead and see if that
1875 helps things be recognized. Verify that none of the registers
1876 are set between I2 and I3. */
1877 if (insn_code_number < 0 && (split = find_split_point (&newpat, i3)) != 0
1878 #ifdef HAVE_cc0
1879 && GET_CODE (i2dest) == REG
1880 #endif
1881 /* We need I2DEST in the proper mode. If it is a hard register
1882 or the only use of a pseudo, we can change its mode. */
1883 && (GET_MODE (*split) == GET_MODE (i2dest)
1884 || GET_MODE (*split) == VOIDmode
1885 || REGNO (i2dest) < FIRST_PSEUDO_REGISTER
1886 || (REG_N_SETS (REGNO (i2dest)) == 1 && ! added_sets_2
1887 && ! REG_USERVAR_P (i2dest)))
1888 && (next_real_insn (i2) == i3
1889 || ! use_crosses_set_p (*split, INSN_CUID (i2)))
1890 /* We can't overwrite I2DEST if its value is still used by
1891 NEWPAT. */
1892 && ! reg_referenced_p (i2dest, newpat))
1894 rtx newdest = i2dest;
1895 enum rtx_code split_code = GET_CODE (*split);
1896 enum machine_mode split_mode = GET_MODE (*split);
1898 /* Get NEWDEST as a register in the proper mode. We have already
1899 validated that we can do this. */
1900 if (GET_MODE (i2dest) != split_mode && split_mode != VOIDmode)
1902 newdest = gen_rtx (REG, split_mode, REGNO (i2dest));
1904 if (REGNO (i2dest) >= FIRST_PSEUDO_REGISTER)
1905 SUBST (regno_reg_rtx[REGNO (i2dest)], newdest);
1908 /* If *SPLIT is a (mult FOO (const_int pow2)), convert it to
1909 an ASHIFT. This can occur if it was inside a PLUS and hence
1910 appeared to be a memory address. This is a kludge. */
1911 if (split_code == MULT
1912 && GET_CODE (XEXP (*split, 1)) == CONST_INT
1913 && (i = exact_log2 (INTVAL (XEXP (*split, 1)))) >= 0)
1915 SUBST (*split, gen_rtx_combine (ASHIFT, split_mode,
1916 XEXP (*split, 0), GEN_INT (i)));
1917 /* Update split_code because we may not have a multiply
1918 anymore. */
1919 split_code = GET_CODE (*split);
1922 #ifdef INSN_SCHEDULING
1923 /* If *SPLIT is a paradoxical SUBREG, when we split it, it should
1924 be written as a ZERO_EXTEND. */
1925 if (split_code == SUBREG && GET_CODE (SUBREG_REG (*split)) == MEM)
1926 SUBST (*split, gen_rtx_combine (ZERO_EXTEND, split_mode,
1927 XEXP (*split, 0)));
1928 #endif
1930 newi2pat = gen_rtx_combine (SET, VOIDmode, newdest, *split);
1931 SUBST (*split, newdest);
1932 i2_code_number
1933 = recog_for_combine (&newi2pat, i2, &new_i2_notes, &i2_scratches);
1935 /* If the split point was a MULT and we didn't have one before,
1936 don't use one now. */
1937 if (i2_code_number >= 0 && ! (split_code == MULT && ! have_mult))
1938 insn_code_number
1939 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
1943 /* Check for a case where we loaded from memory in a narrow mode and
1944 then sign extended it, but we need both registers. In that case,
1945 we have a PARALLEL with both loads from the same memory location.
1946 We can split this into a load from memory followed by a register-register
1947 copy. This saves at least one insn, more if register allocation can
1948 eliminate the copy.
1950 We cannot do this if the destination of the second assignment is
1951 a register that we have already assumed is zero-extended. Similarly
1952 for a SUBREG of such a register. */
1954 else if (i1 && insn_code_number < 0 && asm_noperands (newpat) < 0
1955 && GET_CODE (newpat) == PARALLEL
1956 && XVECLEN (newpat, 0) == 2
1957 && GET_CODE (XVECEXP (newpat, 0, 0)) == SET
1958 && GET_CODE (SET_SRC (XVECEXP (newpat, 0, 0))) == SIGN_EXTEND
1959 && GET_CODE (XVECEXP (newpat, 0, 1)) == SET
1960 && rtx_equal_p (SET_SRC (XVECEXP (newpat, 0, 1)),
1961 XEXP (SET_SRC (XVECEXP (newpat, 0, 0)), 0))
1962 && ! use_crosses_set_p (SET_SRC (XVECEXP (newpat, 0, 1)),
1963 INSN_CUID (i2))
1964 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) != ZERO_EXTRACT
1965 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) != STRICT_LOW_PART
1966 && ! (temp = SET_DEST (XVECEXP (newpat, 0, 1)),
1967 (GET_CODE (temp) == REG
1968 && reg_nonzero_bits[REGNO (temp)] != 0
1969 && GET_MODE_BITSIZE (GET_MODE (temp)) < BITS_PER_WORD
1970 && GET_MODE_BITSIZE (GET_MODE (temp)) < HOST_BITS_PER_INT
1971 && (reg_nonzero_bits[REGNO (temp)]
1972 != GET_MODE_MASK (word_mode))))
1973 && ! (GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) == SUBREG
1974 && (temp = SUBREG_REG (SET_DEST (XVECEXP (newpat, 0, 1))),
1975 (GET_CODE (temp) == REG
1976 && reg_nonzero_bits[REGNO (temp)] != 0
1977 && GET_MODE_BITSIZE (GET_MODE (temp)) < BITS_PER_WORD
1978 && GET_MODE_BITSIZE (GET_MODE (temp)) < HOST_BITS_PER_INT
1979 && (reg_nonzero_bits[REGNO (temp)]
1980 != GET_MODE_MASK (word_mode)))))
1981 && ! reg_overlap_mentioned_p (SET_DEST (XVECEXP (newpat, 0, 1)),
1982 SET_SRC (XVECEXP (newpat, 0, 1)))
1983 && ! find_reg_note (i3, REG_UNUSED,
1984 SET_DEST (XVECEXP (newpat, 0, 0))))
1986 rtx ni2dest;
1988 newi2pat = XVECEXP (newpat, 0, 0);
1989 ni2dest = SET_DEST (XVECEXP (newpat, 0, 0));
1990 newpat = XVECEXP (newpat, 0, 1);
1991 SUBST (SET_SRC (newpat),
1992 gen_lowpart_for_combine (GET_MODE (SET_SRC (newpat)), ni2dest));
1993 i2_code_number
1994 = recog_for_combine (&newi2pat, i2, &new_i2_notes, &i2_scratches);
1996 if (i2_code_number >= 0)
1997 insn_code_number
1998 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
2000 if (insn_code_number >= 0)
2002 rtx insn;
2003 rtx link;
2005 /* If we will be able to accept this, we have made a change to the
2006 destination of I3. This can invalidate a LOG_LINKS pointing
2007 to I3. No other part of combine.c makes such a transformation.
2009 The new I3 will have a destination that was previously the
2010 destination of I1 or I2 and which was used in i2 or I3. Call
2011 distribute_links to make a LOG_LINK from the next use of
2012 that destination. */
2014 PATTERN (i3) = newpat;
2015 distribute_links (gen_rtx (INSN_LIST, VOIDmode, i3, NULL_RTX));
2017 /* I3 now uses what used to be its destination and which is
2018 now I2's destination. That means we need a LOG_LINK from
2019 I3 to I2. But we used to have one, so we still will.
2021 However, some later insn might be using I2's dest and have
2022 a LOG_LINK pointing at I3. We must remove this link.
2023 The simplest way to remove the link is to point it at I1,
2024 which we know will be a NOTE. */
2026 for (insn = NEXT_INSN (i3);
2027 insn && (this_basic_block == n_basic_blocks - 1
2028 || insn != basic_block_head[this_basic_block + 1]);
2029 insn = NEXT_INSN (insn))
2031 if (GET_RTX_CLASS (GET_CODE (insn)) == 'i'
2032 && reg_referenced_p (ni2dest, PATTERN (insn)))
2034 for (link = LOG_LINKS (insn); link;
2035 link = XEXP (link, 1))
2036 if (XEXP (link, 0) == i3)
2037 XEXP (link, 0) = i1;
2039 break;
2045 /* Similarly, check for a case where we have a PARALLEL of two independent
2046 SETs but we started with three insns. In this case, we can do the sets
2047 as two separate insns. This case occurs when some SET allows two
2048 other insns to combine, but the destination of that SET is still live. */
2050 else if (i1 && insn_code_number < 0 && asm_noperands (newpat) < 0
2051 && GET_CODE (newpat) == PARALLEL
2052 && XVECLEN (newpat, 0) == 2
2053 && GET_CODE (XVECEXP (newpat, 0, 0)) == SET
2054 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 0))) != ZERO_EXTRACT
2055 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 0))) != STRICT_LOW_PART
2056 && GET_CODE (XVECEXP (newpat, 0, 1)) == SET
2057 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) != ZERO_EXTRACT
2058 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) != STRICT_LOW_PART
2059 && ! use_crosses_set_p (SET_SRC (XVECEXP (newpat, 0, 1)),
2060 INSN_CUID (i2))
2061 /* Don't pass sets with (USE (MEM ...)) dests to the following. */
2062 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 1))) != USE
2063 && GET_CODE (SET_DEST (XVECEXP (newpat, 0, 0))) != USE
2064 && ! reg_referenced_p (SET_DEST (XVECEXP (newpat, 0, 1)),
2065 XVECEXP (newpat, 0, 0))
2066 && ! reg_referenced_p (SET_DEST (XVECEXP (newpat, 0, 0)),
2067 XVECEXP (newpat, 0, 1)))
2069 newi2pat = XVECEXP (newpat, 0, 1);
2070 newpat = XVECEXP (newpat, 0, 0);
2072 i2_code_number
2073 = recog_for_combine (&newi2pat, i2, &new_i2_notes, &i2_scratches);
2075 if (i2_code_number >= 0)
2076 insn_code_number
2077 = recog_for_combine (&newpat, i3, &new_i3_notes, &i3_scratches);
2080 /* If it still isn't recognized, fail and change things back the way they
2081 were. */
2082 if ((insn_code_number < 0
2083 /* Is the result a reasonable ASM_OPERANDS? */
2084 && (! check_asm_operands (newpat) || added_sets_1 || added_sets_2)))
2086 undo_all ();
2087 return 0;
2090 /* If we had to change another insn, make sure it is valid also. */
2091 if (undobuf.other_insn)
2093 rtx other_pat = PATTERN (undobuf.other_insn);
2094 rtx new_other_notes;
2095 rtx note, next;
2097 CLEAR_HARD_REG_SET (newpat_used_regs);
2099 other_code_number
2100 = recog_for_combine (&other_pat, undobuf.other_insn,
2101 &new_other_notes, &other_scratches);
2103 if (other_code_number < 0 && ! check_asm_operands (other_pat))
2105 undo_all ();
2106 return 0;
2109 PATTERN (undobuf.other_insn) = other_pat;
2111 /* If any of the notes in OTHER_INSN were REG_UNUSED, ensure that they
2112 are still valid. Then add any non-duplicate notes added by
2113 recog_for_combine. */
2114 for (note = REG_NOTES (undobuf.other_insn); note; note = next)
2116 next = XEXP (note, 1);
2118 if (REG_NOTE_KIND (note) == REG_UNUSED
2119 && ! reg_set_p (XEXP (note, 0), PATTERN (undobuf.other_insn)))
2121 if (GET_CODE (XEXP (note, 0)) == REG)
2122 REG_N_DEATHS (REGNO (XEXP (note, 0)))--;
2124 remove_note (undobuf.other_insn, note);
2128 for (note = new_other_notes; note; note = XEXP (note, 1))
2129 if (GET_CODE (XEXP (note, 0)) == REG)
2130 REG_N_DEATHS (REGNO (XEXP (note, 0)))++;
2132 distribute_notes (new_other_notes, undobuf.other_insn,
2133 undobuf.other_insn, NULL_RTX, NULL_RTX, NULL_RTX);
2136 /* We now know that we can do this combination. Merge the insns and
2137 update the status of registers and LOG_LINKS. */
2140 rtx i3notes, i2notes, i1notes = 0;
2141 rtx i3links, i2links, i1links = 0;
2142 rtx midnotes = 0;
2143 register int regno;
2144 /* Compute which registers we expect to eliminate. newi2pat may be setting
2145 either i3dest or i2dest, so we must check it. */
2146 rtx elim_i2 = ((newi2pat && reg_set_p (i2dest, newi2pat))
2147 || i2dest_in_i2src || i2dest_in_i1src
2148 ? 0 : i2dest);
2149 rtx elim_i1 = (i1 == 0 || i1dest_in_i1src
2150 || (newi2pat && reg_set_p (i1dest, newi2pat))
2151 ? 0 : i1dest);
2153 /* Get the old REG_NOTES and LOG_LINKS from all our insns and
2154 clear them. */
2155 i3notes = REG_NOTES (i3), i3links = LOG_LINKS (i3);
2156 i2notes = REG_NOTES (i2), i2links = LOG_LINKS (i2);
2157 if (i1)
2158 i1notes = REG_NOTES (i1), i1links = LOG_LINKS (i1);
2160 /* Ensure that we do not have something that should not be shared but
2161 occurs multiple times in the new insns. Check this by first
2162 resetting all the `used' flags and then copying anything is shared. */
2164 reset_used_flags (i3notes);
2165 reset_used_flags (i2notes);
2166 reset_used_flags (i1notes);
2167 reset_used_flags (newpat);
2168 reset_used_flags (newi2pat);
2169 if (undobuf.other_insn)
2170 reset_used_flags (PATTERN (undobuf.other_insn));
2172 i3notes = copy_rtx_if_shared (i3notes);
2173 i2notes = copy_rtx_if_shared (i2notes);
2174 i1notes = copy_rtx_if_shared (i1notes);
2175 newpat = copy_rtx_if_shared (newpat);
2176 newi2pat = copy_rtx_if_shared (newi2pat);
2177 if (undobuf.other_insn)
2178 reset_used_flags (PATTERN (undobuf.other_insn));
2180 INSN_CODE (i3) = insn_code_number;
2181 PATTERN (i3) = newpat;
2182 if (undobuf.other_insn)
2183 INSN_CODE (undobuf.other_insn) = other_code_number;
2185 /* We had one special case above where I2 had more than one set and
2186 we replaced a destination of one of those sets with the destination
2187 of I3. In that case, we have to update LOG_LINKS of insns later
2188 in this basic block. Note that this (expensive) case is rare.
2190 Also, in this case, we must pretend that all REG_NOTEs for I2
2191 actually came from I3, so that REG_UNUSED notes from I2 will be
2192 properly handled. */
2194 if (i3_subst_into_i2)
2196 for (i = 0; i < XVECLEN (PATTERN (i2), 0); i++)
2197 if (GET_CODE (SET_DEST (XVECEXP (PATTERN (i2), 0, i))) == REG
2198 && SET_DEST (XVECEXP (PATTERN (i2), 0, i)) != i2dest
2199 && ! find_reg_note (i2, REG_UNUSED,
2200 SET_DEST (XVECEXP (PATTERN (i2), 0, i))))
2201 for (temp = NEXT_INSN (i2);
2202 temp && (this_basic_block == n_basic_blocks - 1
2203 || basic_block_head[this_basic_block] != temp);
2204 temp = NEXT_INSN (temp))
2205 if (temp != i3 && GET_RTX_CLASS (GET_CODE (temp)) == 'i')
2206 for (link = LOG_LINKS (temp); link; link = XEXP (link, 1))
2207 if (XEXP (link, 0) == i2)
2208 XEXP (link, 0) = i3;
2210 if (i3notes)
2212 rtx link = i3notes;
2213 while (XEXP (link, 1))
2214 link = XEXP (link, 1);
2215 XEXP (link, 1) = i2notes;
2217 else
2218 i3notes = i2notes;
2219 i2notes = 0;
2222 LOG_LINKS (i3) = 0;
2223 REG_NOTES (i3) = 0;
2224 LOG_LINKS (i2) = 0;
2225 REG_NOTES (i2) = 0;
2227 if (newi2pat)
2229 INSN_CODE (i2) = i2_code_number;
2230 PATTERN (i2) = newi2pat;
2232 else
2234 PUT_CODE (i2, NOTE);
2235 NOTE_LINE_NUMBER (i2) = NOTE_INSN_DELETED;
2236 NOTE_SOURCE_FILE (i2) = 0;
2239 if (i1)
2241 LOG_LINKS (i1) = 0;
2242 REG_NOTES (i1) = 0;
2243 PUT_CODE (i1, NOTE);
2244 NOTE_LINE_NUMBER (i1) = NOTE_INSN_DELETED;
2245 NOTE_SOURCE_FILE (i1) = 0;
2248 /* Get death notes for everything that is now used in either I3 or
2249 I2 and used to die in a previous insn. If we built two new
2250 patterns, move from I1 to I2 then I2 to I3 so that we get the
2251 proper movement on registers that I2 modifies. */
2253 if (newi2pat)
2255 move_deaths (newi2pat, NULL_RTX, INSN_CUID (i1), i2, &midnotes);
2256 move_deaths (newpat, newi2pat, INSN_CUID (i1), i3, &midnotes);
2258 else
2259 move_deaths (newpat, NULL_RTX, i1 ? INSN_CUID (i1) : INSN_CUID (i2),
2260 i3, &midnotes);
2262 /* Distribute all the LOG_LINKS and REG_NOTES from I1, I2, and I3. */
2263 if (i3notes)
2264 distribute_notes (i3notes, i3, i3, newi2pat ? i2 : NULL_RTX,
2265 elim_i2, elim_i1);
2266 if (i2notes)
2267 distribute_notes (i2notes, i2, i3, newi2pat ? i2 : NULL_RTX,
2268 elim_i2, elim_i1);
2269 if (i1notes)
2270 distribute_notes (i1notes, i1, i3, newi2pat ? i2 : NULL_RTX,
2271 elim_i2, elim_i1);
2272 if (midnotes)
2273 distribute_notes (midnotes, NULL_RTX, i3, newi2pat ? i2 : NULL_RTX,
2274 elim_i2, elim_i1);
2276 /* Distribute any notes added to I2 or I3 by recog_for_combine. We
2277 know these are REG_UNUSED and want them to go to the desired insn,
2278 so we always pass it as i3. We have not counted the notes in
2279 reg_n_deaths yet, so we need to do so now. */
2281 if (newi2pat && new_i2_notes)
2283 for (temp = new_i2_notes; temp; temp = XEXP (temp, 1))
2284 if (GET_CODE (XEXP (temp, 0)) == REG)
2285 REG_N_DEATHS (REGNO (XEXP (temp, 0)))++;
2287 distribute_notes (new_i2_notes, i2, i2, NULL_RTX, NULL_RTX, NULL_RTX);
2290 if (new_i3_notes)
2292 for (temp = new_i3_notes; temp; temp = XEXP (temp, 1))
2293 if (GET_CODE (XEXP (temp, 0)) == REG)
2294 REG_N_DEATHS (REGNO (XEXP (temp, 0)))++;
2296 distribute_notes (new_i3_notes, i3, i3, NULL_RTX, NULL_RTX, NULL_RTX);
2299 /* If I3DEST was used in I3SRC, it really died in I3. We may need to
2300 put a REG_DEAD note for it somewhere. Similarly for I2 and I1.
2301 Show an additional death due to the REG_DEAD note we make here. If
2302 we discard it in distribute_notes, we will decrement it again. */
2304 if (i3dest_killed)
2306 if (GET_CODE (i3dest_killed) == REG)
2307 REG_N_DEATHS (REGNO (i3dest_killed))++;
2309 distribute_notes (gen_rtx (EXPR_LIST, REG_DEAD, i3dest_killed,
2310 NULL_RTX),
2311 NULL_RTX, i3, newi2pat ? i2 : NULL_RTX,
2312 elim_i2, elim_i1);
2315 /* For I2 and I1, we have to be careful. If NEWI2PAT exists and sets
2316 I2DEST or I1DEST, the death must be somewhere before I2, not I3. If
2317 we passed I3 in that case, it might delete I2. */
2319 if (i2dest_in_i2src)
2321 if (GET_CODE (i2dest) == REG)
2322 REG_N_DEATHS (REGNO (i2dest))++;
2324 if (newi2pat && reg_set_p (i2dest, newi2pat))
2325 distribute_notes (gen_rtx (EXPR_LIST, REG_DEAD, i2dest, NULL_RTX),
2326 NULL_RTX, i2, NULL_RTX, NULL_RTX, NULL_RTX);
2327 else
2328 distribute_notes (gen_rtx (EXPR_LIST, REG_DEAD, i2dest, NULL_RTX),
2329 NULL_RTX, i3, newi2pat ? i2 : NULL_RTX,
2330 NULL_RTX, NULL_RTX);
2333 if (i1dest_in_i1src)
2335 if (GET_CODE (i1dest) == REG)
2336 REG_N_DEATHS (REGNO (i1dest))++;
2338 if (newi2pat && reg_set_p (i1dest, newi2pat))
2339 distribute_notes (gen_rtx (EXPR_LIST, REG_DEAD, i1dest, NULL_RTX),
2340 NULL_RTX, i2, NULL_RTX, NULL_RTX, NULL_RTX);
2341 else
2342 distribute_notes (gen_rtx (EXPR_LIST, REG_DEAD, i1dest, NULL_RTX),
2343 NULL_RTX, i3, newi2pat ? i2 : NULL_RTX,
2344 NULL_RTX, NULL_RTX);
2347 distribute_links (i3links);
2348 distribute_links (i2links);
2349 distribute_links (i1links);
2351 if (GET_CODE (i2dest) == REG)
2353 rtx link;
2354 rtx i2_insn = 0, i2_val = 0, set;
2356 /* The insn that used to set this register doesn't exist, and
2357 this life of the register may not exist either. See if one of
2358 I3's links points to an insn that sets I2DEST. If it does,
2359 that is now the last known value for I2DEST. If we don't update
2360 this and I2 set the register to a value that depended on its old
2361 contents, we will get confused. If this insn is used, thing
2362 will be set correctly in combine_instructions. */
2364 for (link = LOG_LINKS (i3); link; link = XEXP (link, 1))
2365 if ((set = single_set (XEXP (link, 0))) != 0
2366 && rtx_equal_p (i2dest, SET_DEST (set)))
2367 i2_insn = XEXP (link, 0), i2_val = SET_SRC (set);
2369 record_value_for_reg (i2dest, i2_insn, i2_val);
2371 /* If the reg formerly set in I2 died only once and that was in I3,
2372 zero its use count so it won't make `reload' do any work. */
2373 if (! added_sets_2
2374 && (newi2pat == 0 || ! reg_mentioned_p (i2dest, newi2pat))
2375 && ! i2dest_in_i2src)
2377 regno = REGNO (i2dest);
2378 REG_N_SETS (regno)--;
2379 if (REG_N_SETS (regno) == 0
2380 && ! REGNO_REG_SET_P (basic_block_live_at_start[0], regno))
2381 REG_N_REFS (regno) = 0;
2385 if (i1 && GET_CODE (i1dest) == REG)
2387 rtx link;
2388 rtx i1_insn = 0, i1_val = 0, set;
2390 for (link = LOG_LINKS (i3); link; link = XEXP (link, 1))
2391 if ((set = single_set (XEXP (link, 0))) != 0
2392 && rtx_equal_p (i1dest, SET_DEST (set)))
2393 i1_insn = XEXP (link, 0), i1_val = SET_SRC (set);
2395 record_value_for_reg (i1dest, i1_insn, i1_val);
2397 regno = REGNO (i1dest);
2398 if (! added_sets_1 && ! i1dest_in_i1src)
2400 REG_N_SETS (regno)--;
2401 if (REG_N_SETS (regno) == 0
2402 && ! REGNO_REG_SET_P (basic_block_live_at_start[0], regno))
2403 REG_N_REFS (regno) = 0;
2407 /* Update reg_nonzero_bits et al for any changes that may have been made
2408 to this insn. */
2410 note_stores (newpat, set_nonzero_bits_and_sign_copies);
2411 if (newi2pat)
2412 note_stores (newi2pat, set_nonzero_bits_and_sign_copies);
2414 /* If we added any (clobber (scratch)), add them to the max for a
2415 block. This is a very pessimistic calculation, since we might
2416 have had them already and this might not be the worst block, but
2417 it's not worth doing any better. */
2418 max_scratch += i3_scratches + i2_scratches + other_scratches;
2420 /* If I3 is now an unconditional jump, ensure that it has a
2421 BARRIER following it since it may have initially been a
2422 conditional jump. It may also be the last nonnote insn. */
2424 if ((GET_CODE (newpat) == RETURN || simplejump_p (i3))
2425 && ((temp = next_nonnote_insn (i3)) == NULL_RTX
2426 || GET_CODE (temp) != BARRIER))
2427 emit_barrier_after (i3);
2430 combine_successes++;
2432 /* Clear this here, so that subsequent get_last_value calls are not
2433 affected. */
2434 subst_prev_insn = NULL_RTX;
2436 if (added_links_insn
2437 && (newi2pat == 0 || INSN_CUID (added_links_insn) < INSN_CUID (i2))
2438 && INSN_CUID (added_links_insn) < INSN_CUID (i3))
2439 return added_links_insn;
2440 else
2441 return newi2pat ? i2 : i3;
2444 /* Undo all the modifications recorded in undobuf. */
2446 static void
2447 undo_all ()
2449 struct undo *undo, *next;
2451 for (undo = undobuf.undos; undo; undo = next)
2453 next = undo->next;
2454 if (undo->is_int)
2455 *undo->where.i = undo->old_contents.i;
2456 else
2457 *undo->where.r = undo->old_contents.r;
2459 undo->next = undobuf.frees;
2460 undobuf.frees = undo;
2463 obfree (undobuf.storage);
2464 undobuf.undos = undobuf.previous_undos = 0;
2466 /* Clear this here, so that subsequent get_last_value calls are not
2467 affected. */
2468 subst_prev_insn = NULL_RTX;
2471 /* Find the innermost point within the rtx at LOC, possibly LOC itself,
2472 where we have an arithmetic expression and return that point. LOC will
2473 be inside INSN.
2475 try_combine will call this function to see if an insn can be split into
2476 two insns. */
2478 static rtx *
2479 find_split_point (loc, insn)
2480 rtx *loc;
2481 rtx insn;
2483 rtx x = *loc;
2484 enum rtx_code code = GET_CODE (x);
2485 rtx *split;
2486 int len = 0, pos, unsignedp;
2487 rtx inner;
2489 /* First special-case some codes. */
2490 switch (code)
2492 case SUBREG:
2493 #ifdef INSN_SCHEDULING
2494 /* If we are making a paradoxical SUBREG invalid, it becomes a split
2495 point. */
2496 if (GET_CODE (SUBREG_REG (x)) == MEM)
2497 return loc;
2498 #endif
2499 return find_split_point (&SUBREG_REG (x), insn);
2501 case MEM:
2502 #ifdef HAVE_lo_sum
2503 /* If we have (mem (const ..)) or (mem (symbol_ref ...)), split it
2504 using LO_SUM and HIGH. */
2505 if (GET_CODE (XEXP (x, 0)) == CONST
2506 || GET_CODE (XEXP (x, 0)) == SYMBOL_REF)
2508 SUBST (XEXP (x, 0),
2509 gen_rtx_combine (LO_SUM, Pmode,
2510 gen_rtx_combine (HIGH, Pmode, XEXP (x, 0)),
2511 XEXP (x, 0)));
2512 return &XEXP (XEXP (x, 0), 0);
2514 #endif
2516 /* If we have a PLUS whose second operand is a constant and the
2517 address is not valid, perhaps will can split it up using
2518 the machine-specific way to split large constants. We use
2519 the first pseudo-reg (one of the virtual regs) as a placeholder;
2520 it will not remain in the result. */
2521 if (GET_CODE (XEXP (x, 0)) == PLUS
2522 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
2523 && ! memory_address_p (GET_MODE (x), XEXP (x, 0)))
2525 rtx reg = regno_reg_rtx[FIRST_PSEUDO_REGISTER];
2526 rtx seq = split_insns (gen_rtx (SET, VOIDmode, reg, XEXP (x, 0)),
2527 subst_insn);
2529 /* This should have produced two insns, each of which sets our
2530 placeholder. If the source of the second is a valid address,
2531 we can make put both sources together and make a split point
2532 in the middle. */
2534 if (seq && XVECLEN (seq, 0) == 2
2535 && GET_CODE (XVECEXP (seq, 0, 0)) == INSN
2536 && GET_CODE (PATTERN (XVECEXP (seq, 0, 0))) == SET
2537 && SET_DEST (PATTERN (XVECEXP (seq, 0, 0))) == reg
2538 && ! reg_mentioned_p (reg,
2539 SET_SRC (PATTERN (XVECEXP (seq, 0, 0))))
2540 && GET_CODE (XVECEXP (seq, 0, 1)) == INSN
2541 && GET_CODE (PATTERN (XVECEXP (seq, 0, 1))) == SET
2542 && SET_DEST (PATTERN (XVECEXP (seq, 0, 1))) == reg
2543 && memory_address_p (GET_MODE (x),
2544 SET_SRC (PATTERN (XVECEXP (seq, 0, 1)))))
2546 rtx src1 = SET_SRC (PATTERN (XVECEXP (seq, 0, 0)));
2547 rtx src2 = SET_SRC (PATTERN (XVECEXP (seq, 0, 1)));
2549 /* Replace the placeholder in SRC2 with SRC1. If we can
2550 find where in SRC2 it was placed, that can become our
2551 split point and we can replace this address with SRC2.
2552 Just try two obvious places. */
2554 src2 = replace_rtx (src2, reg, src1);
2555 split = 0;
2556 if (XEXP (src2, 0) == src1)
2557 split = &XEXP (src2, 0);
2558 else if (GET_RTX_FORMAT (GET_CODE (XEXP (src2, 0)))[0] == 'e'
2559 && XEXP (XEXP (src2, 0), 0) == src1)
2560 split = &XEXP (XEXP (src2, 0), 0);
2562 if (split)
2564 SUBST (XEXP (x, 0), src2);
2565 return split;
2569 /* If that didn't work, perhaps the first operand is complex and
2570 needs to be computed separately, so make a split point there.
2571 This will occur on machines that just support REG + CONST
2572 and have a constant moved through some previous computation. */
2574 else if (GET_RTX_CLASS (GET_CODE (XEXP (XEXP (x, 0), 0))) != 'o'
2575 && ! (GET_CODE (XEXP (XEXP (x, 0), 0)) == SUBREG
2576 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (XEXP (x, 0), 0))))
2577 == 'o')))
2578 return &XEXP (XEXP (x, 0), 0);
2580 break;
2582 case SET:
2583 #ifdef HAVE_cc0
2584 /* If SET_DEST is CC0 and SET_SRC is not an operand, a COMPARE, or a
2585 ZERO_EXTRACT, the most likely reason why this doesn't match is that
2586 we need to put the operand into a register. So split at that
2587 point. */
2589 if (SET_DEST (x) == cc0_rtx
2590 && GET_CODE (SET_SRC (x)) != COMPARE
2591 && GET_CODE (SET_SRC (x)) != ZERO_EXTRACT
2592 && GET_RTX_CLASS (GET_CODE (SET_SRC (x))) != 'o'
2593 && ! (GET_CODE (SET_SRC (x)) == SUBREG
2594 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (SET_SRC (x)))) == 'o'))
2595 return &SET_SRC (x);
2596 #endif
2598 /* See if we can split SET_SRC as it stands. */
2599 split = find_split_point (&SET_SRC (x), insn);
2600 if (split && split != &SET_SRC (x))
2601 return split;
2603 /* See if we can split SET_DEST as it stands. */
2604 split = find_split_point (&SET_DEST (x), insn);
2605 if (split && split != &SET_DEST (x))
2606 return split;
2608 /* See if this is a bitfield assignment with everything constant. If
2609 so, this is an IOR of an AND, so split it into that. */
2610 if (GET_CODE (SET_DEST (x)) == ZERO_EXTRACT
2611 && (GET_MODE_BITSIZE (GET_MODE (XEXP (SET_DEST (x), 0)))
2612 <= HOST_BITS_PER_WIDE_INT)
2613 && GET_CODE (XEXP (SET_DEST (x), 1)) == CONST_INT
2614 && GET_CODE (XEXP (SET_DEST (x), 2)) == CONST_INT
2615 && GET_CODE (SET_SRC (x)) == CONST_INT
2616 && ((INTVAL (XEXP (SET_DEST (x), 1))
2617 + INTVAL (XEXP (SET_DEST (x), 2)))
2618 <= GET_MODE_BITSIZE (GET_MODE (XEXP (SET_DEST (x), 0))))
2619 && ! side_effects_p (XEXP (SET_DEST (x), 0)))
2621 int pos = INTVAL (XEXP (SET_DEST (x), 2));
2622 int len = INTVAL (XEXP (SET_DEST (x), 1));
2623 int src = INTVAL (SET_SRC (x));
2624 rtx dest = XEXP (SET_DEST (x), 0);
2625 enum machine_mode mode = GET_MODE (dest);
2626 unsigned HOST_WIDE_INT mask = ((HOST_WIDE_INT) 1 << len) - 1;
2628 if (BITS_BIG_ENDIAN)
2629 pos = GET_MODE_BITSIZE (mode) - len - pos;
2631 if (src == mask)
2632 SUBST (SET_SRC (x),
2633 gen_binary (IOR, mode, dest, GEN_INT (src << pos)));
2634 else
2635 SUBST (SET_SRC (x),
2636 gen_binary (IOR, mode,
2637 gen_binary (AND, mode, dest,
2638 GEN_INT (~ (mask << pos)
2639 & GET_MODE_MASK (mode))),
2640 GEN_INT (src << pos)));
2642 SUBST (SET_DEST (x), dest);
2644 split = find_split_point (&SET_SRC (x), insn);
2645 if (split && split != &SET_SRC (x))
2646 return split;
2649 /* Otherwise, see if this is an operation that we can split into two.
2650 If so, try to split that. */
2651 code = GET_CODE (SET_SRC (x));
2653 switch (code)
2655 case AND:
2656 /* If we are AND'ing with a large constant that is only a single
2657 bit and the result is only being used in a context where we
2658 need to know if it is zero or non-zero, replace it with a bit
2659 extraction. This will avoid the large constant, which might
2660 have taken more than one insn to make. If the constant were
2661 not a valid argument to the AND but took only one insn to make,
2662 this is no worse, but if it took more than one insn, it will
2663 be better. */
2665 if (GET_CODE (XEXP (SET_SRC (x), 1)) == CONST_INT
2666 && GET_CODE (XEXP (SET_SRC (x), 0)) == REG
2667 && (pos = exact_log2 (INTVAL (XEXP (SET_SRC (x), 1)))) >= 7
2668 && GET_CODE (SET_DEST (x)) == REG
2669 && (split = find_single_use (SET_DEST (x), insn, NULL_PTR)) != 0
2670 && (GET_CODE (*split) == EQ || GET_CODE (*split) == NE)
2671 && XEXP (*split, 0) == SET_DEST (x)
2672 && XEXP (*split, 1) == const0_rtx)
2674 rtx extraction = make_extraction (GET_MODE (SET_DEST (x)),
2675 XEXP (SET_SRC (x), 0),
2676 pos, NULL_RTX, 1, 1, 0, 0);
2677 if (extraction != 0)
2679 SUBST (SET_SRC (x), extraction);
2680 return find_split_point (loc, insn);
2683 break;
2685 case NE:
2686 /* if STORE_FLAG_VALUE is -1, this is (NE X 0) and only one bit of X
2687 is known to be on, this can be converted into a NEG of a shift. */
2688 if (STORE_FLAG_VALUE == -1 && XEXP (SET_SRC (x), 1) == const0_rtx
2689 && GET_MODE (SET_SRC (x)) == GET_MODE (XEXP (SET_SRC (x), 0))
2690 && 1 <= (pos = exact_log2
2691 (nonzero_bits (XEXP (SET_SRC (x), 0),
2692 GET_MODE (XEXP (SET_SRC (x), 0))))))
2694 enum machine_mode mode = GET_MODE (XEXP (SET_SRC (x), 0));
2696 SUBST (SET_SRC (x),
2697 gen_rtx_combine (NEG, mode,
2698 gen_rtx_combine (LSHIFTRT, mode,
2699 XEXP (SET_SRC (x), 0),
2700 GEN_INT (pos))));
2702 split = find_split_point (&SET_SRC (x), insn);
2703 if (split && split != &SET_SRC (x))
2704 return split;
2706 break;
2708 case SIGN_EXTEND:
2709 inner = XEXP (SET_SRC (x), 0);
2711 /* We can't optimize if either mode is a partial integer
2712 mode as we don't know how many bits are significant
2713 in those modes. */
2714 if (GET_MODE_CLASS (GET_MODE (inner)) == MODE_PARTIAL_INT
2715 || GET_MODE_CLASS (GET_MODE (SET_SRC (x))) == MODE_PARTIAL_INT)
2716 break;
2718 pos = 0;
2719 len = GET_MODE_BITSIZE (GET_MODE (inner));
2720 unsignedp = 0;
2721 break;
2723 case SIGN_EXTRACT:
2724 case ZERO_EXTRACT:
2725 if (GET_CODE (XEXP (SET_SRC (x), 1)) == CONST_INT
2726 && GET_CODE (XEXP (SET_SRC (x), 2)) == CONST_INT)
2728 inner = XEXP (SET_SRC (x), 0);
2729 len = INTVAL (XEXP (SET_SRC (x), 1));
2730 pos = INTVAL (XEXP (SET_SRC (x), 2));
2732 if (BITS_BIG_ENDIAN)
2733 pos = GET_MODE_BITSIZE (GET_MODE (inner)) - len - pos;
2734 unsignedp = (code == ZERO_EXTRACT);
2736 break;
2739 if (len && pos >= 0 && pos + len <= GET_MODE_BITSIZE (GET_MODE (inner)))
2741 enum machine_mode mode = GET_MODE (SET_SRC (x));
2743 /* For unsigned, we have a choice of a shift followed by an
2744 AND or two shifts. Use two shifts for field sizes where the
2745 constant might be too large. We assume here that we can
2746 always at least get 8-bit constants in an AND insn, which is
2747 true for every current RISC. */
2749 if (unsignedp && len <= 8)
2751 SUBST (SET_SRC (x),
2752 gen_rtx_combine
2753 (AND, mode,
2754 gen_rtx_combine (LSHIFTRT, mode,
2755 gen_lowpart_for_combine (mode, inner),
2756 GEN_INT (pos)),
2757 GEN_INT (((HOST_WIDE_INT) 1 << len) - 1)));
2759 split = find_split_point (&SET_SRC (x), insn);
2760 if (split && split != &SET_SRC (x))
2761 return split;
2763 else
2765 SUBST (SET_SRC (x),
2766 gen_rtx_combine
2767 (unsignedp ? LSHIFTRT : ASHIFTRT, mode,
2768 gen_rtx_combine (ASHIFT, mode,
2769 gen_lowpart_for_combine (mode, inner),
2770 GEN_INT (GET_MODE_BITSIZE (mode)
2771 - len - pos)),
2772 GEN_INT (GET_MODE_BITSIZE (mode) - len)));
2774 split = find_split_point (&SET_SRC (x), insn);
2775 if (split && split != &SET_SRC (x))
2776 return split;
2780 /* See if this is a simple operation with a constant as the second
2781 operand. It might be that this constant is out of range and hence
2782 could be used as a split point. */
2783 if ((GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == '2'
2784 || GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == 'c'
2785 || GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == '<')
2786 && CONSTANT_P (XEXP (SET_SRC (x), 1))
2787 && (GET_RTX_CLASS (GET_CODE (XEXP (SET_SRC (x), 0))) == 'o'
2788 || (GET_CODE (XEXP (SET_SRC (x), 0)) == SUBREG
2789 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (SET_SRC (x), 0))))
2790 == 'o'))))
2791 return &XEXP (SET_SRC (x), 1);
2793 /* Finally, see if this is a simple operation with its first operand
2794 not in a register. The operation might require this operand in a
2795 register, so return it as a split point. We can always do this
2796 because if the first operand were another operation, we would have
2797 already found it as a split point. */
2798 if ((GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == '2'
2799 || GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == 'c'
2800 || GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == '<'
2801 || GET_RTX_CLASS (GET_CODE (SET_SRC (x))) == '1')
2802 && ! register_operand (XEXP (SET_SRC (x), 0), VOIDmode))
2803 return &XEXP (SET_SRC (x), 0);
2805 return 0;
2807 case AND:
2808 case IOR:
2809 /* We write NOR as (and (not A) (not B)), but if we don't have a NOR,
2810 it is better to write this as (not (ior A B)) so we can split it.
2811 Similarly for IOR. */
2812 if (GET_CODE (XEXP (x, 0)) == NOT && GET_CODE (XEXP (x, 1)) == NOT)
2814 SUBST (*loc,
2815 gen_rtx_combine (NOT, GET_MODE (x),
2816 gen_rtx_combine (code == IOR ? AND : IOR,
2817 GET_MODE (x),
2818 XEXP (XEXP (x, 0), 0),
2819 XEXP (XEXP (x, 1), 0))));
2820 return find_split_point (loc, insn);
2823 /* Many RISC machines have a large set of logical insns. If the
2824 second operand is a NOT, put it first so we will try to split the
2825 other operand first. */
2826 if (GET_CODE (XEXP (x, 1)) == NOT)
2828 rtx tem = XEXP (x, 0);
2829 SUBST (XEXP (x, 0), XEXP (x, 1));
2830 SUBST (XEXP (x, 1), tem);
2832 break;
2835 /* Otherwise, select our actions depending on our rtx class. */
2836 switch (GET_RTX_CLASS (code))
2838 case 'b': /* This is ZERO_EXTRACT and SIGN_EXTRACT. */
2839 case '3':
2840 split = find_split_point (&XEXP (x, 2), insn);
2841 if (split)
2842 return split;
2843 /* ... fall through ... */
2844 case '2':
2845 case 'c':
2846 case '<':
2847 split = find_split_point (&XEXP (x, 1), insn);
2848 if (split)
2849 return split;
2850 /* ... fall through ... */
2851 case '1':
2852 /* Some machines have (and (shift ...) ...) insns. If X is not
2853 an AND, but XEXP (X, 0) is, use it as our split point. */
2854 if (GET_CODE (x) != AND && GET_CODE (XEXP (x, 0)) == AND)
2855 return &XEXP (x, 0);
2857 split = find_split_point (&XEXP (x, 0), insn);
2858 if (split)
2859 return split;
2860 return loc;
2863 /* Otherwise, we don't have a split point. */
2864 return 0;
2867 /* Throughout X, replace FROM with TO, and return the result.
2868 The result is TO if X is FROM;
2869 otherwise the result is X, but its contents may have been modified.
2870 If they were modified, a record was made in undobuf so that
2871 undo_all will (among other things) return X to its original state.
2873 If the number of changes necessary is too much to record to undo,
2874 the excess changes are not made, so the result is invalid.
2875 The changes already made can still be undone.
2876 undobuf.num_undo is incremented for such changes, so by testing that
2877 the caller can tell whether the result is valid.
2879 `n_occurrences' is incremented each time FROM is replaced.
2881 IN_DEST is non-zero if we are processing the SET_DEST of a SET.
2883 UNIQUE_COPY is non-zero if each substitution must be unique. We do this
2884 by copying if `n_occurrences' is non-zero. */
2886 static rtx
2887 subst (x, from, to, in_dest, unique_copy)
2888 register rtx x, from, to;
2889 int in_dest;
2890 int unique_copy;
2892 register enum rtx_code code = GET_CODE (x);
2893 enum machine_mode op0_mode = VOIDmode;
2894 register char *fmt;
2895 register int len, i;
2896 rtx new;
2898 /* Two expressions are equal if they are identical copies of a shared
2899 RTX or if they are both registers with the same register number
2900 and mode. */
2902 #define COMBINE_RTX_EQUAL_P(X,Y) \
2903 ((X) == (Y) \
2904 || (GET_CODE (X) == REG && GET_CODE (Y) == REG \
2905 && REGNO (X) == REGNO (Y) && GET_MODE (X) == GET_MODE (Y)))
2907 if (! in_dest && COMBINE_RTX_EQUAL_P (x, from))
2909 n_occurrences++;
2910 return (unique_copy && n_occurrences > 1 ? copy_rtx (to) : to);
2913 /* If X and FROM are the same register but different modes, they will
2914 not have been seen as equal above. However, flow.c will make a
2915 LOG_LINKS entry for that case. If we do nothing, we will try to
2916 rerecognize our original insn and, when it succeeds, we will
2917 delete the feeding insn, which is incorrect.
2919 So force this insn not to match in this (rare) case. */
2920 if (! in_dest && code == REG && GET_CODE (from) == REG
2921 && REGNO (x) == REGNO (from))
2922 return gen_rtx (CLOBBER, GET_MODE (x), const0_rtx);
2924 /* If this is an object, we are done unless it is a MEM or LO_SUM, both
2925 of which may contain things that can be combined. */
2926 if (code != MEM && code != LO_SUM && GET_RTX_CLASS (code) == 'o')
2927 return x;
2929 /* It is possible to have a subexpression appear twice in the insn.
2930 Suppose that FROM is a register that appears within TO.
2931 Then, after that subexpression has been scanned once by `subst',
2932 the second time it is scanned, TO may be found. If we were
2933 to scan TO here, we would find FROM within it and create a
2934 self-referent rtl structure which is completely wrong. */
2935 if (COMBINE_RTX_EQUAL_P (x, to))
2936 return to;
2938 len = GET_RTX_LENGTH (code);
2939 fmt = GET_RTX_FORMAT (code);
2941 /* We don't need to process a SET_DEST that is a register, CC0, or PC, so
2942 set up to skip this common case. All other cases where we want to
2943 suppress replacing something inside a SET_SRC are handled via the
2944 IN_DEST operand. */
2945 if (code == SET
2946 && (GET_CODE (SET_DEST (x)) == REG
2947 || GET_CODE (SET_DEST (x)) == CC0
2948 || GET_CODE (SET_DEST (x)) == PC))
2949 fmt = "ie";
2951 /* Get the mode of operand 0 in case X is now a SIGN_EXTEND of a
2952 constant. */
2953 if (fmt[0] == 'e')
2954 op0_mode = GET_MODE (XEXP (x, 0));
2956 for (i = 0; i < len; i++)
2958 if (fmt[i] == 'E')
2960 register int j;
2961 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
2963 if (COMBINE_RTX_EQUAL_P (XVECEXP (x, i, j), from))
2965 new = (unique_copy && n_occurrences ? copy_rtx (to) : to);
2966 n_occurrences++;
2968 else
2970 new = subst (XVECEXP (x, i, j), from, to, 0, unique_copy);
2972 /* If this substitution failed, this whole thing fails. */
2973 if (GET_CODE (new) == CLOBBER && XEXP (new, 0) == const0_rtx)
2974 return new;
2977 SUBST (XVECEXP (x, i, j), new);
2980 else if (fmt[i] == 'e')
2982 if (COMBINE_RTX_EQUAL_P (XEXP (x, i), from))
2984 /* In general, don't install a subreg involving two modes not
2985 tieable. It can worsen register allocation, and can even
2986 make invalid reload insns, since the reg inside may need to
2987 be copied from in the outside mode, and that may be invalid
2988 if it is an fp reg copied in integer mode.
2990 We allow two exceptions to this: It is valid if it is inside
2991 another SUBREG and the mode of that SUBREG and the mode of
2992 the inside of TO is tieable and it is valid if X is a SET
2993 that copies FROM to CC0. */
2994 if (GET_CODE (to) == SUBREG
2995 && ! MODES_TIEABLE_P (GET_MODE (to),
2996 GET_MODE (SUBREG_REG (to)))
2997 && ! (code == SUBREG
2998 && MODES_TIEABLE_P (GET_MODE (x),
2999 GET_MODE (SUBREG_REG (to))))
3000 #ifdef HAVE_cc0
3001 && ! (code == SET && i == 1 && XEXP (x, 0) == cc0_rtx)
3002 #endif
3004 return gen_rtx (CLOBBER, VOIDmode, const0_rtx);
3006 new = (unique_copy && n_occurrences ? copy_rtx (to) : to);
3007 n_occurrences++;
3009 else
3010 /* If we are in a SET_DEST, suppress most cases unless we
3011 have gone inside a MEM, in which case we want to
3012 simplify the address. We assume here that things that
3013 are actually part of the destination have their inner
3014 parts in the first expression. This is true for SUBREG,
3015 STRICT_LOW_PART, and ZERO_EXTRACT, which are the only
3016 things aside from REG and MEM that should appear in a
3017 SET_DEST. */
3018 new = subst (XEXP (x, i), from, to,
3019 (((in_dest
3020 && (code == SUBREG || code == STRICT_LOW_PART
3021 || code == ZERO_EXTRACT))
3022 || code == SET)
3023 && i == 0), unique_copy);
3025 /* If we found that we will have to reject this combination,
3026 indicate that by returning the CLOBBER ourselves, rather than
3027 an expression containing it. This will speed things up as
3028 well as prevent accidents where two CLOBBERs are considered
3029 to be equal, thus producing an incorrect simplification. */
3031 if (GET_CODE (new) == CLOBBER && XEXP (new, 0) == const0_rtx)
3032 return new;
3034 SUBST (XEXP (x, i), new);
3038 /* Try to simplify X. If the simplification changed the code, it is likely
3039 that further simplification will help, so loop, but limit the number
3040 of repetitions that will be performed. */
3042 for (i = 0; i < 4; i++)
3044 /* If X is sufficiently simple, don't bother trying to do anything
3045 with it. */
3046 if (code != CONST_INT && code != REG && code != CLOBBER)
3047 x = simplify_rtx (x, op0_mode, i == 3, in_dest);
3049 if (GET_CODE (x) == code)
3050 break;
3052 code = GET_CODE (x);
3054 /* We no longer know the original mode of operand 0 since we
3055 have changed the form of X) */
3056 op0_mode = VOIDmode;
3059 return x;
3062 /* Simplify X, a piece of RTL. We just operate on the expression at the
3063 outer level; call `subst' to simplify recursively. Return the new
3064 expression.
3066 OP0_MODE is the original mode of XEXP (x, 0); LAST is nonzero if this
3067 will be the iteration even if an expression with a code different from
3068 X is returned; IN_DEST is nonzero if we are inside a SET_DEST. */
3070 static rtx
3071 simplify_rtx (x, op0_mode, last, in_dest)
3072 rtx x;
3073 enum machine_mode op0_mode;
3074 int last;
3075 int in_dest;
3077 enum rtx_code code = GET_CODE (x);
3078 enum machine_mode mode = GET_MODE (x);
3079 rtx temp;
3080 int i;
3082 /* If this is a commutative operation, put a constant last and a complex
3083 expression first. We don't need to do this for comparisons here. */
3084 if (GET_RTX_CLASS (code) == 'c'
3085 && ((CONSTANT_P (XEXP (x, 0)) && GET_CODE (XEXP (x, 1)) != CONST_INT)
3086 || (GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) == 'o'
3087 && GET_RTX_CLASS (GET_CODE (XEXP (x, 1))) != 'o')
3088 || (GET_CODE (XEXP (x, 0)) == SUBREG
3089 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (x, 0)))) == 'o'
3090 && GET_RTX_CLASS (GET_CODE (XEXP (x, 1))) != 'o')))
3092 temp = XEXP (x, 0);
3093 SUBST (XEXP (x, 0), XEXP (x, 1));
3094 SUBST (XEXP (x, 1), temp);
3097 /* If this is a PLUS, MINUS, or MULT, and the first operand is the
3098 sign extension of a PLUS with a constant, reverse the order of the sign
3099 extension and the addition. Note that this not the same as the original
3100 code, but overflow is undefined for signed values. Also note that the
3101 PLUS will have been partially moved "inside" the sign-extension, so that
3102 the first operand of X will really look like:
3103 (ashiftrt (plus (ashift A C4) C5) C4).
3104 We convert this to
3105 (plus (ashiftrt (ashift A C4) C2) C4)
3106 and replace the first operand of X with that expression. Later parts
3107 of this function may simplify the expression further.
3109 For example, if we start with (mult (sign_extend (plus A C1)) C2),
3110 we swap the SIGN_EXTEND and PLUS. Later code will apply the
3111 distributive law to produce (plus (mult (sign_extend X) C1) C3).
3113 We do this to simplify address expressions. */
3115 if ((code == PLUS || code == MINUS || code == MULT)
3116 && GET_CODE (XEXP (x, 0)) == ASHIFTRT
3117 && GET_CODE (XEXP (XEXP (x, 0), 0)) == PLUS
3118 && GET_CODE (XEXP (XEXP (XEXP (x, 0), 0), 0)) == ASHIFT
3119 && GET_CODE (XEXP (XEXP (XEXP (XEXP (x, 0), 0), 0), 1)) == CONST_INT
3120 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
3121 && XEXP (XEXP (XEXP (XEXP (x, 0), 0), 0), 1) == XEXP (XEXP (x, 0), 1)
3122 && GET_CODE (XEXP (XEXP (XEXP (x, 0), 0), 1)) == CONST_INT
3123 && (temp = simplify_binary_operation (ASHIFTRT, mode,
3124 XEXP (XEXP (XEXP (x, 0), 0), 1),
3125 XEXP (XEXP (x, 0), 1))) != 0)
3127 rtx new
3128 = simplify_shift_const (NULL_RTX, ASHIFT, mode,
3129 XEXP (XEXP (XEXP (XEXP (x, 0), 0), 0), 0),
3130 INTVAL (XEXP (XEXP (x, 0), 1)));
3132 new = simplify_shift_const (NULL_RTX, ASHIFTRT, mode, new,
3133 INTVAL (XEXP (XEXP (x, 0), 1)));
3135 SUBST (XEXP (x, 0), gen_binary (PLUS, mode, new, temp));
3138 /* If this is a simple operation applied to an IF_THEN_ELSE, try
3139 applying it to the arms of the IF_THEN_ELSE. This often simplifies
3140 things. Check for cases where both arms are testing the same
3141 condition.
3143 Don't do anything if all operands are very simple. */
3145 if (((GET_RTX_CLASS (code) == '2' || GET_RTX_CLASS (code) == 'c'
3146 || GET_RTX_CLASS (code) == '<')
3147 && ((GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) != 'o'
3148 && ! (GET_CODE (XEXP (x, 0)) == SUBREG
3149 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (x, 0))))
3150 == 'o')))
3151 || (GET_RTX_CLASS (GET_CODE (XEXP (x, 1))) != 'o'
3152 && ! (GET_CODE (XEXP (x, 1)) == SUBREG
3153 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (x, 1))))
3154 == 'o')))))
3155 || (GET_RTX_CLASS (code) == '1'
3156 && ((GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) != 'o'
3157 && ! (GET_CODE (XEXP (x, 0)) == SUBREG
3158 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (x, 0))))
3159 == 'o'))))))
3161 rtx cond, true, false;
3163 cond = if_then_else_cond (x, &true, &false);
3164 if (cond != 0
3165 /* If everything is a comparison, what we have is highly unlikely
3166 to be simpler, so don't use it. */
3167 && ! (GET_RTX_CLASS (code) == '<'
3168 && (GET_RTX_CLASS (GET_CODE (true)) == '<'
3169 || GET_RTX_CLASS (GET_CODE (false)) == '<')))
3171 rtx cop1 = const0_rtx;
3172 enum rtx_code cond_code = simplify_comparison (NE, &cond, &cop1);
3174 if (cond_code == NE && GET_RTX_CLASS (GET_CODE (cond)) == '<')
3175 return x;
3177 /* Simplify the alternative arms; this may collapse the true and
3178 false arms to store-flag values. */
3179 true = subst (true, pc_rtx, pc_rtx, 0, 0);
3180 false = subst (false, pc_rtx, pc_rtx, 0, 0);
3182 /* Restarting if we generate a store-flag expression will cause
3183 us to loop. Just drop through in this case. */
3185 /* If the result values are STORE_FLAG_VALUE and zero, we can
3186 just make the comparison operation. */
3187 if (true == const_true_rtx && false == const0_rtx)
3188 x = gen_binary (cond_code, mode, cond, cop1);
3189 else if (true == const0_rtx && false == const_true_rtx)
3190 x = gen_binary (reverse_condition (cond_code), mode, cond, cop1);
3192 /* Likewise, we can make the negate of a comparison operation
3193 if the result values are - STORE_FLAG_VALUE and zero. */
3194 else if (GET_CODE (true) == CONST_INT
3195 && INTVAL (true) == - STORE_FLAG_VALUE
3196 && false == const0_rtx)
3197 x = gen_unary (NEG, mode, mode,
3198 gen_binary (cond_code, mode, cond, cop1));
3199 else if (GET_CODE (false) == CONST_INT
3200 && INTVAL (false) == - STORE_FLAG_VALUE
3201 && true == const0_rtx)
3202 x = gen_unary (NEG, mode, mode,
3203 gen_binary (reverse_condition (cond_code),
3204 mode, cond, cop1));
3205 else
3206 return gen_rtx (IF_THEN_ELSE, mode,
3207 gen_binary (cond_code, VOIDmode, cond, cop1),
3208 true, false);
3210 code = GET_CODE (x);
3211 op0_mode = VOIDmode;
3215 /* Try to fold this expression in case we have constants that weren't
3216 present before. */
3217 temp = 0;
3218 switch (GET_RTX_CLASS (code))
3220 case '1':
3221 temp = simplify_unary_operation (code, mode, XEXP (x, 0), op0_mode);
3222 break;
3223 case '<':
3224 temp = simplify_relational_operation (code, op0_mode,
3225 XEXP (x, 0), XEXP (x, 1));
3226 #ifdef FLOAT_STORE_FLAG_VALUE
3227 if (temp != 0 && GET_MODE_CLASS (GET_MODE (x)) == MODE_FLOAT)
3228 temp = ((temp == const0_rtx) ? CONST0_RTX (GET_MODE (x))
3229 : immed_real_const_1 (FLOAT_STORE_FLAG_VALUE, GET_MODE (x)));
3230 #endif
3231 break;
3232 case 'c':
3233 case '2':
3234 temp = simplify_binary_operation (code, mode, XEXP (x, 0), XEXP (x, 1));
3235 break;
3236 case 'b':
3237 case '3':
3238 temp = simplify_ternary_operation (code, mode, op0_mode, XEXP (x, 0),
3239 XEXP (x, 1), XEXP (x, 2));
3240 break;
3243 if (temp)
3244 x = temp, code = GET_CODE (temp);
3246 /* First see if we can apply the inverse distributive law. */
3247 if (code == PLUS || code == MINUS
3248 || code == AND || code == IOR || code == XOR)
3250 x = apply_distributive_law (x);
3251 code = GET_CODE (x);
3254 /* If CODE is an associative operation not otherwise handled, see if we
3255 can associate some operands. This can win if they are constants or
3256 if they are logically related (i.e. (a & b) & a. */
3257 if ((code == PLUS || code == MINUS
3258 || code == MULT || code == AND || code == IOR || code == XOR
3259 || code == DIV || code == UDIV
3260 || code == SMAX || code == SMIN || code == UMAX || code == UMIN)
3261 && INTEGRAL_MODE_P (mode))
3263 if (GET_CODE (XEXP (x, 0)) == code)
3265 rtx other = XEXP (XEXP (x, 0), 0);
3266 rtx inner_op0 = XEXP (XEXP (x, 0), 1);
3267 rtx inner_op1 = XEXP (x, 1);
3268 rtx inner;
3270 /* Make sure we pass the constant operand if any as the second
3271 one if this is a commutative operation. */
3272 if (CONSTANT_P (inner_op0) && GET_RTX_CLASS (code) == 'c')
3274 rtx tem = inner_op0;
3275 inner_op0 = inner_op1;
3276 inner_op1 = tem;
3278 inner = simplify_binary_operation (code == MINUS ? PLUS
3279 : code == DIV ? MULT
3280 : code == UDIV ? MULT
3281 : code,
3282 mode, inner_op0, inner_op1);
3284 /* For commutative operations, try the other pair if that one
3285 didn't simplify. */
3286 if (inner == 0 && GET_RTX_CLASS (code) == 'c')
3288 other = XEXP (XEXP (x, 0), 1);
3289 inner = simplify_binary_operation (code, mode,
3290 XEXP (XEXP (x, 0), 0),
3291 XEXP (x, 1));
3294 if (inner)
3295 return gen_binary (code, mode, other, inner);
3299 /* A little bit of algebraic simplification here. */
3300 switch (code)
3302 case MEM:
3303 /* Ensure that our address has any ASHIFTs converted to MULT in case
3304 address-recognizing predicates are called later. */
3305 temp = make_compound_operation (XEXP (x, 0), MEM);
3306 SUBST (XEXP (x, 0), temp);
3307 break;
3309 case SUBREG:
3310 /* (subreg:A (mem:B X) N) becomes a modified MEM unless the SUBREG
3311 is paradoxical. If we can't do that safely, then it becomes
3312 something nonsensical so that this combination won't take place. */
3314 if (GET_CODE (SUBREG_REG (x)) == MEM
3315 && (GET_MODE_SIZE (mode)
3316 <= GET_MODE_SIZE (GET_MODE (SUBREG_REG (x)))))
3318 rtx inner = SUBREG_REG (x);
3319 int endian_offset = 0;
3320 /* Don't change the mode of the MEM
3321 if that would change the meaning of the address. */
3322 if (MEM_VOLATILE_P (SUBREG_REG (x))
3323 || mode_dependent_address_p (XEXP (inner, 0)))
3324 return gen_rtx (CLOBBER, mode, const0_rtx);
3326 if (BYTES_BIG_ENDIAN)
3328 if (GET_MODE_SIZE (mode) < UNITS_PER_WORD)
3329 endian_offset += UNITS_PER_WORD - GET_MODE_SIZE (mode);
3330 if (GET_MODE_SIZE (GET_MODE (inner)) < UNITS_PER_WORD)
3331 endian_offset -= (UNITS_PER_WORD
3332 - GET_MODE_SIZE (GET_MODE (inner)));
3334 /* Note if the plus_constant doesn't make a valid address
3335 then this combination won't be accepted. */
3336 x = gen_rtx (MEM, mode,
3337 plus_constant (XEXP (inner, 0),
3338 (SUBREG_WORD (x) * UNITS_PER_WORD
3339 + endian_offset)));
3340 MEM_VOLATILE_P (x) = MEM_VOLATILE_P (inner);
3341 RTX_UNCHANGING_P (x) = RTX_UNCHANGING_P (inner);
3342 MEM_IN_STRUCT_P (x) = MEM_IN_STRUCT_P (inner);
3343 return x;
3346 /* If we are in a SET_DEST, these other cases can't apply. */
3347 if (in_dest)
3348 return x;
3350 /* Changing mode twice with SUBREG => just change it once,
3351 or not at all if changing back to starting mode. */
3352 if (GET_CODE (SUBREG_REG (x)) == SUBREG)
3354 if (mode == GET_MODE (SUBREG_REG (SUBREG_REG (x)))
3355 && SUBREG_WORD (x) == 0 && SUBREG_WORD (SUBREG_REG (x)) == 0)
3356 return SUBREG_REG (SUBREG_REG (x));
3358 SUBST_INT (SUBREG_WORD (x),
3359 SUBREG_WORD (x) + SUBREG_WORD (SUBREG_REG (x)));
3360 SUBST (SUBREG_REG (x), SUBREG_REG (SUBREG_REG (x)));
3363 /* SUBREG of a hard register => just change the register number
3364 and/or mode. If the hard register is not valid in that mode,
3365 suppress this combination. If the hard register is the stack,
3366 frame, or argument pointer, leave this as a SUBREG. */
3368 if (GET_CODE (SUBREG_REG (x)) == REG
3369 && REGNO (SUBREG_REG (x)) < FIRST_PSEUDO_REGISTER
3370 && REGNO (SUBREG_REG (x)) != FRAME_POINTER_REGNUM
3371 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
3372 && REGNO (SUBREG_REG (x)) != HARD_FRAME_POINTER_REGNUM
3373 #endif
3374 #if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
3375 && REGNO (SUBREG_REG (x)) != ARG_POINTER_REGNUM
3376 #endif
3377 && REGNO (SUBREG_REG (x)) != STACK_POINTER_REGNUM)
3379 if (HARD_REGNO_MODE_OK (REGNO (SUBREG_REG (x)) + SUBREG_WORD (x),
3380 mode))
3381 return gen_rtx (REG, mode,
3382 REGNO (SUBREG_REG (x)) + SUBREG_WORD (x));
3383 else
3384 return gen_rtx (CLOBBER, mode, const0_rtx);
3387 /* For a constant, try to pick up the part we want. Handle a full
3388 word and low-order part. Only do this if we are narrowing
3389 the constant; if it is being widened, we have no idea what
3390 the extra bits will have been set to. */
3392 if (CONSTANT_P (SUBREG_REG (x)) && op0_mode != VOIDmode
3393 && GET_MODE_SIZE (mode) == UNITS_PER_WORD
3394 && GET_MODE_SIZE (op0_mode) > UNITS_PER_WORD
3395 && GET_MODE_CLASS (mode) == MODE_INT)
3397 temp = operand_subword (SUBREG_REG (x), SUBREG_WORD (x),
3398 0, op0_mode);
3399 if (temp)
3400 return temp;
3403 /* If we want a subreg of a constant, at offset 0,
3404 take the low bits. On a little-endian machine, that's
3405 always valid. On a big-endian machine, it's valid
3406 only if the constant's mode fits in one word. Note that we
3407 cannot use subreg_lowpart_p since SUBREG_REG may be VOIDmode. */
3408 if (CONSTANT_P (SUBREG_REG (x))
3409 && ((GET_MODE_SIZE (op0_mode) <= UNITS_PER_WORD
3410 || ! WORDS_BIG_ENDIAN)
3411 ? SUBREG_WORD (x) == 0
3412 : (SUBREG_WORD (x)
3413 == ((GET_MODE_SIZE (op0_mode)
3414 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD))
3415 / UNITS_PER_WORD)))
3416 && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (op0_mode)
3417 && (! WORDS_BIG_ENDIAN
3418 || GET_MODE_BITSIZE (op0_mode) <= BITS_PER_WORD))
3419 return gen_lowpart_for_combine (mode, SUBREG_REG (x));
3421 /* A paradoxical SUBREG of a VOIDmode constant is the same constant,
3422 since we are saying that the high bits don't matter. */
3423 if (CONSTANT_P (SUBREG_REG (x)) && GET_MODE (SUBREG_REG (x)) == VOIDmode
3424 && GET_MODE_SIZE (mode) > GET_MODE_SIZE (op0_mode))
3425 return SUBREG_REG (x);
3427 /* Note that we cannot do any narrowing for non-constants since
3428 we might have been counting on using the fact that some bits were
3429 zero. We now do this in the SET. */
3431 break;
3433 case NOT:
3434 /* (not (plus X -1)) can become (neg X). */
3435 if (GET_CODE (XEXP (x, 0)) == PLUS
3436 && XEXP (XEXP (x, 0), 1) == constm1_rtx)
3437 return gen_rtx_combine (NEG, mode, XEXP (XEXP (x, 0), 0));
3439 /* Similarly, (not (neg X)) is (plus X -1). */
3440 if (GET_CODE (XEXP (x, 0)) == NEG)
3441 return gen_rtx_combine (PLUS, mode, XEXP (XEXP (x, 0), 0),
3442 constm1_rtx);
3444 /* (not (xor X C)) for C constant is (xor X D) with D = ~ C. */
3445 if (GET_CODE (XEXP (x, 0)) == XOR
3446 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
3447 && (temp = simplify_unary_operation (NOT, mode,
3448 XEXP (XEXP (x, 0), 1),
3449 mode)) != 0)
3450 return gen_binary (XOR, mode, XEXP (XEXP (x, 0), 0), temp);
3452 /* (not (ashift 1 X)) is (rotate ~1 X). We used to do this for operands
3453 other than 1, but that is not valid. We could do a similar
3454 simplification for (not (lshiftrt C X)) where C is just the sign bit,
3455 but this doesn't seem common enough to bother with. */
3456 if (GET_CODE (XEXP (x, 0)) == ASHIFT
3457 && XEXP (XEXP (x, 0), 0) == const1_rtx)
3458 return gen_rtx (ROTATE, mode, gen_unary (NOT, mode, mode, const1_rtx),
3459 XEXP (XEXP (x, 0), 1));
3461 if (GET_CODE (XEXP (x, 0)) == SUBREG
3462 && subreg_lowpart_p (XEXP (x, 0))
3463 && (GET_MODE_SIZE (GET_MODE (XEXP (x, 0)))
3464 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (XEXP (x, 0)))))
3465 && GET_CODE (SUBREG_REG (XEXP (x, 0))) == ASHIFT
3466 && XEXP (SUBREG_REG (XEXP (x, 0)), 0) == const1_rtx)
3468 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (XEXP (x, 0)));
3470 x = gen_rtx (ROTATE, inner_mode,
3471 gen_unary (NOT, inner_mode, inner_mode, const1_rtx),
3472 XEXP (SUBREG_REG (XEXP (x, 0)), 1));
3473 return gen_lowpart_for_combine (mode, x);
3476 /* If STORE_FLAG_VALUE is -1, (not (comparison foo bar)) can be done by
3477 reversing the comparison code if valid. */
3478 if (STORE_FLAG_VALUE == -1
3479 && GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) == '<'
3480 && reversible_comparison_p (XEXP (x, 0)))
3481 return gen_rtx_combine (reverse_condition (GET_CODE (XEXP (x, 0))),
3482 mode, XEXP (XEXP (x, 0), 0),
3483 XEXP (XEXP (x, 0), 1));
3485 /* (ashiftrt foo C) where C is the number of bits in FOO minus 1
3486 is (lt foo (const_int 0)) if STORE_FLAG_VALUE is -1, so we can
3487 perform the above simplification. */
3489 if (STORE_FLAG_VALUE == -1
3490 && XEXP (x, 1) == const1_rtx
3491 && GET_CODE (XEXP (x, 0)) == ASHIFTRT
3492 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
3493 && INTVAL (XEXP (XEXP (x, 0), 1)) == GET_MODE_BITSIZE (mode) - 1)
3494 return gen_rtx_combine (GE, mode, XEXP (XEXP (x, 0), 0), const0_rtx);
3496 /* Apply De Morgan's laws to reduce number of patterns for machines
3497 with negating logical insns (and-not, nand, etc.). If result has
3498 only one NOT, put it first, since that is how the patterns are
3499 coded. */
3501 if (GET_CODE (XEXP (x, 0)) == IOR || GET_CODE (XEXP (x, 0)) == AND)
3503 rtx in1 = XEXP (XEXP (x, 0), 0), in2 = XEXP (XEXP (x, 0), 1);
3505 if (GET_CODE (in1) == NOT)
3506 in1 = XEXP (in1, 0);
3507 else
3508 in1 = gen_rtx_combine (NOT, GET_MODE (in1), in1);
3510 if (GET_CODE (in2) == NOT)
3511 in2 = XEXP (in2, 0);
3512 else if (GET_CODE (in2) == CONST_INT
3513 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
3514 in2 = GEN_INT (GET_MODE_MASK (mode) & ~ INTVAL (in2));
3515 else
3516 in2 = gen_rtx_combine (NOT, GET_MODE (in2), in2);
3518 if (GET_CODE (in2) == NOT)
3520 rtx tem = in2;
3521 in2 = in1; in1 = tem;
3524 return gen_rtx_combine (GET_CODE (XEXP (x, 0)) == IOR ? AND : IOR,
3525 mode, in1, in2);
3527 break;
3529 case NEG:
3530 /* (neg (plus X 1)) can become (not X). */
3531 if (GET_CODE (XEXP (x, 0)) == PLUS
3532 && XEXP (XEXP (x, 0), 1) == const1_rtx)
3533 return gen_rtx_combine (NOT, mode, XEXP (XEXP (x, 0), 0));
3535 /* Similarly, (neg (not X)) is (plus X 1). */
3536 if (GET_CODE (XEXP (x, 0)) == NOT)
3537 return plus_constant (XEXP (XEXP (x, 0), 0), 1);
3539 /* (neg (minus X Y)) can become (minus Y X). */
3540 if (GET_CODE (XEXP (x, 0)) == MINUS
3541 && (! FLOAT_MODE_P (mode)
3542 /* x-y != -(y-x) with IEEE floating point. */
3543 || TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
3544 || flag_fast_math))
3545 return gen_binary (MINUS, mode, XEXP (XEXP (x, 0), 1),
3546 XEXP (XEXP (x, 0), 0));
3548 /* (neg (xor A 1)) is (plus A -1) if A is known to be either 0 or 1. */
3549 if (GET_CODE (XEXP (x, 0)) == XOR && XEXP (XEXP (x, 0), 1) == const1_rtx
3550 && nonzero_bits (XEXP (XEXP (x, 0), 0), mode) == 1)
3551 return gen_binary (PLUS, mode, XEXP (XEXP (x, 0), 0), constm1_rtx);
3553 /* NEG commutes with ASHIFT since it is multiplication. Only do this
3554 if we can then eliminate the NEG (e.g.,
3555 if the operand is a constant). */
3557 if (GET_CODE (XEXP (x, 0)) == ASHIFT)
3559 temp = simplify_unary_operation (NEG, mode,
3560 XEXP (XEXP (x, 0), 0), mode);
3561 if (temp)
3563 SUBST (XEXP (XEXP (x, 0), 0), temp);
3564 return XEXP (x, 0);
3568 temp = expand_compound_operation (XEXP (x, 0));
3570 /* For C equal to the width of MODE minus 1, (neg (ashiftrt X C)) can be
3571 replaced by (lshiftrt X C). This will convert
3572 (neg (sign_extract X 1 Y)) to (zero_extract X 1 Y). */
3574 if (GET_CODE (temp) == ASHIFTRT
3575 && GET_CODE (XEXP (temp, 1)) == CONST_INT
3576 && INTVAL (XEXP (temp, 1)) == GET_MODE_BITSIZE (mode) - 1)
3577 return simplify_shift_const (temp, LSHIFTRT, mode, XEXP (temp, 0),
3578 INTVAL (XEXP (temp, 1)));
3580 /* If X has only a single bit that might be nonzero, say, bit I, convert
3581 (neg X) to (ashiftrt (ashift X C-I) C-I) where C is the bitsize of
3582 MODE minus 1. This will convert (neg (zero_extract X 1 Y)) to
3583 (sign_extract X 1 Y). But only do this if TEMP isn't a register
3584 or a SUBREG of one since we'd be making the expression more
3585 complex if it was just a register. */
3587 if (GET_CODE (temp) != REG
3588 && ! (GET_CODE (temp) == SUBREG
3589 && GET_CODE (SUBREG_REG (temp)) == REG)
3590 && (i = exact_log2 (nonzero_bits (temp, mode))) >= 0)
3592 rtx temp1 = simplify_shift_const
3593 (NULL_RTX, ASHIFTRT, mode,
3594 simplify_shift_const (NULL_RTX, ASHIFT, mode, temp,
3595 GET_MODE_BITSIZE (mode) - 1 - i),
3596 GET_MODE_BITSIZE (mode) - 1 - i);
3598 /* If all we did was surround TEMP with the two shifts, we
3599 haven't improved anything, so don't use it. Otherwise,
3600 we are better off with TEMP1. */
3601 if (GET_CODE (temp1) != ASHIFTRT
3602 || GET_CODE (XEXP (temp1, 0)) != ASHIFT
3603 || XEXP (XEXP (temp1, 0), 0) != temp)
3604 return temp1;
3606 break;
3608 case TRUNCATE:
3609 /* We can't handle truncation to a partial integer mode here
3610 because we don't know the real bitsize of the partial
3611 integer mode. */
3612 if (GET_MODE_CLASS (mode) == MODE_PARTIAL_INT)
3613 break;
3615 if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
3616 SUBST (XEXP (x, 0),
3617 force_to_mode (XEXP (x, 0), GET_MODE (XEXP (x, 0)),
3618 GET_MODE_MASK (mode), NULL_RTX, 0));
3620 /* (truncate:SI ({sign,zero}_extend:DI foo:SI)) == foo:SI. */
3621 if ((GET_CODE (XEXP (x, 0)) == SIGN_EXTEND
3622 || GET_CODE (XEXP (x, 0)) == ZERO_EXTEND)
3623 && GET_MODE (XEXP (XEXP (x, 0), 0)) == mode)
3624 return XEXP (XEXP (x, 0), 0);
3626 /* (truncate:SI (OP:DI ({sign,zero}_extend:DI foo:SI))) is
3627 (OP:SI foo:SI) if OP is NEG or ABS. */
3628 if ((GET_CODE (XEXP (x, 0)) == ABS
3629 || GET_CODE (XEXP (x, 0)) == NEG)
3630 && (GET_CODE (XEXP (XEXP (x, 0), 0)) == SIGN_EXTEND
3631 || GET_CODE (XEXP (XEXP (x, 0), 0)) == ZERO_EXTEND)
3632 && GET_MODE (XEXP (XEXP (XEXP (x, 0), 0), 0)) == mode)
3633 return gen_unary (GET_CODE (XEXP (x, 0)), mode, mode,
3634 XEXP (XEXP (XEXP (x, 0), 0), 0));
3636 /* (truncate:SI (subreg:DI (truncate:SI X) 0)) is
3637 (truncate:SI x). */
3638 if (GET_CODE (XEXP (x, 0)) == SUBREG
3639 && GET_CODE (SUBREG_REG (XEXP (x, 0))) == TRUNCATE
3640 && subreg_lowpart_p (XEXP (x, 0)))
3641 return SUBREG_REG (XEXP (x, 0));
3643 /* If we know that the value is already truncated, we can
3644 replace the TRUNCATE with a SUBREG. */
3645 if (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) <= HOST_BITS_PER_WIDE_INT
3646 && (nonzero_bits (XEXP (x, 0), GET_MODE (XEXP (x, 0)))
3647 &~ GET_MODE_MASK (mode)) == 0)
3648 return gen_lowpart_for_combine (mode, XEXP (x, 0));
3650 /* A truncate of a comparison can be replaced with a subreg if
3651 STORE_FLAG_VALUE permits. This is like the previous test,
3652 but it works even if the comparison is done in a mode larger
3653 than HOST_BITS_PER_WIDE_INT. */
3654 if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
3655 && GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) == '<'
3656 && ((HOST_WIDE_INT) STORE_FLAG_VALUE &~ GET_MODE_MASK (mode)) == 0)
3657 return gen_lowpart_for_combine (mode, XEXP (x, 0));
3659 /* Similarly, a truncate of a register whose value is a
3660 comparison can be replaced with a subreg if STORE_FLAG_VALUE
3661 permits. */
3662 if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
3663 && ((HOST_WIDE_INT) STORE_FLAG_VALUE &~ GET_MODE_MASK (mode)) == 0
3664 && (temp = get_last_value (XEXP (x, 0)))
3665 && GET_RTX_CLASS (GET_CODE (temp)) == '<')
3666 return gen_lowpart_for_combine (mode, XEXP (x, 0));
3668 break;
3670 case FLOAT_TRUNCATE:
3671 /* (float_truncate:SF (float_extend:DF foo:SF)) = foo:SF. */
3672 if (GET_CODE (XEXP (x, 0)) == FLOAT_EXTEND
3673 && GET_MODE (XEXP (XEXP (x, 0), 0)) == mode)
3674 return XEXP (XEXP (x, 0), 0);
3676 /* (float_truncate:SF (OP:DF (float_extend:DF foo:sf))) is
3677 (OP:SF foo:SF) if OP is NEG or ABS. */
3678 if ((GET_CODE (XEXP (x, 0)) == ABS
3679 || GET_CODE (XEXP (x, 0)) == NEG)
3680 && GET_CODE (XEXP (XEXP (x, 0), 0)) == FLOAT_EXTEND
3681 && GET_MODE (XEXP (XEXP (XEXP (x, 0), 0), 0)) == mode)
3682 return gen_unary (GET_CODE (XEXP (x, 0)), mode, mode,
3683 XEXP (XEXP (XEXP (x, 0), 0), 0));
3685 /* (float_truncate:SF (subreg:DF (float_truncate:SF X) 0))
3686 is (float_truncate:SF x). */
3687 if (GET_CODE (XEXP (x, 0)) == SUBREG
3688 && subreg_lowpart_p (XEXP (x, 0))
3689 && GET_CODE (SUBREG_REG (XEXP (x, 0))) == FLOAT_TRUNCATE)
3690 return SUBREG_REG (XEXP (x, 0));
3691 break;
3693 #ifdef HAVE_cc0
3694 case COMPARE:
3695 /* Convert (compare FOO (const_int 0)) to FOO unless we aren't
3696 using cc0, in which case we want to leave it as a COMPARE
3697 so we can distinguish it from a register-register-copy. */
3698 if (XEXP (x, 1) == const0_rtx)
3699 return XEXP (x, 0);
3701 /* In IEEE floating point, x-0 is not the same as x. */
3702 if ((TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
3703 || ! FLOAT_MODE_P (GET_MODE (XEXP (x, 0)))
3704 || flag_fast_math)
3705 && XEXP (x, 1) == CONST0_RTX (GET_MODE (XEXP (x, 0))))
3706 return XEXP (x, 0);
3707 break;
3708 #endif
3710 case CONST:
3711 /* (const (const X)) can become (const X). Do it this way rather than
3712 returning the inner CONST since CONST can be shared with a
3713 REG_EQUAL note. */
3714 if (GET_CODE (XEXP (x, 0)) == CONST)
3715 SUBST (XEXP (x, 0), XEXP (XEXP (x, 0), 0));
3716 break;
3718 #ifdef HAVE_lo_sum
3719 case LO_SUM:
3720 /* Convert (lo_sum (high FOO) FOO) to FOO. This is necessary so we
3721 can add in an offset. find_split_point will split this address up
3722 again if it doesn't match. */
3723 if (GET_CODE (XEXP (x, 0)) == HIGH
3724 && rtx_equal_p (XEXP (XEXP (x, 0), 0), XEXP (x, 1)))
3725 return XEXP (x, 1);
3726 break;
3727 #endif
3729 case PLUS:
3730 /* If we have (plus (plus (A const) B)), associate it so that CONST is
3731 outermost. That's because that's the way indexed addresses are
3732 supposed to appear. This code used to check many more cases, but
3733 they are now checked elsewhere. */
3734 if (GET_CODE (XEXP (x, 0)) == PLUS
3735 && CONSTANT_ADDRESS_P (XEXP (XEXP (x, 0), 1)))
3736 return gen_binary (PLUS, mode,
3737 gen_binary (PLUS, mode, XEXP (XEXP (x, 0), 0),
3738 XEXP (x, 1)),
3739 XEXP (XEXP (x, 0), 1));
3741 /* (plus (xor (and <foo> (const_int pow2 - 1)) <c>) <-c>)
3742 when c is (const_int (pow2 + 1) / 2) is a sign extension of a
3743 bit-field and can be replaced by either a sign_extend or a
3744 sign_extract. The `and' may be a zero_extend. */
3745 if (GET_CODE (XEXP (x, 0)) == XOR
3746 && GET_CODE (XEXP (x, 1)) == CONST_INT
3747 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
3748 && INTVAL (XEXP (x, 1)) == - INTVAL (XEXP (XEXP (x, 0), 1))
3749 && (i = exact_log2 (INTVAL (XEXP (XEXP (x, 0), 1)))) >= 0
3750 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
3751 && ((GET_CODE (XEXP (XEXP (x, 0), 0)) == AND
3752 && GET_CODE (XEXP (XEXP (XEXP (x, 0), 0), 1)) == CONST_INT
3753 && (INTVAL (XEXP (XEXP (XEXP (x, 0), 0), 1))
3754 == ((HOST_WIDE_INT) 1 << (i + 1)) - 1))
3755 || (GET_CODE (XEXP (XEXP (x, 0), 0)) == ZERO_EXTEND
3756 && (GET_MODE_BITSIZE (GET_MODE (XEXP (XEXP (XEXP (x, 0), 0), 0)))
3757 == i + 1))))
3758 return simplify_shift_const
3759 (NULL_RTX, ASHIFTRT, mode,
3760 simplify_shift_const (NULL_RTX, ASHIFT, mode,
3761 XEXP (XEXP (XEXP (x, 0), 0), 0),
3762 GET_MODE_BITSIZE (mode) - (i + 1)),
3763 GET_MODE_BITSIZE (mode) - (i + 1));
3765 /* (plus (comparison A B) C) can become (neg (rev-comp A B)) if
3766 C is 1 and STORE_FLAG_VALUE is -1 or if C is -1 and STORE_FLAG_VALUE
3767 is 1. This produces better code than the alternative immediately
3768 below. */
3769 if (GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) == '<'
3770 && reversible_comparison_p (XEXP (x, 0))
3771 && ((STORE_FLAG_VALUE == -1 && XEXP (x, 1) == const1_rtx)
3772 || (STORE_FLAG_VALUE == 1 && XEXP (x, 1) == constm1_rtx)))
3773 return
3774 gen_unary (NEG, mode, mode,
3775 gen_binary (reverse_condition (GET_CODE (XEXP (x, 0))),
3776 mode, XEXP (XEXP (x, 0), 0),
3777 XEXP (XEXP (x, 0), 1)));
3779 /* If only the low-order bit of X is possibly nonzero, (plus x -1)
3780 can become (ashiftrt (ashift (xor x 1) C) C) where C is
3781 the bitsize of the mode - 1. This allows simplification of
3782 "a = (b & 8) == 0;" */
3783 if (XEXP (x, 1) == constm1_rtx
3784 && GET_CODE (XEXP (x, 0)) != REG
3785 && ! (GET_CODE (XEXP (x,0)) == SUBREG
3786 && GET_CODE (SUBREG_REG (XEXP (x, 0))) == REG)
3787 && nonzero_bits (XEXP (x, 0), mode) == 1)
3788 return simplify_shift_const (NULL_RTX, ASHIFTRT, mode,
3789 simplify_shift_const (NULL_RTX, ASHIFT, mode,
3790 gen_rtx_combine (XOR, mode,
3791 XEXP (x, 0), const1_rtx),
3792 GET_MODE_BITSIZE (mode) - 1),
3793 GET_MODE_BITSIZE (mode) - 1);
3795 /* If we are adding two things that have no bits in common, convert
3796 the addition into an IOR. This will often be further simplified,
3797 for example in cases like ((a & 1) + (a & 2)), which can
3798 become a & 3. */
3800 if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
3801 && (nonzero_bits (XEXP (x, 0), mode)
3802 & nonzero_bits (XEXP (x, 1), mode)) == 0)
3803 return gen_binary (IOR, mode, XEXP (x, 0), XEXP (x, 1));
3804 break;
3806 case MINUS:
3807 /* If STORE_FLAG_VALUE is 1, (minus 1 (comparison foo bar)) can be done
3808 by reversing the comparison code if valid. */
3809 if (STORE_FLAG_VALUE == 1
3810 && XEXP (x, 0) == const1_rtx
3811 && GET_RTX_CLASS (GET_CODE (XEXP (x, 1))) == '<'
3812 && reversible_comparison_p (XEXP (x, 1)))
3813 return gen_binary (reverse_condition (GET_CODE (XEXP (x, 1))),
3814 mode, XEXP (XEXP (x, 1), 0),
3815 XEXP (XEXP (x, 1), 1));
3817 /* (minus <foo> (and <foo> (const_int -pow2))) becomes
3818 (and <foo> (const_int pow2-1)) */
3819 if (GET_CODE (XEXP (x, 1)) == AND
3820 && GET_CODE (XEXP (XEXP (x, 1), 1)) == CONST_INT
3821 && exact_log2 (- INTVAL (XEXP (XEXP (x, 1), 1))) >= 0
3822 && rtx_equal_p (XEXP (XEXP (x, 1), 0), XEXP (x, 0)))
3823 return simplify_and_const_int (NULL_RTX, mode, XEXP (x, 0),
3824 - INTVAL (XEXP (XEXP (x, 1), 1)) - 1);
3826 /* Canonicalize (minus A (plus B C)) to (minus (minus A B) C) for
3827 integers. */
3828 if (GET_CODE (XEXP (x, 1)) == PLUS && INTEGRAL_MODE_P (mode))
3829 return gen_binary (MINUS, mode,
3830 gen_binary (MINUS, mode, XEXP (x, 0),
3831 XEXP (XEXP (x, 1), 0)),
3832 XEXP (XEXP (x, 1), 1));
3833 break;
3835 case MULT:
3836 /* If we have (mult (plus A B) C), apply the distributive law and then
3837 the inverse distributive law to see if things simplify. This
3838 occurs mostly in addresses, often when unrolling loops. */
3840 if (GET_CODE (XEXP (x, 0)) == PLUS)
3842 x = apply_distributive_law
3843 (gen_binary (PLUS, mode,
3844 gen_binary (MULT, mode,
3845 XEXP (XEXP (x, 0), 0), XEXP (x, 1)),
3846 gen_binary (MULT, mode,
3847 XEXP (XEXP (x, 0), 1), XEXP (x, 1))));
3849 if (GET_CODE (x) != MULT)
3850 return x;
3852 break;
3854 case UDIV:
3855 /* If this is a divide by a power of two, treat it as a shift if
3856 its first operand is a shift. */
3857 if (GET_CODE (XEXP (x, 1)) == CONST_INT
3858 && (i = exact_log2 (INTVAL (XEXP (x, 1)))) >= 0
3859 && (GET_CODE (XEXP (x, 0)) == ASHIFT
3860 || GET_CODE (XEXP (x, 0)) == LSHIFTRT
3861 || GET_CODE (XEXP (x, 0)) == ASHIFTRT
3862 || GET_CODE (XEXP (x, 0)) == ROTATE
3863 || GET_CODE (XEXP (x, 0)) == ROTATERT))
3864 return simplify_shift_const (NULL_RTX, LSHIFTRT, mode, XEXP (x, 0), i);
3865 break;
3867 case EQ: case NE:
3868 case GT: case GTU: case GE: case GEU:
3869 case LT: case LTU: case LE: case LEU:
3870 /* If the first operand is a condition code, we can't do anything
3871 with it. */
3872 if (GET_CODE (XEXP (x, 0)) == COMPARE
3873 || (GET_MODE_CLASS (GET_MODE (XEXP (x, 0))) != MODE_CC
3874 #ifdef HAVE_cc0
3875 && XEXP (x, 0) != cc0_rtx
3876 #endif
3879 rtx op0 = XEXP (x, 0);
3880 rtx op1 = XEXP (x, 1);
3881 enum rtx_code new_code;
3883 if (GET_CODE (op0) == COMPARE)
3884 op1 = XEXP (op0, 1), op0 = XEXP (op0, 0);
3886 /* Simplify our comparison, if possible. */
3887 new_code = simplify_comparison (code, &op0, &op1);
3889 /* If STORE_FLAG_VALUE is 1, we can convert (ne x 0) to simply X
3890 if only the low-order bit is possibly nonzero in X (such as when
3891 X is a ZERO_EXTRACT of one bit). Similarly, we can convert EQ to
3892 (xor X 1) or (minus 1 X); we use the former. Finally, if X is
3893 known to be either 0 or -1, NE becomes a NEG and EQ becomes
3894 (plus X 1).
3896 Remove any ZERO_EXTRACT we made when thinking this was a
3897 comparison. It may now be simpler to use, e.g., an AND. If a
3898 ZERO_EXTRACT is indeed appropriate, it will be placed back by
3899 the call to make_compound_operation in the SET case. */
3901 if (STORE_FLAG_VALUE == 1
3902 && new_code == NE && GET_MODE_CLASS (mode) == MODE_INT
3903 && op1 == const0_rtx && nonzero_bits (op0, mode) == 1)
3904 return gen_lowpart_for_combine (mode,
3905 expand_compound_operation (op0));
3907 else if (STORE_FLAG_VALUE == 1
3908 && new_code == NE && GET_MODE_CLASS (mode) == MODE_INT
3909 && op1 == const0_rtx
3910 && (num_sign_bit_copies (op0, mode)
3911 == GET_MODE_BITSIZE (mode)))
3913 op0 = expand_compound_operation (op0);
3914 return gen_unary (NEG, mode, mode,
3915 gen_lowpart_for_combine (mode, op0));
3918 else if (STORE_FLAG_VALUE == 1
3919 && new_code == EQ && GET_MODE_CLASS (mode) == MODE_INT
3920 && op1 == const0_rtx
3921 && nonzero_bits (op0, mode) == 1)
3923 op0 = expand_compound_operation (op0);
3924 return gen_binary (XOR, mode,
3925 gen_lowpart_for_combine (mode, op0),
3926 const1_rtx);
3929 else if (STORE_FLAG_VALUE == 1
3930 && new_code == EQ && GET_MODE_CLASS (mode) == MODE_INT
3931 && op1 == const0_rtx
3932 && (num_sign_bit_copies (op0, mode)
3933 == GET_MODE_BITSIZE (mode)))
3935 op0 = expand_compound_operation (op0);
3936 return plus_constant (gen_lowpart_for_combine (mode, op0), 1);
3939 /* If STORE_FLAG_VALUE is -1, we have cases similar to
3940 those above. */
3941 if (STORE_FLAG_VALUE == -1
3942 && new_code == NE && GET_MODE_CLASS (mode) == MODE_INT
3943 && op1 == const0_rtx
3944 && (num_sign_bit_copies (op0, mode)
3945 == GET_MODE_BITSIZE (mode)))
3946 return gen_lowpart_for_combine (mode,
3947 expand_compound_operation (op0));
3949 else if (STORE_FLAG_VALUE == -1
3950 && new_code == NE && GET_MODE_CLASS (mode) == MODE_INT
3951 && op1 == const0_rtx
3952 && nonzero_bits (op0, mode) == 1)
3954 op0 = expand_compound_operation (op0);
3955 return gen_unary (NEG, mode, mode,
3956 gen_lowpart_for_combine (mode, op0));
3959 else if (STORE_FLAG_VALUE == -1
3960 && new_code == EQ && GET_MODE_CLASS (mode) == MODE_INT
3961 && op1 == const0_rtx
3962 && (num_sign_bit_copies (op0, mode)
3963 == GET_MODE_BITSIZE (mode)))
3965 op0 = expand_compound_operation (op0);
3966 return gen_unary (NOT, mode, mode,
3967 gen_lowpart_for_combine (mode, op0));
3970 /* If X is 0/1, (eq X 0) is X-1. */
3971 else if (STORE_FLAG_VALUE == -1
3972 && new_code == EQ && GET_MODE_CLASS (mode) == MODE_INT
3973 && op1 == const0_rtx
3974 && nonzero_bits (op0, mode) == 1)
3976 op0 = expand_compound_operation (op0);
3977 return plus_constant (gen_lowpart_for_combine (mode, op0), -1);
3980 /* If STORE_FLAG_VALUE says to just test the sign bit and X has just
3981 one bit that might be nonzero, we can convert (ne x 0) to
3982 (ashift x c) where C puts the bit in the sign bit. Remove any
3983 AND with STORE_FLAG_VALUE when we are done, since we are only
3984 going to test the sign bit. */
3985 if (new_code == NE && GET_MODE_CLASS (mode) == MODE_INT
3986 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
3987 && ((STORE_FLAG_VALUE & GET_MODE_MASK (mode))
3988 == (HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (mode) - 1))
3989 && op1 == const0_rtx
3990 && mode == GET_MODE (op0)
3991 && (i = exact_log2 (nonzero_bits (op0, mode))) >= 0)
3993 x = simplify_shift_const (NULL_RTX, ASHIFT, mode,
3994 expand_compound_operation (op0),
3995 GET_MODE_BITSIZE (mode) - 1 - i);
3996 if (GET_CODE (x) == AND && XEXP (x, 1) == const_true_rtx)
3997 return XEXP (x, 0);
3998 else
3999 return x;
4002 /* If the code changed, return a whole new comparison. */
4003 if (new_code != code)
4004 return gen_rtx_combine (new_code, mode, op0, op1);
4006 /* Otherwise, keep this operation, but maybe change its operands.
4007 This also converts (ne (compare FOO BAR) 0) to (ne FOO BAR). */
4008 SUBST (XEXP (x, 0), op0);
4009 SUBST (XEXP (x, 1), op1);
4011 break;
4013 case IF_THEN_ELSE:
4014 return simplify_if_then_else (x);
4016 case ZERO_EXTRACT:
4017 case SIGN_EXTRACT:
4018 case ZERO_EXTEND:
4019 case SIGN_EXTEND:
4020 /* If we are processing SET_DEST, we are done. */
4021 if (in_dest)
4022 return x;
4024 return expand_compound_operation (x);
4026 case SET:
4027 return simplify_set (x);
4029 case AND:
4030 case IOR:
4031 case XOR:
4032 return simplify_logical (x, last);
4034 case ABS:
4035 /* (abs (neg <foo>)) -> (abs <foo>) */
4036 if (GET_CODE (XEXP (x, 0)) == NEG)
4037 SUBST (XEXP (x, 0), XEXP (XEXP (x, 0), 0));
4039 /* If the mode of the operand is VOIDmode (i.e. if it is ASM_OPERANDS),
4040 do nothing. */
4041 if (GET_MODE (XEXP (x, 0)) == VOIDmode)
4042 break;
4044 /* If operand is something known to be positive, ignore the ABS. */
4045 if (GET_CODE (XEXP (x, 0)) == FFS || GET_CODE (XEXP (x, 0)) == ABS
4046 || ((GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
4047 <= HOST_BITS_PER_WIDE_INT)
4048 && ((nonzero_bits (XEXP (x, 0), GET_MODE (XEXP (x, 0)))
4049 & ((HOST_WIDE_INT) 1
4050 << (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) - 1)))
4051 == 0)))
4052 return XEXP (x, 0);
4055 /* If operand is known to be only -1 or 0, convert ABS to NEG. */
4056 if (num_sign_bit_copies (XEXP (x, 0), mode) == GET_MODE_BITSIZE (mode))
4057 return gen_rtx_combine (NEG, mode, XEXP (x, 0));
4059 break;
4061 case FFS:
4062 /* (ffs (*_extend <X>)) = (ffs <X>) */
4063 if (GET_CODE (XEXP (x, 0)) == SIGN_EXTEND
4064 || GET_CODE (XEXP (x, 0)) == ZERO_EXTEND)
4065 SUBST (XEXP (x, 0), XEXP (XEXP (x, 0), 0));
4066 break;
4068 case FLOAT:
4069 /* (float (sign_extend <X>)) = (float <X>). */
4070 if (GET_CODE (XEXP (x, 0)) == SIGN_EXTEND)
4071 SUBST (XEXP (x, 0), XEXP (XEXP (x, 0), 0));
4072 break;
4074 case ASHIFT:
4075 case LSHIFTRT:
4076 case ASHIFTRT:
4077 case ROTATE:
4078 case ROTATERT:
4079 /* If this is a shift by a constant amount, simplify it. */
4080 if (GET_CODE (XEXP (x, 1)) == CONST_INT)
4081 return simplify_shift_const (x, code, mode, XEXP (x, 0),
4082 INTVAL (XEXP (x, 1)));
4084 #ifdef SHIFT_COUNT_TRUNCATED
4085 else if (SHIFT_COUNT_TRUNCATED && GET_CODE (XEXP (x, 1)) != REG)
4086 SUBST (XEXP (x, 1),
4087 force_to_mode (XEXP (x, 1), GET_MODE (x),
4088 ((HOST_WIDE_INT) 1
4089 << exact_log2 (GET_MODE_BITSIZE (GET_MODE (x))))
4090 - 1,
4091 NULL_RTX, 0));
4092 #endif
4094 break;
4097 return x;
4100 /* Simplify X, an IF_THEN_ELSE expression. Return the new expression. */
4102 static rtx
4103 simplify_if_then_else (x)
4104 rtx x;
4106 enum machine_mode mode = GET_MODE (x);
4107 rtx cond = XEXP (x, 0);
4108 rtx true = XEXP (x, 1);
4109 rtx false = XEXP (x, 2);
4110 enum rtx_code true_code = GET_CODE (cond);
4111 int comparison_p = GET_RTX_CLASS (true_code) == '<';
4112 rtx temp;
4113 int i;
4115 /* Simplify storing of the truth value. */
4116 if (comparison_p && true == const_true_rtx && false == const0_rtx)
4117 return gen_binary (true_code, mode, XEXP (cond, 0), XEXP (cond, 1));
4119 /* Also when the truth value has to be reversed. */
4120 if (comparison_p && reversible_comparison_p (cond)
4121 && true == const0_rtx && false == const_true_rtx)
4122 return gen_binary (reverse_condition (true_code),
4123 mode, XEXP (cond, 0), XEXP (cond, 1));
4125 /* Sometimes we can simplify the arm of an IF_THEN_ELSE if a register used
4126 in it is being compared against certain values. Get the true and false
4127 comparisons and see if that says anything about the value of each arm. */
4129 if (comparison_p && reversible_comparison_p (cond)
4130 && GET_CODE (XEXP (cond, 0)) == REG)
4132 HOST_WIDE_INT nzb;
4133 rtx from = XEXP (cond, 0);
4134 enum rtx_code false_code = reverse_condition (true_code);
4135 rtx true_val = XEXP (cond, 1);
4136 rtx false_val = true_val;
4137 int swapped = 0;
4139 /* If FALSE_CODE is EQ, swap the codes and arms. */
4141 if (false_code == EQ)
4143 swapped = 1, true_code = EQ, false_code = NE;
4144 temp = true, true = false, false = temp;
4147 /* If we are comparing against zero and the expression being tested has
4148 only a single bit that might be nonzero, that is its value when it is
4149 not equal to zero. Similarly if it is known to be -1 or 0. */
4151 if (true_code == EQ && true_val == const0_rtx
4152 && exact_log2 (nzb = nonzero_bits (from, GET_MODE (from))) >= 0)
4153 false_code = EQ, false_val = GEN_INT (nzb);
4154 else if (true_code == EQ && true_val == const0_rtx
4155 && (num_sign_bit_copies (from, GET_MODE (from))
4156 == GET_MODE_BITSIZE (GET_MODE (from))))
4157 false_code = EQ, false_val = constm1_rtx;
4159 /* Now simplify an arm if we know the value of the register in the
4160 branch and it is used in the arm. Be careful due to the potential
4161 of locally-shared RTL. */
4163 if (reg_mentioned_p (from, true))
4164 true = subst (known_cond (copy_rtx (true), true_code, from, true_val),
4165 pc_rtx, pc_rtx, 0, 0);
4166 if (reg_mentioned_p (from, false))
4167 false = subst (known_cond (copy_rtx (false), false_code,
4168 from, false_val),
4169 pc_rtx, pc_rtx, 0, 0);
4171 SUBST (XEXP (x, 1), swapped ? false : true);
4172 SUBST (XEXP (x, 2), swapped ? true : false);
4174 true = XEXP (x, 1), false = XEXP (x, 2), true_code = GET_CODE (cond);
4177 /* If we have (if_then_else FOO (pc) (label_ref BAR)) and FOO can be
4178 reversed, do so to avoid needing two sets of patterns for
4179 subtract-and-branch insns. Similarly if we have a constant in the true
4180 arm, the false arm is the same as the first operand of the comparison, or
4181 the false arm is more complicated than the true arm. */
4183 if (comparison_p && reversible_comparison_p (cond)
4184 && (true == pc_rtx
4185 || (CONSTANT_P (true)
4186 && GET_CODE (false) != CONST_INT && false != pc_rtx)
4187 || true == const0_rtx
4188 || (GET_RTX_CLASS (GET_CODE (true)) == 'o'
4189 && GET_RTX_CLASS (GET_CODE (false)) != 'o')
4190 || (GET_CODE (true) == SUBREG
4191 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (true))) == 'o'
4192 && GET_RTX_CLASS (GET_CODE (false)) != 'o')
4193 || reg_mentioned_p (true, false)
4194 || rtx_equal_p (false, XEXP (cond, 0))))
4196 true_code = reverse_condition (true_code);
4197 SUBST (XEXP (x, 0),
4198 gen_binary (true_code, GET_MODE (cond), XEXP (cond, 0),
4199 XEXP (cond, 1)));
4201 SUBST (XEXP (x, 1), false);
4202 SUBST (XEXP (x, 2), true);
4204 temp = true, true = false, false = temp, cond = XEXP (x, 0);
4206 /* It is possible that the conditional has been simplified out. */
4207 true_code = GET_CODE (cond);
4208 comparison_p = GET_RTX_CLASS (true_code) == '<';
4211 /* If the two arms are identical, we don't need the comparison. */
4213 if (rtx_equal_p (true, false) && ! side_effects_p (cond))
4214 return true;
4216 /* Convert a == b ? b : a to "a". */
4217 if (true_code == EQ && ! side_effects_p (cond)
4218 && rtx_equal_p (XEXP (cond, 0), false)
4219 && rtx_equal_p (XEXP (cond, 1), true))
4220 return false;
4221 else if (true_code == NE && ! side_effects_p (cond)
4222 && rtx_equal_p (XEXP (cond, 0), true)
4223 && rtx_equal_p (XEXP (cond, 1), false))
4224 return true;
4226 /* Look for cases where we have (abs x) or (neg (abs X)). */
4228 if (GET_MODE_CLASS (mode) == MODE_INT
4229 && GET_CODE (false) == NEG
4230 && rtx_equal_p (true, XEXP (false, 0))
4231 && comparison_p
4232 && rtx_equal_p (true, XEXP (cond, 0))
4233 && ! side_effects_p (true))
4234 switch (true_code)
4236 case GT:
4237 case GE:
4238 return gen_unary (ABS, mode, mode, true);
4239 case LT:
4240 case LE:
4241 return gen_unary (NEG, mode, mode, gen_unary (ABS, mode, mode, true));
4244 /* Look for MIN or MAX. */
4246 if ((! FLOAT_MODE_P (mode) || flag_fast_math)
4247 && comparison_p
4248 && rtx_equal_p (XEXP (cond, 0), true)
4249 && rtx_equal_p (XEXP (cond, 1), false)
4250 && ! side_effects_p (cond))
4251 switch (true_code)
4253 case GE:
4254 case GT:
4255 return gen_binary (SMAX, mode, true, false);
4256 case LE:
4257 case LT:
4258 return gen_binary (SMIN, mode, true, false);
4259 case GEU:
4260 case GTU:
4261 return gen_binary (UMAX, mode, true, false);
4262 case LEU:
4263 case LTU:
4264 return gen_binary (UMIN, mode, true, false);
4267 /* If we have (if_then_else COND (OP Z C1) Z) and OP is an identity when its
4268 second operand is zero, this can be done as (OP Z (mult COND C2)) where
4269 C2 = C1 * STORE_FLAG_VALUE. Similarly if OP has an outer ZERO_EXTEND or
4270 SIGN_EXTEND as long as Z is already extended (so we don't destroy it).
4271 We can do this kind of thing in some cases when STORE_FLAG_VALUE is
4272 neither 1 or -1, but it isn't worth checking for. */
4274 if ((STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1)
4275 && comparison_p && mode != VOIDmode && ! side_effects_p (x))
4277 rtx t = make_compound_operation (true, SET);
4278 rtx f = make_compound_operation (false, SET);
4279 rtx cond_op0 = XEXP (cond, 0);
4280 rtx cond_op1 = XEXP (cond, 1);
4281 enum rtx_code op, extend_op = NIL;
4282 enum machine_mode m = mode;
4283 rtx z = 0, c1;
4285 if ((GET_CODE (t) == PLUS || GET_CODE (t) == MINUS
4286 || GET_CODE (t) == IOR || GET_CODE (t) == XOR
4287 || GET_CODE (t) == ASHIFT
4288 || GET_CODE (t) == LSHIFTRT || GET_CODE (t) == ASHIFTRT)
4289 && rtx_equal_p (XEXP (t, 0), f))
4290 c1 = XEXP (t, 1), op = GET_CODE (t), z = f;
4292 /* If an identity-zero op is commutative, check whether there
4293 would be a match if we swapped the operands. */
4294 else if ((GET_CODE (t) == PLUS || GET_CODE (t) == IOR
4295 || GET_CODE (t) == XOR)
4296 && rtx_equal_p (XEXP (t, 1), f))
4297 c1 = XEXP (t, 0), op = GET_CODE (t), z = f;
4298 else if (GET_CODE (t) == SIGN_EXTEND
4299 && (GET_CODE (XEXP (t, 0)) == PLUS
4300 || GET_CODE (XEXP (t, 0)) == MINUS
4301 || GET_CODE (XEXP (t, 0)) == IOR
4302 || GET_CODE (XEXP (t, 0)) == XOR
4303 || GET_CODE (XEXP (t, 0)) == ASHIFT
4304 || GET_CODE (XEXP (t, 0)) == LSHIFTRT
4305 || GET_CODE (XEXP (t, 0)) == ASHIFTRT)
4306 && GET_CODE (XEXP (XEXP (t, 0), 0)) == SUBREG
4307 && subreg_lowpart_p (XEXP (XEXP (t, 0), 0))
4308 && rtx_equal_p (SUBREG_REG (XEXP (XEXP (t, 0), 0)), f)
4309 && (num_sign_bit_copies (f, GET_MODE (f))
4310 > (GET_MODE_BITSIZE (mode)
4311 - GET_MODE_BITSIZE (GET_MODE (XEXP (XEXP (t, 0), 0))))))
4313 c1 = XEXP (XEXP (t, 0), 1); z = f; op = GET_CODE (XEXP (t, 0));
4314 extend_op = SIGN_EXTEND;
4315 m = GET_MODE (XEXP (t, 0));
4317 else if (GET_CODE (t) == SIGN_EXTEND
4318 && (GET_CODE (XEXP (t, 0)) == PLUS
4319 || GET_CODE (XEXP (t, 0)) == IOR
4320 || GET_CODE (XEXP (t, 0)) == XOR)
4321 && GET_CODE (XEXP (XEXP (t, 0), 1)) == SUBREG
4322 && subreg_lowpart_p (XEXP (XEXP (t, 0), 1))
4323 && rtx_equal_p (SUBREG_REG (XEXP (XEXP (t, 0), 1)), f)
4324 && (num_sign_bit_copies (f, GET_MODE (f))
4325 > (GET_MODE_BITSIZE (mode)
4326 - GET_MODE_BITSIZE (GET_MODE (XEXP (XEXP (t, 0), 1))))))
4328 c1 = XEXP (XEXP (t, 0), 0); z = f; op = GET_CODE (XEXP (t, 0));
4329 extend_op = SIGN_EXTEND;
4330 m = GET_MODE (XEXP (t, 0));
4332 else if (GET_CODE (t) == ZERO_EXTEND
4333 && (GET_CODE (XEXP (t, 0)) == PLUS
4334 || GET_CODE (XEXP (t, 0)) == MINUS
4335 || GET_CODE (XEXP (t, 0)) == IOR
4336 || GET_CODE (XEXP (t, 0)) == XOR
4337 || GET_CODE (XEXP (t, 0)) == ASHIFT
4338 || GET_CODE (XEXP (t, 0)) == LSHIFTRT
4339 || GET_CODE (XEXP (t, 0)) == ASHIFTRT)
4340 && GET_CODE (XEXP (XEXP (t, 0), 0)) == SUBREG
4341 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
4342 && subreg_lowpart_p (XEXP (XEXP (t, 0), 0))
4343 && rtx_equal_p (SUBREG_REG (XEXP (XEXP (t, 0), 0)), f)
4344 && ((nonzero_bits (f, GET_MODE (f))
4345 & ~ GET_MODE_MASK (GET_MODE (XEXP (XEXP (t, 0), 0))))
4346 == 0))
4348 c1 = XEXP (XEXP (t, 0), 1); z = f; op = GET_CODE (XEXP (t, 0));
4349 extend_op = ZERO_EXTEND;
4350 m = GET_MODE (XEXP (t, 0));
4352 else if (GET_CODE (t) == ZERO_EXTEND
4353 && (GET_CODE (XEXP (t, 0)) == PLUS
4354 || GET_CODE (XEXP (t, 0)) == IOR
4355 || GET_CODE (XEXP (t, 0)) == XOR)
4356 && GET_CODE (XEXP (XEXP (t, 0), 1)) == SUBREG
4357 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
4358 && subreg_lowpart_p (XEXP (XEXP (t, 0), 1))
4359 && rtx_equal_p (SUBREG_REG (XEXP (XEXP (t, 0), 1)), f)
4360 && ((nonzero_bits (f, GET_MODE (f))
4361 & ~ GET_MODE_MASK (GET_MODE (XEXP (XEXP (t, 0), 1))))
4362 == 0))
4364 c1 = XEXP (XEXP (t, 0), 0); z = f; op = GET_CODE (XEXP (t, 0));
4365 extend_op = ZERO_EXTEND;
4366 m = GET_MODE (XEXP (t, 0));
4369 if (z)
4371 temp = subst (gen_binary (true_code, m, cond_op0, cond_op1),
4372 pc_rtx, pc_rtx, 0, 0);
4373 temp = gen_binary (MULT, m, temp,
4374 gen_binary (MULT, m, c1, const_true_rtx));
4375 temp = subst (temp, pc_rtx, pc_rtx, 0, 0);
4376 temp = gen_binary (op, m, gen_lowpart_for_combine (m, z), temp);
4378 if (extend_op != NIL)
4379 temp = gen_unary (extend_op, mode, m, temp);
4381 return temp;
4385 /* If we have (if_then_else (ne A 0) C1 0) and either A is known to be 0 or
4386 1 and C1 is a single bit or A is known to be 0 or -1 and C1 is the
4387 negation of a single bit, we can convert this operation to a shift. We
4388 can actually do this more generally, but it doesn't seem worth it. */
4390 if (true_code == NE && XEXP (cond, 1) == const0_rtx
4391 && false == const0_rtx && GET_CODE (true) == CONST_INT
4392 && ((1 == nonzero_bits (XEXP (cond, 0), mode)
4393 && (i = exact_log2 (INTVAL (true))) >= 0)
4394 || ((num_sign_bit_copies (XEXP (cond, 0), mode)
4395 == GET_MODE_BITSIZE (mode))
4396 && (i = exact_log2 (- INTVAL (true))) >= 0)))
4397 return
4398 simplify_shift_const (NULL_RTX, ASHIFT, mode,
4399 gen_lowpart_for_combine (mode, XEXP (cond, 0)), i);
4401 return x;
4404 /* Simplify X, a SET expression. Return the new expression. */
4406 static rtx
4407 simplify_set (x)
4408 rtx x;
4410 rtx src = SET_SRC (x);
4411 rtx dest = SET_DEST (x);
4412 enum machine_mode mode
4413 = GET_MODE (src) != VOIDmode ? GET_MODE (src) : GET_MODE (dest);
4414 rtx other_insn;
4415 rtx *cc_use;
4417 /* (set (pc) (return)) gets written as (return). */
4418 if (GET_CODE (dest) == PC && GET_CODE (src) == RETURN)
4419 return src;
4421 /* Now that we know for sure which bits of SRC we are using, see if we can
4422 simplify the expression for the object knowing that we only need the
4423 low-order bits. */
4425 if (GET_MODE_CLASS (mode) == MODE_INT)
4426 src = force_to_mode (src, mode, GET_MODE_MASK (mode), NULL_RTX, 0);
4428 /* If we are setting CC0 or if the source is a COMPARE, look for the use of
4429 the comparison result and try to simplify it unless we already have used
4430 undobuf.other_insn. */
4431 if ((GET_CODE (src) == COMPARE
4432 #ifdef HAVE_cc0
4433 || dest == cc0_rtx
4434 #endif
4436 && (cc_use = find_single_use (dest, subst_insn, &other_insn)) != 0
4437 && (undobuf.other_insn == 0 || other_insn == undobuf.other_insn)
4438 && GET_RTX_CLASS (GET_CODE (*cc_use)) == '<'
4439 && rtx_equal_p (XEXP (*cc_use, 0), dest))
4441 enum rtx_code old_code = GET_CODE (*cc_use);
4442 enum rtx_code new_code;
4443 rtx op0, op1;
4444 int other_changed = 0;
4445 enum machine_mode compare_mode = GET_MODE (dest);
4447 if (GET_CODE (src) == COMPARE)
4448 op0 = XEXP (src, 0), op1 = XEXP (src, 1);
4449 else
4450 op0 = src, op1 = const0_rtx;
4452 /* Simplify our comparison, if possible. */
4453 new_code = simplify_comparison (old_code, &op0, &op1);
4455 #ifdef EXTRA_CC_MODES
4456 /* If this machine has CC modes other than CCmode, check to see if we
4457 need to use a different CC mode here. */
4458 compare_mode = SELECT_CC_MODE (new_code, op0, op1);
4459 #endif /* EXTRA_CC_MODES */
4461 #if !defined (HAVE_cc0) && defined (EXTRA_CC_MODES)
4462 /* If the mode changed, we have to change SET_DEST, the mode in the
4463 compare, and the mode in the place SET_DEST is used. If SET_DEST is
4464 a hard register, just build new versions with the proper mode. If it
4465 is a pseudo, we lose unless it is only time we set the pseudo, in
4466 which case we can safely change its mode. */
4467 if (compare_mode != GET_MODE (dest))
4469 int regno = REGNO (dest);
4470 rtx new_dest = gen_rtx (REG, compare_mode, regno);
4472 if (regno < FIRST_PSEUDO_REGISTER
4473 || (REG_N_SETS (regno) == 1 && ! REG_USERVAR_P (dest)))
4475 if (regno >= FIRST_PSEUDO_REGISTER)
4476 SUBST (regno_reg_rtx[regno], new_dest);
4478 SUBST (SET_DEST (x), new_dest);
4479 SUBST (XEXP (*cc_use, 0), new_dest);
4480 other_changed = 1;
4482 dest = new_dest;
4485 #endif
4487 /* If the code changed, we have to build a new comparison in
4488 undobuf.other_insn. */
4489 if (new_code != old_code)
4491 unsigned HOST_WIDE_INT mask;
4493 SUBST (*cc_use, gen_rtx_combine (new_code, GET_MODE (*cc_use),
4494 dest, const0_rtx));
4496 /* If the only change we made was to change an EQ into an NE or
4497 vice versa, OP0 has only one bit that might be nonzero, and OP1
4498 is zero, check if changing the user of the condition code will
4499 produce a valid insn. If it won't, we can keep the original code
4500 in that insn by surrounding our operation with an XOR. */
4502 if (((old_code == NE && new_code == EQ)
4503 || (old_code == EQ && new_code == NE))
4504 && ! other_changed && op1 == const0_rtx
4505 && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT
4506 && exact_log2 (mask = nonzero_bits (op0, GET_MODE (op0))) >= 0)
4508 rtx pat = PATTERN (other_insn), note = 0;
4509 int scratches;
4511 if ((recog_for_combine (&pat, other_insn, &note, &scratches) < 0
4512 && ! check_asm_operands (pat)))
4514 PUT_CODE (*cc_use, old_code);
4515 other_insn = 0;
4517 op0 = gen_binary (XOR, GET_MODE (op0), op0, GEN_INT (mask));
4521 other_changed = 1;
4524 if (other_changed)
4525 undobuf.other_insn = other_insn;
4527 #ifdef HAVE_cc0
4528 /* If we are now comparing against zero, change our source if
4529 needed. If we do not use cc0, we always have a COMPARE. */
4530 if (op1 == const0_rtx && dest == cc0_rtx)
4532 SUBST (SET_SRC (x), op0);
4533 src = op0;
4535 else
4536 #endif
4538 /* Otherwise, if we didn't previously have a COMPARE in the
4539 correct mode, we need one. */
4540 if (GET_CODE (src) != COMPARE || GET_MODE (src) != compare_mode)
4542 SUBST (SET_SRC (x),
4543 gen_rtx_combine (COMPARE, compare_mode, op0, op1));
4544 src = SET_SRC (x);
4546 else
4548 /* Otherwise, update the COMPARE if needed. */
4549 SUBST (XEXP (src, 0), op0);
4550 SUBST (XEXP (src, 1), op1);
4553 else
4555 /* Get SET_SRC in a form where we have placed back any
4556 compound expressions. Then do the checks below. */
4557 src = make_compound_operation (src, SET);
4558 SUBST (SET_SRC (x), src);
4561 /* If we have (set x (subreg:m1 (op:m2 ...) 0)) with OP being some operation,
4562 and X being a REG or (subreg (reg)), we may be able to convert this to
4563 (set (subreg:m2 x) (op)).
4565 We can always do this if M1 is narrower than M2 because that means that
4566 we only care about the low bits of the result.
4568 However, on machines without WORD_REGISTER_OPERATIONS defined, we cannot
4569 perform a narrower operation that requested since the high-order bits will
4570 be undefined. On machine where it is defined, this transformation is safe
4571 as long as M1 and M2 have the same number of words. */
4573 if (GET_CODE (src) == SUBREG && subreg_lowpart_p (src)
4574 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (src))) != 'o'
4575 && (((GET_MODE_SIZE (GET_MODE (src)) + (UNITS_PER_WORD - 1))
4576 / UNITS_PER_WORD)
4577 == ((GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))
4578 + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD))
4579 #ifndef WORD_REGISTER_OPERATIONS
4580 && (GET_MODE_SIZE (GET_MODE (src))
4581 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (src))))
4582 #endif
4583 #ifdef CLASS_CANNOT_CHANGE_SIZE
4584 && ! (GET_CODE (dest) == REG && REGNO (dest) < FIRST_PSEUDO_REGISTER
4585 && (TEST_HARD_REG_BIT
4586 (reg_class_contents[(int) CLASS_CANNOT_CHANGE_SIZE],
4587 REGNO (dest)))
4588 && (GET_MODE_SIZE (GET_MODE (src))
4589 != GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))))
4590 #endif
4591 && (GET_CODE (dest) == REG
4592 || (GET_CODE (dest) == SUBREG
4593 && GET_CODE (SUBREG_REG (dest)) == REG)))
4595 SUBST (SET_DEST (x),
4596 gen_lowpart_for_combine (GET_MODE (SUBREG_REG (src)),
4597 dest));
4598 SUBST (SET_SRC (x), SUBREG_REG (src));
4600 src = SET_SRC (x), dest = SET_DEST (x);
4603 #ifdef LOAD_EXTEND_OP
4604 /* If we have (set FOO (subreg:M (mem:N BAR) 0)) with M wider than N, this
4605 would require a paradoxical subreg. Replace the subreg with a
4606 zero_extend to avoid the reload that would otherwise be required. */
4608 if (GET_CODE (src) == SUBREG && subreg_lowpart_p (src)
4609 && LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (src))) != NIL
4610 && SUBREG_WORD (src) == 0
4611 && (GET_MODE_SIZE (GET_MODE (src))
4612 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (src))))
4613 && GET_CODE (SUBREG_REG (src)) == MEM)
4615 SUBST (SET_SRC (x),
4616 gen_rtx_combine (LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (src))),
4617 GET_MODE (src), XEXP (src, 0)));
4619 src = SET_SRC (x);
4621 #endif
4623 /* If we don't have a conditional move, SET_SRC is an IF_THEN_ELSE, and we
4624 are comparing an item known to be 0 or -1 against 0, use a logical
4625 operation instead. Check for one of the arms being an IOR of the other
4626 arm with some value. We compute three terms to be IOR'ed together. In
4627 practice, at most two will be nonzero. Then we do the IOR's. */
4629 if (GET_CODE (dest) != PC
4630 && GET_CODE (src) == IF_THEN_ELSE
4631 && GET_MODE_CLASS (GET_MODE (src)) == MODE_INT
4632 && (GET_CODE (XEXP (src, 0)) == EQ || GET_CODE (XEXP (src, 0)) == NE)
4633 && XEXP (XEXP (src, 0), 1) == const0_rtx
4634 && GET_MODE (src) == GET_MODE (XEXP (XEXP (src, 0), 0))
4635 #ifdef HAVE_conditional_move
4636 && ! can_conditionally_move_p (GET_MODE (src))
4637 #endif
4638 && (num_sign_bit_copies (XEXP (XEXP (src, 0), 0),
4639 GET_MODE (XEXP (XEXP (src, 0), 0)))
4640 == GET_MODE_BITSIZE (GET_MODE (XEXP (XEXP (src, 0), 0))))
4641 && ! side_effects_p (src))
4643 rtx true = (GET_CODE (XEXP (src, 0)) == NE
4644 ? XEXP (src, 1) : XEXP (src, 2));
4645 rtx false = (GET_CODE (XEXP (src, 0)) == NE
4646 ? XEXP (src, 2) : XEXP (src, 1));
4647 rtx term1 = const0_rtx, term2, term3;
4649 if (GET_CODE (true) == IOR && rtx_equal_p (XEXP (true, 0), false))
4650 term1 = false, true = XEXP (true, 1), false = const0_rtx;
4651 else if (GET_CODE (true) == IOR
4652 && rtx_equal_p (XEXP (true, 1), false))
4653 term1 = false, true = XEXP (true, 0), false = const0_rtx;
4654 else if (GET_CODE (false) == IOR
4655 && rtx_equal_p (XEXP (false, 0), true))
4656 term1 = true, false = XEXP (false, 1), true = const0_rtx;
4657 else if (GET_CODE (false) == IOR
4658 && rtx_equal_p (XEXP (false, 1), true))
4659 term1 = true, false = XEXP (false, 0), true = const0_rtx;
4661 term2 = gen_binary (AND, GET_MODE (src), XEXP (XEXP (src, 0), 0), true);
4662 term3 = gen_binary (AND, GET_MODE (src),
4663 gen_unary (NOT, GET_MODE (src), GET_MODE (src),
4664 XEXP (XEXP (src, 0), 0)),
4665 false);
4667 SUBST (SET_SRC (x),
4668 gen_binary (IOR, GET_MODE (src),
4669 gen_binary (IOR, GET_MODE (src), term1, term2),
4670 term3));
4672 src = SET_SRC (x);
4675 /* If either SRC or DEST is a CLOBBER of (const_int 0), make this
4676 whole thing fail. */
4677 if (GET_CODE (src) == CLOBBER && XEXP (src, 0) == const0_rtx)
4678 return src;
4679 else if (GET_CODE (dest) == CLOBBER && XEXP (dest, 0) == const0_rtx)
4680 return dest;
4681 else
4682 /* Convert this into a field assignment operation, if possible. */
4683 return make_field_assignment (x);
4686 /* Simplify, X, and AND, IOR, or XOR operation, and return the simplified
4687 result. LAST is nonzero if this is the last retry. */
4689 static rtx
4690 simplify_logical (x, last)
4691 rtx x;
4692 int last;
4694 enum machine_mode mode = GET_MODE (x);
4695 rtx op0 = XEXP (x, 0);
4696 rtx op1 = XEXP (x, 1);
4698 switch (GET_CODE (x))
4700 case AND:
4701 /* Convert (A ^ B) & A to A & (~ B) since the latter is often a single
4702 insn (and may simplify more). */
4703 if (GET_CODE (op0) == XOR
4704 && rtx_equal_p (XEXP (op0, 0), op1)
4705 && ! side_effects_p (op1))
4706 x = gen_binary (AND, mode,
4707 gen_unary (NOT, mode, mode, XEXP (op0, 1)), op1);
4709 if (GET_CODE (op0) == XOR
4710 && rtx_equal_p (XEXP (op0, 1), op1)
4711 && ! side_effects_p (op1))
4712 x = gen_binary (AND, mode,
4713 gen_unary (NOT, mode, mode, XEXP (op0, 0)), op1);
4715 /* Similarly for (~ (A ^ B)) & A. */
4716 if (GET_CODE (op0) == NOT
4717 && GET_CODE (XEXP (op0, 0)) == XOR
4718 && rtx_equal_p (XEXP (XEXP (op0, 0), 0), op1)
4719 && ! side_effects_p (op1))
4720 x = gen_binary (AND, mode, XEXP (XEXP (op0, 0), 1), op1);
4722 if (GET_CODE (op0) == NOT
4723 && GET_CODE (XEXP (op0, 0)) == XOR
4724 && rtx_equal_p (XEXP (XEXP (op0, 0), 1), op1)
4725 && ! side_effects_p (op1))
4726 x = gen_binary (AND, mode, XEXP (XEXP (op0, 0), 0), op1);
4728 if (GET_CODE (op1) == CONST_INT)
4730 x = simplify_and_const_int (x, mode, op0, INTVAL (op1));
4732 /* If we have (ior (and (X C1) C2)) and the next restart would be
4733 the last, simplify this by making C1 as small as possible
4734 and then exit. */
4735 if (last
4736 && GET_CODE (x) == IOR && GET_CODE (op0) == AND
4737 && GET_CODE (XEXP (op0, 1)) == CONST_INT
4738 && GET_CODE (op1) == CONST_INT)
4739 return gen_binary (IOR, mode,
4740 gen_binary (AND, mode, XEXP (op0, 0),
4741 GEN_INT (INTVAL (XEXP (op0, 1))
4742 & ~ INTVAL (op1))), op1);
4744 if (GET_CODE (x) != AND)
4745 return x;
4747 if (GET_RTX_CLASS (GET_CODE (x)) == 'c'
4748 || GET_RTX_CLASS (GET_CODE (x)) == '2')
4749 op0 = XEXP (x, 0), op1 = XEXP (x, 1);
4752 /* Convert (A | B) & A to A. */
4753 if (GET_CODE (op0) == IOR
4754 && (rtx_equal_p (XEXP (op0, 0), op1)
4755 || rtx_equal_p (XEXP (op0, 1), op1))
4756 && ! side_effects_p (XEXP (op0, 0))
4757 && ! side_effects_p (XEXP (op0, 1)))
4758 return op1;
4760 /* In the following group of tests (and those in case IOR below),
4761 we start with some combination of logical operations and apply
4762 the distributive law followed by the inverse distributive law.
4763 Most of the time, this results in no change. However, if some of
4764 the operands are the same or inverses of each other, simplifications
4765 will result.
4767 For example, (and (ior A B) (not B)) can occur as the result of
4768 expanding a bit field assignment. When we apply the distributive
4769 law to this, we get (ior (and (A (not B))) (and (B (not B)))),
4770 which then simplifies to (and (A (not B))).
4772 If we have (and (ior A B) C), apply the distributive law and then
4773 the inverse distributive law to see if things simplify. */
4775 if (GET_CODE (op0) == IOR || GET_CODE (op0) == XOR)
4777 x = apply_distributive_law
4778 (gen_binary (GET_CODE (op0), mode,
4779 gen_binary (AND, mode, XEXP (op0, 0), op1),
4780 gen_binary (AND, mode, XEXP (op0, 1), op1)));
4781 if (GET_CODE (x) != AND)
4782 return x;
4785 if (GET_CODE (op1) == IOR || GET_CODE (op1) == XOR)
4786 return apply_distributive_law
4787 (gen_binary (GET_CODE (op1), mode,
4788 gen_binary (AND, mode, XEXP (op1, 0), op0),
4789 gen_binary (AND, mode, XEXP (op1, 1), op0)));
4791 /* Similarly, taking advantage of the fact that
4792 (and (not A) (xor B C)) == (xor (ior A B) (ior A C)) */
4794 if (GET_CODE (op0) == NOT && GET_CODE (op1) == XOR)
4795 return apply_distributive_law
4796 (gen_binary (XOR, mode,
4797 gen_binary (IOR, mode, XEXP (op0, 0), XEXP (op1, 0)),
4798 gen_binary (IOR, mode, XEXP (op0, 0), XEXP (op1, 1))));
4800 else if (GET_CODE (op1) == NOT && GET_CODE (op0) == XOR)
4801 return apply_distributive_law
4802 (gen_binary (XOR, mode,
4803 gen_binary (IOR, mode, XEXP (op1, 0), XEXP (op0, 0)),
4804 gen_binary (IOR, mode, XEXP (op1, 0), XEXP (op0, 1))));
4805 break;
4807 case IOR:
4808 /* (ior A C) is C if all bits of A that might be nonzero are on in C. */
4809 if (GET_CODE (op1) == CONST_INT
4810 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
4811 && (nonzero_bits (op0, mode) & ~ INTVAL (op1)) == 0)
4812 return op1;
4814 /* Convert (A & B) | A to A. */
4815 if (GET_CODE (op0) == AND
4816 && (rtx_equal_p (XEXP (op0, 0), op1)
4817 || rtx_equal_p (XEXP (op0, 1), op1))
4818 && ! side_effects_p (XEXP (op0, 0))
4819 && ! side_effects_p (XEXP (op0, 1)))
4820 return op1;
4822 /* If we have (ior (and A B) C), apply the distributive law and then
4823 the inverse distributive law to see if things simplify. */
4825 if (GET_CODE (op0) == AND)
4827 x = apply_distributive_law
4828 (gen_binary (AND, mode,
4829 gen_binary (IOR, mode, XEXP (op0, 0), op1),
4830 gen_binary (IOR, mode, XEXP (op0, 1), op1)));
4832 if (GET_CODE (x) != IOR)
4833 return x;
4836 if (GET_CODE (op1) == AND)
4838 x = apply_distributive_law
4839 (gen_binary (AND, mode,
4840 gen_binary (IOR, mode, XEXP (op1, 0), op0),
4841 gen_binary (IOR, mode, XEXP (op1, 1), op0)));
4843 if (GET_CODE (x) != IOR)
4844 return x;
4847 /* Convert (ior (ashift A CX) (lshiftrt A CY)) where CX+CY equals the
4848 mode size to (rotate A CX). */
4850 if (((GET_CODE (op0) == ASHIFT && GET_CODE (op1) == LSHIFTRT)
4851 || (GET_CODE (op1) == ASHIFT && GET_CODE (op0) == LSHIFTRT))
4852 && rtx_equal_p (XEXP (op0, 0), XEXP (op1, 0))
4853 && GET_CODE (XEXP (op0, 1)) == CONST_INT
4854 && GET_CODE (XEXP (op1, 1)) == CONST_INT
4855 && (INTVAL (XEXP (op0, 1)) + INTVAL (XEXP (op1, 1))
4856 == GET_MODE_BITSIZE (mode)))
4857 return gen_rtx (ROTATE, mode, XEXP (op0, 0),
4858 (GET_CODE (op0) == ASHIFT
4859 ? XEXP (op0, 1) : XEXP (op1, 1)));
4861 /* If OP0 is (ashiftrt (plus ...) C), it might actually be
4862 a (sign_extend (plus ...)). If so, OP1 is a CONST_INT, and the PLUS
4863 does not affect any of the bits in OP1, it can really be done
4864 as a PLUS and we can associate. We do this by seeing if OP1
4865 can be safely shifted left C bits. */
4866 if (GET_CODE (op1) == CONST_INT && GET_CODE (op0) == ASHIFTRT
4867 && GET_CODE (XEXP (op0, 0)) == PLUS
4868 && GET_CODE (XEXP (XEXP (op0, 0), 1)) == CONST_INT
4869 && GET_CODE (XEXP (op0, 1)) == CONST_INT
4870 && INTVAL (XEXP (op0, 1)) < HOST_BITS_PER_WIDE_INT)
4872 int count = INTVAL (XEXP (op0, 1));
4873 HOST_WIDE_INT mask = INTVAL (op1) << count;
4875 if (mask >> count == INTVAL (op1)
4876 && (mask & nonzero_bits (XEXP (op0, 0), mode)) == 0)
4878 SUBST (XEXP (XEXP (op0, 0), 1),
4879 GEN_INT (INTVAL (XEXP (XEXP (op0, 0), 1)) | mask));
4880 return op0;
4883 break;
4885 case XOR:
4886 /* Convert (XOR (NOT x) (NOT y)) to (XOR x y).
4887 Also convert (XOR (NOT x) y) to (NOT (XOR x y)), similarly for
4888 (NOT y). */
4890 int num_negated = 0;
4892 if (GET_CODE (op0) == NOT)
4893 num_negated++, op0 = XEXP (op0, 0);
4894 if (GET_CODE (op1) == NOT)
4895 num_negated++, op1 = XEXP (op1, 0);
4897 if (num_negated == 2)
4899 SUBST (XEXP (x, 0), op0);
4900 SUBST (XEXP (x, 1), op1);
4902 else if (num_negated == 1)
4903 return gen_unary (NOT, mode, mode, gen_binary (XOR, mode, op0, op1));
4906 /* Convert (xor (and A B) B) to (and (not A) B). The latter may
4907 correspond to a machine insn or result in further simplifications
4908 if B is a constant. */
4910 if (GET_CODE (op0) == AND
4911 && rtx_equal_p (XEXP (op0, 1), op1)
4912 && ! side_effects_p (op1))
4913 return gen_binary (AND, mode,
4914 gen_unary (NOT, mode, mode, XEXP (op0, 0)),
4915 op1);
4917 else if (GET_CODE (op0) == AND
4918 && rtx_equal_p (XEXP (op0, 0), op1)
4919 && ! side_effects_p (op1))
4920 return gen_binary (AND, mode,
4921 gen_unary (NOT, mode, mode, XEXP (op0, 1)),
4922 op1);
4924 /* (xor (comparison foo bar) (const_int 1)) can become the reversed
4925 comparison if STORE_FLAG_VALUE is 1. */
4926 if (STORE_FLAG_VALUE == 1
4927 && op1 == const1_rtx
4928 && GET_RTX_CLASS (GET_CODE (op0)) == '<'
4929 && reversible_comparison_p (op0))
4930 return gen_rtx_combine (reverse_condition (GET_CODE (op0)),
4931 mode, XEXP (op0, 0), XEXP (op0, 1));
4933 /* (lshiftrt foo C) where C is the number of bits in FOO minus 1
4934 is (lt foo (const_int 0)), so we can perform the above
4935 simplification if STORE_FLAG_VALUE is 1. */
4937 if (STORE_FLAG_VALUE == 1
4938 && op1 == const1_rtx
4939 && GET_CODE (op0) == LSHIFTRT
4940 && GET_CODE (XEXP (op0, 1)) == CONST_INT
4941 && INTVAL (XEXP (op0, 1)) == GET_MODE_BITSIZE (mode) - 1)
4942 return gen_rtx_combine (GE, mode, XEXP (op0, 0), const0_rtx);
4944 /* (xor (comparison foo bar) (const_int sign-bit))
4945 when STORE_FLAG_VALUE is the sign bit. */
4946 if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
4947 && ((STORE_FLAG_VALUE & GET_MODE_MASK (mode))
4948 == (HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (mode) - 1))
4949 && op1 == const_true_rtx
4950 && GET_RTX_CLASS (GET_CODE (op0)) == '<'
4951 && reversible_comparison_p (op0))
4952 return gen_rtx_combine (reverse_condition (GET_CODE (op0)),
4953 mode, XEXP (op0, 0), XEXP (op0, 1));
4954 break;
4957 return x;
4960 /* We consider ZERO_EXTRACT, SIGN_EXTRACT, and SIGN_EXTEND as "compound
4961 operations" because they can be replaced with two more basic operations.
4962 ZERO_EXTEND is also considered "compound" because it can be replaced with
4963 an AND operation, which is simpler, though only one operation.
4965 The function expand_compound_operation is called with an rtx expression
4966 and will convert it to the appropriate shifts and AND operations,
4967 simplifying at each stage.
4969 The function make_compound_operation is called to convert an expression
4970 consisting of shifts and ANDs into the equivalent compound expression.
4971 It is the inverse of this function, loosely speaking. */
4973 static rtx
4974 expand_compound_operation (x)
4975 rtx x;
4977 int pos = 0, len;
4978 int unsignedp = 0;
4979 int modewidth;
4980 rtx tem;
4982 switch (GET_CODE (x))
4984 case ZERO_EXTEND:
4985 unsignedp = 1;
4986 case SIGN_EXTEND:
4987 /* We can't necessarily use a const_int for a multiword mode;
4988 it depends on implicitly extending the value.
4989 Since we don't know the right way to extend it,
4990 we can't tell whether the implicit way is right.
4992 Even for a mode that is no wider than a const_int,
4993 we can't win, because we need to sign extend one of its bits through
4994 the rest of it, and we don't know which bit. */
4995 if (GET_CODE (XEXP (x, 0)) == CONST_INT)
4996 return x;
4998 /* Return if (subreg:MODE FROM 0) is not a safe replacement for
4999 (zero_extend:MODE FROM) or (sign_extend:MODE FROM). It is for any MEM
5000 because (SUBREG (MEM...)) is guaranteed to cause the MEM to be
5001 reloaded. If not for that, MEM's would very rarely be safe.
5003 Reject MODEs bigger than a word, because we might not be able
5004 to reference a two-register group starting with an arbitrary register
5005 (and currently gen_lowpart might crash for a SUBREG). */
5007 if (GET_MODE_SIZE (GET_MODE (XEXP (x, 0))) > UNITS_PER_WORD)
5008 return x;
5010 len = GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)));
5011 /* If the inner object has VOIDmode (the only way this can happen
5012 is if it is a ASM_OPERANDS), we can't do anything since we don't
5013 know how much masking to do. */
5014 if (len == 0)
5015 return x;
5017 break;
5019 case ZERO_EXTRACT:
5020 unsignedp = 1;
5021 case SIGN_EXTRACT:
5022 /* If the operand is a CLOBBER, just return it. */
5023 if (GET_CODE (XEXP (x, 0)) == CLOBBER)
5024 return XEXP (x, 0);
5026 if (GET_CODE (XEXP (x, 1)) != CONST_INT
5027 || GET_CODE (XEXP (x, 2)) != CONST_INT
5028 || GET_MODE (XEXP (x, 0)) == VOIDmode)
5029 return x;
5031 len = INTVAL (XEXP (x, 1));
5032 pos = INTVAL (XEXP (x, 2));
5034 /* If this goes outside the object being extracted, replace the object
5035 with a (use (mem ...)) construct that only combine understands
5036 and is used only for this purpose. */
5037 if (len + pos > GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))))
5038 SUBST (XEXP (x, 0), gen_rtx (USE, GET_MODE (x), XEXP (x, 0)));
5040 if (BITS_BIG_ENDIAN)
5041 pos = GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) - len - pos;
5043 break;
5045 default:
5046 return x;
5049 /* We can optimize some special cases of ZERO_EXTEND. */
5050 if (GET_CODE (x) == ZERO_EXTEND)
5052 /* (zero_extend:DI (truncate:SI foo:DI)) is just foo:DI if we
5053 know that the last value didn't have any inappropriate bits
5054 set. */
5055 if (GET_CODE (XEXP (x, 0)) == TRUNCATE
5056 && GET_MODE (XEXP (XEXP (x, 0), 0)) == GET_MODE (x)
5057 && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT
5058 && (nonzero_bits (XEXP (XEXP (x, 0), 0), GET_MODE (x))
5059 & ~ GET_MODE_MASK (GET_MODE (XEXP (x, 0)))) == 0)
5060 return XEXP (XEXP (x, 0), 0);
5062 /* Likewise for (zero_extend:DI (subreg:SI foo:DI 0)). */
5063 if (GET_CODE (XEXP (x, 0)) == SUBREG
5064 && GET_MODE (SUBREG_REG (XEXP (x, 0))) == GET_MODE (x)
5065 && subreg_lowpart_p (XEXP (x, 0))
5066 && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT
5067 && (nonzero_bits (SUBREG_REG (XEXP (x, 0)), GET_MODE (x))
5068 & ~ GET_MODE_MASK (GET_MODE (SUBREG_REG (x)))) == 0)
5069 return SUBREG_REG (XEXP (x, 0));
5071 /* (zero_extend:DI (truncate:SI foo:DI)) is just foo:DI when foo
5072 is a comparison and STORE_FLAG_VALUE permits. This is like
5073 the first case, but it works even when GET_MODE (x) is larger
5074 than HOST_WIDE_INT. */
5075 if (GET_CODE (XEXP (x, 0)) == TRUNCATE
5076 && GET_MODE (XEXP (XEXP (x, 0), 0)) == GET_MODE (x)
5077 && GET_RTX_CLASS (GET_CODE (XEXP (XEXP (x, 0), 0))) == '<'
5078 && (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
5079 <= HOST_BITS_PER_WIDE_INT)
5080 && ((HOST_WIDE_INT) STORE_FLAG_VALUE
5081 & ~ GET_MODE_MASK (GET_MODE (XEXP (x, 0)))) == 0)
5082 return XEXP (XEXP (x, 0), 0);
5084 /* Likewise for (zero_extend:DI (subreg:SI foo:DI 0)). */
5085 if (GET_CODE (XEXP (x, 0)) == SUBREG
5086 && GET_MODE (SUBREG_REG (XEXP (x, 0))) == GET_MODE (x)
5087 && subreg_lowpart_p (XEXP (x, 0))
5088 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (XEXP (x, 0)))) == '<'
5089 && (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
5090 <= HOST_BITS_PER_WIDE_INT)
5091 && ((HOST_WIDE_INT) STORE_FLAG_VALUE
5092 & ~ GET_MODE_MASK (GET_MODE (XEXP (x, 0)))) == 0)
5093 return SUBREG_REG (XEXP (x, 0));
5095 /* If sign extension is cheaper than zero extension, then use it
5096 if we know that no extraneous bits are set, and that the high
5097 bit is not set. */
5098 if (flag_expensive_optimizations
5099 && ((GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT
5100 && ((nonzero_bits (XEXP (x, 0), GET_MODE (x))
5101 & ~ (((unsigned HOST_WIDE_INT)
5102 GET_MODE_MASK (GET_MODE (XEXP (x, 0))))
5103 >> 1))
5104 == 0))
5105 || (GET_RTX_CLASS (GET_CODE (XEXP (x, 0))) == '<'
5106 && (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
5107 <= HOST_BITS_PER_WIDE_INT)
5108 && (((HOST_WIDE_INT) STORE_FLAG_VALUE
5109 & ~ (((unsigned HOST_WIDE_INT)
5110 GET_MODE_MASK (GET_MODE (XEXP (x, 0))))
5111 >> 1))
5112 == 0))))
5114 rtx temp = gen_rtx (SIGN_EXTEND, GET_MODE (x), XEXP (x, 0));
5116 if (rtx_cost (temp, SET) < rtx_cost (x, SET))
5117 return expand_compound_operation (temp);
5121 /* If we reach here, we want to return a pair of shifts. The inner
5122 shift is a left shift of BITSIZE - POS - LEN bits. The outer
5123 shift is a right shift of BITSIZE - LEN bits. It is arithmetic or
5124 logical depending on the value of UNSIGNEDP.
5126 If this was a ZERO_EXTEND or ZERO_EXTRACT, this pair of shifts will be
5127 converted into an AND of a shift.
5129 We must check for the case where the left shift would have a negative
5130 count. This can happen in a case like (x >> 31) & 255 on machines
5131 that can't shift by a constant. On those machines, we would first
5132 combine the shift with the AND to produce a variable-position
5133 extraction. Then the constant of 31 would be substituted in to produce
5134 a such a position. */
5136 modewidth = GET_MODE_BITSIZE (GET_MODE (x));
5137 if (modewidth >= pos - len)
5138 tem = simplify_shift_const (NULL_RTX, unsignedp ? LSHIFTRT : ASHIFTRT,
5139 GET_MODE (x),
5140 simplify_shift_const (NULL_RTX, ASHIFT,
5141 GET_MODE (x),
5142 XEXP (x, 0),
5143 modewidth - pos - len),
5144 modewidth - len);
5146 else if (unsignedp && len < HOST_BITS_PER_WIDE_INT)
5147 tem = simplify_and_const_int (NULL_RTX, GET_MODE (x),
5148 simplify_shift_const (NULL_RTX, LSHIFTRT,
5149 GET_MODE (x),
5150 XEXP (x, 0), pos),
5151 ((HOST_WIDE_INT) 1 << len) - 1);
5152 else
5153 /* Any other cases we can't handle. */
5154 return x;
5157 /* If we couldn't do this for some reason, return the original
5158 expression. */
5159 if (GET_CODE (tem) == CLOBBER)
5160 return x;
5162 return tem;
5165 /* X is a SET which contains an assignment of one object into
5166 a part of another (such as a bit-field assignment, STRICT_LOW_PART,
5167 or certain SUBREGS). If possible, convert it into a series of
5168 logical operations.
5170 We half-heartedly support variable positions, but do not at all
5171 support variable lengths. */
5173 static rtx
5174 expand_field_assignment (x)
5175 rtx x;
5177 rtx inner;
5178 rtx pos; /* Always counts from low bit. */
5179 int len;
5180 rtx mask;
5181 enum machine_mode compute_mode;
5183 /* Loop until we find something we can't simplify. */
5184 while (1)
5186 if (GET_CODE (SET_DEST (x)) == STRICT_LOW_PART
5187 && GET_CODE (XEXP (SET_DEST (x), 0)) == SUBREG)
5189 inner = SUBREG_REG (XEXP (SET_DEST (x), 0));
5190 len = GET_MODE_BITSIZE (GET_MODE (XEXP (SET_DEST (x), 0)));
5191 pos = GEN_INT (BITS_PER_WORD * SUBREG_WORD (XEXP (SET_DEST (x), 0)));
5193 else if (GET_CODE (SET_DEST (x)) == ZERO_EXTRACT
5194 && GET_CODE (XEXP (SET_DEST (x), 1)) == CONST_INT)
5196 inner = XEXP (SET_DEST (x), 0);
5197 len = INTVAL (XEXP (SET_DEST (x), 1));
5198 pos = XEXP (SET_DEST (x), 2);
5200 /* If the position is constant and spans the width of INNER,
5201 surround INNER with a USE to indicate this. */
5202 if (GET_CODE (pos) == CONST_INT
5203 && INTVAL (pos) + len > GET_MODE_BITSIZE (GET_MODE (inner)))
5204 inner = gen_rtx (USE, GET_MODE (SET_DEST (x)), inner);
5206 if (BITS_BIG_ENDIAN)
5208 if (GET_CODE (pos) == CONST_INT)
5209 pos = GEN_INT (GET_MODE_BITSIZE (GET_MODE (inner)) - len
5210 - INTVAL (pos));
5211 else if (GET_CODE (pos) == MINUS
5212 && GET_CODE (XEXP (pos, 1)) == CONST_INT
5213 && (INTVAL (XEXP (pos, 1))
5214 == GET_MODE_BITSIZE (GET_MODE (inner)) - len))
5215 /* If position is ADJUST - X, new position is X. */
5216 pos = XEXP (pos, 0);
5217 else
5218 pos = gen_binary (MINUS, GET_MODE (pos),
5219 GEN_INT (GET_MODE_BITSIZE (GET_MODE (inner))
5220 - len),
5221 pos);
5225 /* A SUBREG between two modes that occupy the same numbers of words
5226 can be done by moving the SUBREG to the source. */
5227 else if (GET_CODE (SET_DEST (x)) == SUBREG
5228 && (((GET_MODE_SIZE (GET_MODE (SET_DEST (x)))
5229 + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD)
5230 == ((GET_MODE_SIZE (GET_MODE (SUBREG_REG (SET_DEST (x))))
5231 + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD)))
5233 x = gen_rtx (SET, VOIDmode, SUBREG_REG (SET_DEST (x)),
5234 gen_lowpart_for_combine (GET_MODE (SUBREG_REG (SET_DEST (x))),
5235 SET_SRC (x)));
5236 continue;
5238 else
5239 break;
5241 while (GET_CODE (inner) == SUBREG && subreg_lowpart_p (inner))
5242 inner = SUBREG_REG (inner);
5244 compute_mode = GET_MODE (inner);
5246 /* Compute a mask of LEN bits, if we can do this on the host machine. */
5247 if (len < HOST_BITS_PER_WIDE_INT)
5248 mask = GEN_INT (((HOST_WIDE_INT) 1 << len) - 1);
5249 else
5250 break;
5252 /* Now compute the equivalent expression. Make a copy of INNER
5253 for the SET_DEST in case it is a MEM into which we will substitute;
5254 we don't want shared RTL in that case. */
5255 x = gen_rtx (SET, VOIDmode, copy_rtx (inner),
5256 gen_binary (IOR, compute_mode,
5257 gen_binary (AND, compute_mode,
5258 gen_unary (NOT, compute_mode,
5259 compute_mode,
5260 gen_binary (ASHIFT,
5261 compute_mode,
5262 mask, pos)),
5263 inner),
5264 gen_binary (ASHIFT, compute_mode,
5265 gen_binary (AND, compute_mode,
5266 gen_lowpart_for_combine
5267 (compute_mode,
5268 SET_SRC (x)),
5269 mask),
5270 pos)));
5273 return x;
5276 /* Return an RTX for a reference to LEN bits of INNER. If POS_RTX is nonzero,
5277 it is an RTX that represents a variable starting position; otherwise,
5278 POS is the (constant) starting bit position (counted from the LSB).
5280 INNER may be a USE. This will occur when we started with a bitfield
5281 that went outside the boundary of the object in memory, which is
5282 allowed on most machines. To isolate this case, we produce a USE
5283 whose mode is wide enough and surround the MEM with it. The only
5284 code that understands the USE is this routine. If it is not removed,
5285 it will cause the resulting insn not to match.
5287 UNSIGNEDP is non-zero for an unsigned reference and zero for a
5288 signed reference.
5290 IN_DEST is non-zero if this is a reference in the destination of a
5291 SET. This is used when a ZERO_ or SIGN_EXTRACT isn't needed. If non-zero,
5292 a STRICT_LOW_PART will be used, if zero, ZERO_EXTEND or SIGN_EXTEND will
5293 be used.
5295 IN_COMPARE is non-zero if we are in a COMPARE. This means that a
5296 ZERO_EXTRACT should be built even for bits starting at bit 0.
5298 MODE is the desired mode of the result (if IN_DEST == 0).
5300 The result is an RTX for the extraction or NULL_RTX if the target
5301 can't handle it. */
5303 static rtx
5304 make_extraction (mode, inner, pos, pos_rtx, len,
5305 unsignedp, in_dest, in_compare)
5306 enum machine_mode mode;
5307 rtx inner;
5308 int pos;
5309 rtx pos_rtx;
5310 int len;
5311 int unsignedp;
5312 int in_dest, in_compare;
5314 /* This mode describes the size of the storage area
5315 to fetch the overall value from. Within that, we
5316 ignore the POS lowest bits, etc. */
5317 enum machine_mode is_mode = GET_MODE (inner);
5318 enum machine_mode inner_mode;
5319 enum machine_mode wanted_inner_mode = byte_mode;
5320 enum machine_mode wanted_inner_reg_mode = word_mode;
5321 enum machine_mode pos_mode = word_mode;
5322 enum machine_mode extraction_mode = word_mode;
5323 enum machine_mode tmode = mode_for_size (len, MODE_INT, 1);
5324 int spans_byte = 0;
5325 rtx new = 0;
5326 rtx orig_pos_rtx = pos_rtx;
5327 int orig_pos;
5329 /* Get some information about INNER and get the innermost object. */
5330 if (GET_CODE (inner) == USE)
5331 /* (use:SI (mem:QI foo)) stands for (mem:SI foo). */
5332 /* We don't need to adjust the position because we set up the USE
5333 to pretend that it was a full-word object. */
5334 spans_byte = 1, inner = XEXP (inner, 0);
5335 else if (GET_CODE (inner) == SUBREG && subreg_lowpart_p (inner))
5337 /* If going from (subreg:SI (mem:QI ...)) to (mem:QI ...),
5338 consider just the QI as the memory to extract from.
5339 The subreg adds or removes high bits; its mode is
5340 irrelevant to the meaning of this extraction,
5341 since POS and LEN count from the lsb. */
5342 if (GET_CODE (SUBREG_REG (inner)) == MEM)
5343 is_mode = GET_MODE (SUBREG_REG (inner));
5344 inner = SUBREG_REG (inner);
5347 inner_mode = GET_MODE (inner);
5349 if (pos_rtx && GET_CODE (pos_rtx) == CONST_INT)
5350 pos = INTVAL (pos_rtx), pos_rtx = 0;
5352 /* See if this can be done without an extraction. We never can if the
5353 width of the field is not the same as that of some integer mode. For
5354 registers, we can only avoid the extraction if the position is at the
5355 low-order bit and this is either not in the destination or we have the
5356 appropriate STRICT_LOW_PART operation available.
5358 For MEM, we can avoid an extract if the field starts on an appropriate
5359 boundary and we can change the mode of the memory reference. However,
5360 we cannot directly access the MEM if we have a USE and the underlying
5361 MEM is not TMODE. This combination means that MEM was being used in a
5362 context where bits outside its mode were being referenced; that is only
5363 valid in bit-field insns. */
5365 if (tmode != BLKmode
5366 && ! (spans_byte && inner_mode != tmode)
5367 && ((pos_rtx == 0 && (pos % BITS_PER_WORD) == 0
5368 && GET_CODE (inner) != MEM
5369 && (! in_dest
5370 || (GET_CODE (inner) == REG
5371 && (movstrict_optab->handlers[(int) tmode].insn_code
5372 != CODE_FOR_nothing))))
5373 || (GET_CODE (inner) == MEM && pos_rtx == 0
5374 && (pos
5375 % (STRICT_ALIGNMENT ? GET_MODE_ALIGNMENT (tmode)
5376 : BITS_PER_UNIT)) == 0
5377 /* We can't do this if we are widening INNER_MODE (it
5378 may not be aligned, for one thing). */
5379 && GET_MODE_BITSIZE (inner_mode) >= GET_MODE_BITSIZE (tmode)
5380 && (inner_mode == tmode
5381 || (! mode_dependent_address_p (XEXP (inner, 0))
5382 && ! MEM_VOLATILE_P (inner))))))
5384 /* If INNER is a MEM, make a new MEM that encompasses just the desired
5385 field. If the original and current mode are the same, we need not
5386 adjust the offset. Otherwise, we do if bytes big endian.
5388 If INNER is not a MEM, get a piece consisting of just the field
5389 of interest (in this case POS % BITS_PER_WORD must be 0). */
5391 if (GET_CODE (inner) == MEM)
5393 int offset;
5394 /* POS counts from lsb, but make OFFSET count in memory order. */
5395 if (BYTES_BIG_ENDIAN)
5396 offset = (GET_MODE_BITSIZE (is_mode) - len - pos) / BITS_PER_UNIT;
5397 else
5398 offset = pos / BITS_PER_UNIT;
5400 new = gen_rtx (MEM, tmode, plus_constant (XEXP (inner, 0), offset));
5401 RTX_UNCHANGING_P (new) = RTX_UNCHANGING_P (inner);
5402 MEM_VOLATILE_P (new) = MEM_VOLATILE_P (inner);
5403 MEM_IN_STRUCT_P (new) = MEM_IN_STRUCT_P (inner);
5405 else if (GET_CODE (inner) == REG)
5407 /* We can't call gen_lowpart_for_combine here since we always want
5408 a SUBREG and it would sometimes return a new hard register. */
5409 if (tmode != inner_mode)
5410 new = gen_rtx (SUBREG, tmode, inner,
5411 (WORDS_BIG_ENDIAN
5412 && GET_MODE_SIZE (inner_mode) > UNITS_PER_WORD
5413 ? (((GET_MODE_SIZE (inner_mode)
5414 - GET_MODE_SIZE (tmode))
5415 / UNITS_PER_WORD)
5416 - pos / BITS_PER_WORD)
5417 : pos / BITS_PER_WORD));
5418 else
5419 new = inner;
5421 else
5422 new = force_to_mode (inner, tmode,
5423 len >= HOST_BITS_PER_WIDE_INT
5424 ? GET_MODE_MASK (tmode)
5425 : ((HOST_WIDE_INT) 1 << len) - 1,
5426 NULL_RTX, 0);
5428 /* If this extraction is going into the destination of a SET,
5429 make a STRICT_LOW_PART unless we made a MEM. */
5431 if (in_dest)
5432 return (GET_CODE (new) == MEM ? new
5433 : (GET_CODE (new) != SUBREG
5434 ? gen_rtx (CLOBBER, tmode, const0_rtx)
5435 : gen_rtx_combine (STRICT_LOW_PART, VOIDmode, new)));
5437 /* Otherwise, sign- or zero-extend unless we already are in the
5438 proper mode. */
5440 return (mode == tmode ? new
5441 : gen_rtx_combine (unsignedp ? ZERO_EXTEND : SIGN_EXTEND,
5442 mode, new));
5445 /* Unless this is a COMPARE or we have a funny memory reference,
5446 don't do anything with zero-extending field extracts starting at
5447 the low-order bit since they are simple AND operations. */
5448 if (pos_rtx == 0 && pos == 0 && ! in_dest
5449 && ! in_compare && ! spans_byte && unsignedp)
5450 return 0;
5452 /* Unless we are allowed to span bytes, reject this if we would be
5453 spanning bytes or if the position is not a constant and the length
5454 is not 1. In all other cases, we would only be going outside
5455 out object in cases when an original shift would have been
5456 undefined. */
5457 if (! spans_byte
5458 && ((pos_rtx == 0 && pos + len > GET_MODE_BITSIZE (is_mode))
5459 || (pos_rtx != 0 && len != 1)))
5460 return 0;
5462 /* Get the mode to use should INNER not be a MEM, the mode for the position,
5463 and the mode for the result. */
5464 #ifdef HAVE_insv
5465 if (in_dest)
5467 wanted_inner_reg_mode = insn_operand_mode[(int) CODE_FOR_insv][0];
5468 pos_mode = insn_operand_mode[(int) CODE_FOR_insv][2];
5469 extraction_mode = insn_operand_mode[(int) CODE_FOR_insv][3];
5471 #endif
5473 #ifdef HAVE_extzv
5474 if (! in_dest && unsignedp)
5476 wanted_inner_reg_mode = insn_operand_mode[(int) CODE_FOR_extzv][1];
5477 pos_mode = insn_operand_mode[(int) CODE_FOR_extzv][3];
5478 extraction_mode = insn_operand_mode[(int) CODE_FOR_extzv][0];
5480 #endif
5482 #ifdef HAVE_extv
5483 if (! in_dest && ! unsignedp)
5485 wanted_inner_reg_mode = insn_operand_mode[(int) CODE_FOR_extv][1];
5486 pos_mode = insn_operand_mode[(int) CODE_FOR_extv][3];
5487 extraction_mode = insn_operand_mode[(int) CODE_FOR_extv][0];
5489 #endif
5491 /* Never narrow an object, since that might not be safe. */
5493 if (mode != VOIDmode
5494 && GET_MODE_SIZE (extraction_mode) < GET_MODE_SIZE (mode))
5495 extraction_mode = mode;
5497 if (pos_rtx && GET_MODE (pos_rtx) != VOIDmode
5498 && GET_MODE_SIZE (pos_mode) < GET_MODE_SIZE (GET_MODE (pos_rtx)))
5499 pos_mode = GET_MODE (pos_rtx);
5501 /* If this is not from memory, the desired mode is wanted_inner_reg_mode;
5502 if we have to change the mode of memory and cannot, the desired mode is
5503 EXTRACTION_MODE. */
5504 if (GET_CODE (inner) != MEM)
5505 wanted_inner_mode = wanted_inner_reg_mode;
5506 else if (inner_mode != wanted_inner_mode
5507 && (mode_dependent_address_p (XEXP (inner, 0))
5508 || MEM_VOLATILE_P (inner)))
5509 wanted_inner_mode = extraction_mode;
5511 orig_pos = pos;
5513 if (BITS_BIG_ENDIAN)
5515 /* POS is passed as if BITS_BIG_ENDIAN == 0, so we need to convert it to
5516 BITS_BIG_ENDIAN style. If position is constant, compute new
5517 position. Otherwise, build subtraction.
5518 Note that POS is relative to the mode of the original argument.
5519 If it's a MEM we need to recompute POS relative to that.
5520 However, if we're extracting from (or inserting into) a register,
5521 we want to recompute POS relative to wanted_inner_mode. */
5522 int width = (GET_CODE (inner) == MEM
5523 ? GET_MODE_BITSIZE (is_mode)
5524 : GET_MODE_BITSIZE (wanted_inner_mode));
5526 if (pos_rtx == 0)
5527 pos = width - len - pos;
5528 else
5529 pos_rtx
5530 = gen_rtx_combine (MINUS, GET_MODE (pos_rtx),
5531 GEN_INT (width - len), pos_rtx);
5532 /* POS may be less than 0 now, but we check for that below.
5533 Note that it can only be less than 0 if GET_CODE (inner) != MEM. */
5536 /* If INNER has a wider mode, make it smaller. If this is a constant
5537 extract, try to adjust the byte to point to the byte containing
5538 the value. */
5539 if (wanted_inner_mode != VOIDmode
5540 && GET_MODE_SIZE (wanted_inner_mode) < GET_MODE_SIZE (is_mode)
5541 && ((GET_CODE (inner) == MEM
5542 && (inner_mode == wanted_inner_mode
5543 || (! mode_dependent_address_p (XEXP (inner, 0))
5544 && ! MEM_VOLATILE_P (inner))))))
5546 int offset = 0;
5548 /* The computations below will be correct if the machine is big
5549 endian in both bits and bytes or little endian in bits and bytes.
5550 If it is mixed, we must adjust. */
5552 /* If bytes are big endian and we had a paradoxical SUBREG, we must
5553 adjust OFFSET to compensate. */
5554 if (BYTES_BIG_ENDIAN
5555 && ! spans_byte
5556 && GET_MODE_SIZE (inner_mode) < GET_MODE_SIZE (is_mode))
5557 offset -= GET_MODE_SIZE (is_mode) - GET_MODE_SIZE (inner_mode);
5559 /* If this is a constant position, we can move to the desired byte. */
5560 if (pos_rtx == 0)
5562 offset += pos / BITS_PER_UNIT;
5563 pos %= GET_MODE_BITSIZE (wanted_inner_mode);
5566 if (BYTES_BIG_ENDIAN != BITS_BIG_ENDIAN
5567 && ! spans_byte
5568 && is_mode != wanted_inner_mode)
5569 offset = (GET_MODE_SIZE (is_mode)
5570 - GET_MODE_SIZE (wanted_inner_mode) - offset);
5572 if (offset != 0 || inner_mode != wanted_inner_mode)
5574 rtx newmem = gen_rtx (MEM, wanted_inner_mode,
5575 plus_constant (XEXP (inner, 0), offset));
5576 RTX_UNCHANGING_P (newmem) = RTX_UNCHANGING_P (inner);
5577 MEM_VOLATILE_P (newmem) = MEM_VOLATILE_P (inner);
5578 MEM_IN_STRUCT_P (newmem) = MEM_IN_STRUCT_P (inner);
5579 inner = newmem;
5583 /* If INNER is not memory, we can always get it into the proper mode. If we
5584 are changing its mode, POS must be a constant and smaller than the size
5585 of the new mode. */
5586 else if (GET_CODE (inner) != MEM)
5588 if (GET_MODE (inner) != wanted_inner_mode
5589 && (pos_rtx != 0
5590 || orig_pos + len > GET_MODE_BITSIZE (wanted_inner_mode)))
5591 return 0;
5593 inner = force_to_mode (inner, wanted_inner_mode,
5594 pos_rtx
5595 || len + orig_pos >= HOST_BITS_PER_WIDE_INT
5596 ? GET_MODE_MASK (wanted_inner_mode)
5597 : (((HOST_WIDE_INT) 1 << len) - 1) << orig_pos,
5598 NULL_RTX, 0);
5601 /* Adjust mode of POS_RTX, if needed. If we want a wider mode, we
5602 have to zero extend. Otherwise, we can just use a SUBREG. */
5603 if (pos_rtx != 0
5604 && GET_MODE_SIZE (pos_mode) > GET_MODE_SIZE (GET_MODE (pos_rtx)))
5605 pos_rtx = gen_rtx_combine (ZERO_EXTEND, pos_mode, pos_rtx);
5606 else if (pos_rtx != 0
5607 && GET_MODE_SIZE (pos_mode) < GET_MODE_SIZE (GET_MODE (pos_rtx)))
5608 pos_rtx = gen_lowpart_for_combine (pos_mode, pos_rtx);
5610 /* Make POS_RTX unless we already have it and it is correct. If we don't
5611 have a POS_RTX but we do have an ORIG_POS_RTX, the latter must
5612 be a CONST_INT. */
5613 if (pos_rtx == 0 && orig_pos_rtx != 0 && INTVAL (orig_pos_rtx) == pos)
5614 pos_rtx = orig_pos_rtx;
5616 else if (pos_rtx == 0)
5617 pos_rtx = GEN_INT (pos);
5619 /* Make the required operation. See if we can use existing rtx. */
5620 new = gen_rtx_combine (unsignedp ? ZERO_EXTRACT : SIGN_EXTRACT,
5621 extraction_mode, inner, GEN_INT (len), pos_rtx);
5622 if (! in_dest)
5623 new = gen_lowpart_for_combine (mode, new);
5625 return new;
5628 /* See if X contains an ASHIFT of COUNT or more bits that can be commuted
5629 with any other operations in X. Return X without that shift if so. */
5631 static rtx
5632 extract_left_shift (x, count)
5633 rtx x;
5634 int count;
5636 enum rtx_code code = GET_CODE (x);
5637 enum machine_mode mode = GET_MODE (x);
5638 rtx tem;
5640 switch (code)
5642 case ASHIFT:
5643 /* This is the shift itself. If it is wide enough, we will return
5644 either the value being shifted if the shift count is equal to
5645 COUNT or a shift for the difference. */
5646 if (GET_CODE (XEXP (x, 1)) == CONST_INT
5647 && INTVAL (XEXP (x, 1)) >= count)
5648 return simplify_shift_const (NULL_RTX, ASHIFT, mode, XEXP (x, 0),
5649 INTVAL (XEXP (x, 1)) - count);
5650 break;
5652 case NEG: case NOT:
5653 if ((tem = extract_left_shift (XEXP (x, 0), count)) != 0)
5654 return gen_unary (code, mode, mode, tem);
5656 break;
5658 case PLUS: case IOR: case XOR: case AND:
5659 /* If we can safely shift this constant and we find the inner shift,
5660 make a new operation. */
5661 if (GET_CODE (XEXP (x,1)) == CONST_INT
5662 && (INTVAL (XEXP (x, 1)) & (((HOST_WIDE_INT) 1 << count)) - 1) == 0
5663 && (tem = extract_left_shift (XEXP (x, 0), count)) != 0)
5664 return gen_binary (code, mode, tem,
5665 GEN_INT (INTVAL (XEXP (x, 1)) >> count));
5667 break;
5670 return 0;
5673 /* Look at the expression rooted at X. Look for expressions
5674 equivalent to ZERO_EXTRACT, SIGN_EXTRACT, ZERO_EXTEND, SIGN_EXTEND.
5675 Form these expressions.
5677 Return the new rtx, usually just X.
5679 Also, for machines like the Vax that don't have logical shift insns,
5680 try to convert logical to arithmetic shift operations in cases where
5681 they are equivalent. This undoes the canonicalizations to logical
5682 shifts done elsewhere.
5684 We try, as much as possible, to re-use rtl expressions to save memory.
5686 IN_CODE says what kind of expression we are processing. Normally, it is
5687 SET. In a memory address (inside a MEM, PLUS or minus, the latter two
5688 being kludges), it is MEM. When processing the arguments of a comparison
5689 or a COMPARE against zero, it is COMPARE. */
5691 static rtx
5692 make_compound_operation (x, in_code)
5693 rtx x;
5694 enum rtx_code in_code;
5696 enum rtx_code code = GET_CODE (x);
5697 enum machine_mode mode = GET_MODE (x);
5698 int mode_width = GET_MODE_BITSIZE (mode);
5699 rtx rhs, lhs;
5700 enum rtx_code next_code;
5701 int i;
5702 rtx new = 0;
5703 rtx tem;
5704 char *fmt;
5706 /* Select the code to be used in recursive calls. Once we are inside an
5707 address, we stay there. If we have a comparison, set to COMPARE,
5708 but once inside, go back to our default of SET. */
5710 next_code = (code == MEM || code == PLUS || code == MINUS ? MEM
5711 : ((code == COMPARE || GET_RTX_CLASS (code) == '<')
5712 && XEXP (x, 1) == const0_rtx) ? COMPARE
5713 : in_code == COMPARE ? SET : in_code);
5715 /* Process depending on the code of this operation. If NEW is set
5716 non-zero, it will be returned. */
5718 switch (code)
5720 case ASHIFT:
5721 /* Convert shifts by constants into multiplications if inside
5722 an address. */
5723 if (in_code == MEM && GET_CODE (XEXP (x, 1)) == CONST_INT
5724 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT
5725 && INTVAL (XEXP (x, 1)) >= 0)
5727 new = make_compound_operation (XEXP (x, 0), next_code);
5728 new = gen_rtx_combine (MULT, mode, new,
5729 GEN_INT ((HOST_WIDE_INT) 1
5730 << INTVAL (XEXP (x, 1))));
5732 break;
5734 case AND:
5735 /* If the second operand is not a constant, we can't do anything
5736 with it. */
5737 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
5738 break;
5740 /* If the constant is a power of two minus one and the first operand
5741 is a logical right shift, make an extraction. */
5742 if (GET_CODE (XEXP (x, 0)) == LSHIFTRT
5743 && (i = exact_log2 (INTVAL (XEXP (x, 1)) + 1)) >= 0)
5745 new = make_compound_operation (XEXP (XEXP (x, 0), 0), next_code);
5746 new = make_extraction (mode, new, 0, XEXP (XEXP (x, 0), 1), i, 1,
5747 0, in_code == COMPARE);
5750 /* Same as previous, but for (subreg (lshiftrt ...)) in first op. */
5751 else if (GET_CODE (XEXP (x, 0)) == SUBREG
5752 && subreg_lowpart_p (XEXP (x, 0))
5753 && GET_CODE (SUBREG_REG (XEXP (x, 0))) == LSHIFTRT
5754 && (i = exact_log2 (INTVAL (XEXP (x, 1)) + 1)) >= 0)
5756 new = make_compound_operation (XEXP (SUBREG_REG (XEXP (x, 0)), 0),
5757 next_code);
5758 new = make_extraction (GET_MODE (SUBREG_REG (XEXP (x, 0))), new, 0,
5759 XEXP (SUBREG_REG (XEXP (x, 0)), 1), i, 1,
5760 0, in_code == COMPARE);
5762 /* Same as previous, but for (xor/ior (lshiftrt...) (lshiftrt...)). */
5763 else if ((GET_CODE (XEXP (x, 0)) == XOR
5764 || GET_CODE (XEXP (x, 0)) == IOR)
5765 && GET_CODE (XEXP (XEXP (x, 0), 0)) == LSHIFTRT
5766 && GET_CODE (XEXP (XEXP (x, 0), 1)) == LSHIFTRT
5767 && (i = exact_log2 (INTVAL (XEXP (x, 1)) + 1)) >= 0)
5769 /* Apply the distributive law, and then try to make extractions. */
5770 new = gen_rtx_combine (GET_CODE (XEXP (x, 0)), mode,
5771 gen_rtx (AND, mode, XEXP (XEXP (x, 0), 0),
5772 XEXP (x, 1)),
5773 gen_rtx (AND, mode, XEXP (XEXP (x, 0), 1),
5774 XEXP (x, 1)));
5775 new = make_compound_operation (new, in_code);
5778 /* If we are have (and (rotate X C) M) and C is larger than the number
5779 of bits in M, this is an extraction. */
5781 else if (GET_CODE (XEXP (x, 0)) == ROTATE
5782 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
5783 && (i = exact_log2 (INTVAL (XEXP (x, 1)) + 1)) >= 0
5784 && i <= INTVAL (XEXP (XEXP (x, 0), 1)))
5786 new = make_compound_operation (XEXP (XEXP (x, 0), 0), next_code);
5787 new = make_extraction (mode, new,
5788 (GET_MODE_BITSIZE (mode)
5789 - INTVAL (XEXP (XEXP (x, 0), 1))),
5790 NULL_RTX, i, 1, 0, in_code == COMPARE);
5793 /* On machines without logical shifts, if the operand of the AND is
5794 a logical shift and our mask turns off all the propagated sign
5795 bits, we can replace the logical shift with an arithmetic shift. */
5796 else if (ashr_optab->handlers[(int) mode].insn_code != CODE_FOR_nothing
5797 && (lshr_optab->handlers[(int) mode].insn_code
5798 == CODE_FOR_nothing)
5799 && GET_CODE (XEXP (x, 0)) == LSHIFTRT
5800 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
5801 && INTVAL (XEXP (XEXP (x, 0), 1)) >= 0
5802 && INTVAL (XEXP (XEXP (x, 0), 1)) < HOST_BITS_PER_WIDE_INT
5803 && mode_width <= HOST_BITS_PER_WIDE_INT)
5805 unsigned HOST_WIDE_INT mask = GET_MODE_MASK (mode);
5807 mask >>= INTVAL (XEXP (XEXP (x, 0), 1));
5808 if ((INTVAL (XEXP (x, 1)) & ~mask) == 0)
5809 SUBST (XEXP (x, 0),
5810 gen_rtx_combine (ASHIFTRT, mode,
5811 make_compound_operation (XEXP (XEXP (x, 0), 0),
5812 next_code),
5813 XEXP (XEXP (x, 0), 1)));
5816 /* If the constant is one less than a power of two, this might be
5817 representable by an extraction even if no shift is present.
5818 If it doesn't end up being a ZERO_EXTEND, we will ignore it unless
5819 we are in a COMPARE. */
5820 else if ((i = exact_log2 (INTVAL (XEXP (x, 1)) + 1)) >= 0)
5821 new = make_extraction (mode,
5822 make_compound_operation (XEXP (x, 0),
5823 next_code),
5824 0, NULL_RTX, i, 1, 0, in_code == COMPARE);
5826 /* If we are in a comparison and this is an AND with a power of two,
5827 convert this into the appropriate bit extract. */
5828 else if (in_code == COMPARE
5829 && (i = exact_log2 (INTVAL (XEXP (x, 1)))) >= 0)
5830 new = make_extraction (mode,
5831 make_compound_operation (XEXP (x, 0),
5832 next_code),
5833 i, NULL_RTX, 1, 1, 0, 1);
5835 break;
5837 case LSHIFTRT:
5838 /* If the sign bit is known to be zero, replace this with an
5839 arithmetic shift. */
5840 if (ashr_optab->handlers[(int) mode].insn_code == CODE_FOR_nothing
5841 && lshr_optab->handlers[(int) mode].insn_code != CODE_FOR_nothing
5842 && mode_width <= HOST_BITS_PER_WIDE_INT
5843 && (nonzero_bits (XEXP (x, 0), mode) & (1 << (mode_width - 1))) == 0)
5845 new = gen_rtx_combine (ASHIFTRT, mode,
5846 make_compound_operation (XEXP (x, 0),
5847 next_code),
5848 XEXP (x, 1));
5849 break;
5852 /* ... fall through ... */
5854 case ASHIFTRT:
5855 lhs = XEXP (x, 0);
5856 rhs = XEXP (x, 1);
5858 /* If we have (ashiftrt (ashift foo C1) C2) with C2 >= C1,
5859 this is a SIGN_EXTRACT. */
5860 if (GET_CODE (rhs) == CONST_INT
5861 && GET_CODE (lhs) == ASHIFT
5862 && GET_CODE (XEXP (lhs, 1)) == CONST_INT
5863 && INTVAL (rhs) >= INTVAL (XEXP (lhs, 1)))
5865 new = make_compound_operation (XEXP (lhs, 0), next_code);
5866 new = make_extraction (mode, new,
5867 INTVAL (rhs) - INTVAL (XEXP (lhs, 1)),
5868 NULL_RTX, mode_width - INTVAL (rhs),
5869 code == LSHIFTRT, 0, in_code == COMPARE);
5872 /* See if we have operations between an ASHIFTRT and an ASHIFT.
5873 If so, try to merge the shifts into a SIGN_EXTEND. We could
5874 also do this for some cases of SIGN_EXTRACT, but it doesn't
5875 seem worth the effort; the case checked for occurs on Alpha. */
5877 if (GET_RTX_CLASS (GET_CODE (lhs)) != 'o'
5878 && ! (GET_CODE (lhs) == SUBREG
5879 && (GET_RTX_CLASS (GET_CODE (SUBREG_REG (lhs))) == 'o'))
5880 && GET_CODE (rhs) == CONST_INT
5881 && INTVAL (rhs) < HOST_BITS_PER_WIDE_INT
5882 && (new = extract_left_shift (lhs, INTVAL (rhs))) != 0)
5883 new = make_extraction (mode, make_compound_operation (new, next_code),
5884 0, NULL_RTX, mode_width - INTVAL (rhs),
5885 code == LSHIFTRT, 0, in_code == COMPARE);
5887 break;
5889 case SUBREG:
5890 /* Call ourselves recursively on the inner expression. If we are
5891 narrowing the object and it has a different RTL code from
5892 what it originally did, do this SUBREG as a force_to_mode. */
5894 tem = make_compound_operation (SUBREG_REG (x), in_code);
5895 if (GET_CODE (tem) != GET_CODE (SUBREG_REG (x))
5896 && GET_MODE_SIZE (mode) < GET_MODE_SIZE (GET_MODE (tem))
5897 && subreg_lowpart_p (x))
5899 rtx newer = force_to_mode (tem, mode,
5900 GET_MODE_MASK (mode), NULL_RTX, 0);
5902 /* If we have something other than a SUBREG, we might have
5903 done an expansion, so rerun outselves. */
5904 if (GET_CODE (newer) != SUBREG)
5905 newer = make_compound_operation (newer, in_code);
5907 return newer;
5911 if (new)
5913 x = gen_lowpart_for_combine (mode, new);
5914 code = GET_CODE (x);
5917 /* Now recursively process each operand of this operation. */
5918 fmt = GET_RTX_FORMAT (code);
5919 for (i = 0; i < GET_RTX_LENGTH (code); i++)
5920 if (fmt[i] == 'e')
5922 new = make_compound_operation (XEXP (x, i), next_code);
5923 SUBST (XEXP (x, i), new);
5926 return x;
5929 /* Given M see if it is a value that would select a field of bits
5930 within an item, but not the entire word. Return -1 if not.
5931 Otherwise, return the starting position of the field, where 0 is the
5932 low-order bit.
5934 *PLEN is set to the length of the field. */
5936 static int
5937 get_pos_from_mask (m, plen)
5938 unsigned HOST_WIDE_INT m;
5939 int *plen;
5941 /* Get the bit number of the first 1 bit from the right, -1 if none. */
5942 int pos = exact_log2 (m & - m);
5944 if (pos < 0)
5945 return -1;
5947 /* Now shift off the low-order zero bits and see if we have a power of
5948 two minus 1. */
5949 *plen = exact_log2 ((m >> pos) + 1);
5951 if (*plen <= 0)
5952 return -1;
5954 return pos;
5957 /* See if X can be simplified knowing that we will only refer to it in
5958 MODE and will only refer to those bits that are nonzero in MASK.
5959 If other bits are being computed or if masking operations are done
5960 that select a superset of the bits in MASK, they can sometimes be
5961 ignored.
5963 Return a possibly simplified expression, but always convert X to
5964 MODE. If X is a CONST_INT, AND the CONST_INT with MASK.
5966 Also, if REG is non-zero and X is a register equal in value to REG,
5967 replace X with REG.
5969 If JUST_SELECT is nonzero, don't optimize by noticing that bits in MASK
5970 are all off in X. This is used when X will be complemented, by either
5971 NOT, NEG, or XOR. */
5973 static rtx
5974 force_to_mode (x, mode, mask, reg, just_select)
5975 rtx x;
5976 enum machine_mode mode;
5977 unsigned HOST_WIDE_INT mask;
5978 rtx reg;
5979 int just_select;
5981 enum rtx_code code = GET_CODE (x);
5982 int next_select = just_select || code == XOR || code == NOT || code == NEG;
5983 enum machine_mode op_mode;
5984 unsigned HOST_WIDE_INT fuller_mask, nonzero;
5985 rtx op0, op1, temp;
5987 /* If this is a CALL or ASM_OPERANDS, don't do anything. Some of the
5988 code below will do the wrong thing since the mode of such an
5989 expression is VOIDmode. */
5990 if (code == CALL || code == ASM_OPERANDS)
5991 return x;
5993 /* We want to perform the operation is its present mode unless we know
5994 that the operation is valid in MODE, in which case we do the operation
5995 in MODE. */
5996 op_mode = ((GET_MODE_CLASS (mode) == GET_MODE_CLASS (GET_MODE (x))
5997 && code_to_optab[(int) code] != 0
5998 && (code_to_optab[(int) code]->handlers[(int) mode].insn_code
5999 != CODE_FOR_nothing))
6000 ? mode : GET_MODE (x));
6002 /* It is not valid to do a right-shift in a narrower mode
6003 than the one it came in with. */
6004 if ((code == LSHIFTRT || code == ASHIFTRT)
6005 && GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (GET_MODE (x)))
6006 op_mode = GET_MODE (x);
6008 /* Truncate MASK to fit OP_MODE. */
6009 if (op_mode)
6010 mask &= GET_MODE_MASK (op_mode);
6012 /* When we have an arithmetic operation, or a shift whose count we
6013 do not know, we need to assume that all bit the up to the highest-order
6014 bit in MASK will be needed. This is how we form such a mask. */
6015 if (op_mode)
6016 fuller_mask = (GET_MODE_BITSIZE (op_mode) >= HOST_BITS_PER_WIDE_INT
6017 ? GET_MODE_MASK (op_mode)
6018 : ((HOST_WIDE_INT) 1 << (floor_log2 (mask) + 1)) - 1);
6019 else
6020 fuller_mask = ~ (HOST_WIDE_INT) 0;
6022 /* Determine what bits of X are guaranteed to be (non)zero. */
6023 nonzero = nonzero_bits (x, mode);
6025 /* If none of the bits in X are needed, return a zero. */
6026 if (! just_select && (nonzero & mask) == 0)
6027 return const0_rtx;
6029 /* If X is a CONST_INT, return a new one. Do this here since the
6030 test below will fail. */
6031 if (GET_CODE (x) == CONST_INT)
6033 HOST_WIDE_INT cval = INTVAL (x) & mask;
6034 int width = GET_MODE_BITSIZE (mode);
6036 /* If MODE is narrower that HOST_WIDE_INT and CVAL is a negative
6037 number, sign extend it. */
6038 if (width > 0 && width < HOST_BITS_PER_WIDE_INT
6039 && (cval & ((HOST_WIDE_INT) 1 << (width - 1))) != 0)
6040 cval |= (HOST_WIDE_INT) -1 << width;
6042 return GEN_INT (cval);
6045 /* If X is narrower than MODE and we want all the bits in X's mode, just
6046 get X in the proper mode. */
6047 if (GET_MODE_SIZE (GET_MODE (x)) < GET_MODE_SIZE (mode)
6048 && (GET_MODE_MASK (GET_MODE (x)) & ~ mask) == 0)
6049 return gen_lowpart_for_combine (mode, x);
6051 /* If we aren't changing the mode, X is not a SUBREG, and all zero bits in
6052 MASK are already known to be zero in X, we need not do anything. */
6053 if (GET_MODE (x) == mode && code != SUBREG && (~ mask & nonzero) == 0)
6054 return x;
6056 switch (code)
6058 case CLOBBER:
6059 /* If X is a (clobber (const_int)), return it since we know we are
6060 generating something that won't match. */
6061 return x;
6063 case USE:
6064 /* X is a (use (mem ..)) that was made from a bit-field extraction that
6065 spanned the boundary of the MEM. If we are now masking so it is
6066 within that boundary, we don't need the USE any more. */
6067 if (! BITS_BIG_ENDIAN
6068 && (mask & ~ GET_MODE_MASK (GET_MODE (XEXP (x, 0)))) == 0)
6069 return force_to_mode (XEXP (x, 0), mode, mask, reg, next_select);
6070 break;
6072 case SIGN_EXTEND:
6073 case ZERO_EXTEND:
6074 case ZERO_EXTRACT:
6075 case SIGN_EXTRACT:
6076 x = expand_compound_operation (x);
6077 if (GET_CODE (x) != code)
6078 return force_to_mode (x, mode, mask, reg, next_select);
6079 break;
6081 case REG:
6082 if (reg != 0 && (rtx_equal_p (get_last_value (reg), x)
6083 || rtx_equal_p (reg, get_last_value (x))))
6084 x = reg;
6085 break;
6087 case SUBREG:
6088 if (subreg_lowpart_p (x)
6089 /* We can ignore the effect of this SUBREG if it narrows the mode or
6090 if the constant masks to zero all the bits the mode doesn't
6091 have. */
6092 && ((GET_MODE_SIZE (GET_MODE (x))
6093 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
6094 || (0 == (mask
6095 & GET_MODE_MASK (GET_MODE (x))
6096 & ~ GET_MODE_MASK (GET_MODE (SUBREG_REG (x)))))))
6097 return force_to_mode (SUBREG_REG (x), mode, mask, reg, next_select);
6098 break;
6100 case AND:
6101 /* If this is an AND with a constant, convert it into an AND
6102 whose constant is the AND of that constant with MASK. If it
6103 remains an AND of MASK, delete it since it is redundant. */
6105 if (GET_CODE (XEXP (x, 1)) == CONST_INT)
6107 x = simplify_and_const_int (x, op_mode, XEXP (x, 0),
6108 mask & INTVAL (XEXP (x, 1)));
6110 /* If X is still an AND, see if it is an AND with a mask that
6111 is just some low-order bits. If so, and it is MASK, we don't
6112 need it. */
6114 if (GET_CODE (x) == AND && GET_CODE (XEXP (x, 1)) == CONST_INT
6115 && INTVAL (XEXP (x, 1)) == mask)
6116 x = XEXP (x, 0);
6118 /* If it remains an AND, try making another AND with the bits
6119 in the mode mask that aren't in MASK turned on. If the
6120 constant in the AND is wide enough, this might make a
6121 cheaper constant. */
6123 if (GET_CODE (x) == AND && GET_CODE (XEXP (x, 1)) == CONST_INT
6124 && GET_MODE_MASK (GET_MODE (x)) != mask
6125 && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT)
6127 HOST_WIDE_INT cval = (INTVAL (XEXP (x, 1))
6128 | (GET_MODE_MASK (GET_MODE (x)) & ~ mask));
6129 int width = GET_MODE_BITSIZE (GET_MODE (x));
6130 rtx y;
6132 /* If MODE is narrower that HOST_WIDE_INT and CVAL is a negative
6133 number, sign extend it. */
6134 if (width > 0 && width < HOST_BITS_PER_WIDE_INT
6135 && (cval & ((HOST_WIDE_INT) 1 << (width - 1))) != 0)
6136 cval |= (HOST_WIDE_INT) -1 << width;
6138 y = gen_binary (AND, GET_MODE (x), XEXP (x, 0), GEN_INT (cval));
6139 if (rtx_cost (y, SET) < rtx_cost (x, SET))
6140 x = y;
6143 break;
6146 goto binop;
6148 case PLUS:
6149 /* In (and (plus FOO C1) M), if M is a mask that just turns off
6150 low-order bits (as in an alignment operation) and FOO is already
6151 aligned to that boundary, mask C1 to that boundary as well.
6152 This may eliminate that PLUS and, later, the AND. */
6155 int width = GET_MODE_BITSIZE (mode);
6156 unsigned HOST_WIDE_INT smask = mask;
6158 /* If MODE is narrower than HOST_WIDE_INT and mask is a negative
6159 number, sign extend it. */
6161 if (width < HOST_BITS_PER_WIDE_INT
6162 && (smask & ((HOST_WIDE_INT) 1 << (width - 1))) != 0)
6163 smask |= (HOST_WIDE_INT) -1 << width;
6165 if (GET_CODE (XEXP (x, 1)) == CONST_INT
6166 && exact_log2 (- smask) >= 0
6167 && (nonzero_bits (XEXP (x, 0), mode) & ~ mask) == 0
6168 && (INTVAL (XEXP (x, 1)) & ~ mask) != 0)
6169 return force_to_mode (plus_constant (XEXP (x, 0),
6170 INTVAL (XEXP (x, 1)) & mask),
6171 mode, mask, reg, next_select);
6174 /* ... fall through ... */
6176 case MINUS:
6177 case MULT:
6178 /* For PLUS, MINUS and MULT, we need any bits less significant than the
6179 most significant bit in MASK since carries from those bits will
6180 affect the bits we are interested in. */
6181 mask = fuller_mask;
6182 goto binop;
6184 case IOR:
6185 case XOR:
6186 /* If X is (ior (lshiftrt FOO C1) C2), try to commute the IOR and
6187 LSHIFTRT so we end up with an (and (lshiftrt (ior ...) ...) ...)
6188 operation which may be a bitfield extraction. Ensure that the
6189 constant we form is not wider than the mode of X. */
6191 if (GET_CODE (XEXP (x, 0)) == LSHIFTRT
6192 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
6193 && INTVAL (XEXP (XEXP (x, 0), 1)) >= 0
6194 && INTVAL (XEXP (XEXP (x, 0), 1)) < HOST_BITS_PER_WIDE_INT
6195 && GET_CODE (XEXP (x, 1)) == CONST_INT
6196 && ((INTVAL (XEXP (XEXP (x, 0), 1))
6197 + floor_log2 (INTVAL (XEXP (x, 1))))
6198 < GET_MODE_BITSIZE (GET_MODE (x)))
6199 && (INTVAL (XEXP (x, 1))
6200 & ~ nonzero_bits (XEXP (x, 0), GET_MODE (x))) == 0)
6202 temp = GEN_INT ((INTVAL (XEXP (x, 1)) & mask)
6203 << INTVAL (XEXP (XEXP (x, 0), 1)));
6204 temp = gen_binary (GET_CODE (x), GET_MODE (x),
6205 XEXP (XEXP (x, 0), 0), temp);
6206 x = gen_binary (LSHIFTRT, GET_MODE (x), temp,
6207 XEXP (XEXP (x, 0), 1));
6208 return force_to_mode (x, mode, mask, reg, next_select);
6211 binop:
6212 /* For most binary operations, just propagate into the operation and
6213 change the mode if we have an operation of that mode. */
6215 op0 = gen_lowpart_for_combine (op_mode,
6216 force_to_mode (XEXP (x, 0), mode, mask,
6217 reg, next_select));
6218 op1 = gen_lowpart_for_combine (op_mode,
6219 force_to_mode (XEXP (x, 1), mode, mask,
6220 reg, next_select));
6222 /* If OP1 is a CONST_INT and X is an IOR or XOR, clear bits outside
6223 MASK since OP1 might have been sign-extended but we never want
6224 to turn on extra bits, since combine might have previously relied
6225 on them being off. */
6226 if (GET_CODE (op1) == CONST_INT && (code == IOR || code == XOR)
6227 && (INTVAL (op1) & mask) != 0)
6228 op1 = GEN_INT (INTVAL (op1) & mask);
6230 if (op_mode != GET_MODE (x) || op0 != XEXP (x, 0) || op1 != XEXP (x, 1))
6231 x = gen_binary (code, op_mode, op0, op1);
6232 break;
6234 case ASHIFT:
6235 /* For left shifts, do the same, but just for the first operand.
6236 However, we cannot do anything with shifts where we cannot
6237 guarantee that the counts are smaller than the size of the mode
6238 because such a count will have a different meaning in a
6239 wider mode. */
6241 if (! (GET_CODE (XEXP (x, 1)) == CONST_INT
6242 && INTVAL (XEXP (x, 1)) >= 0
6243 && INTVAL (XEXP (x, 1)) < GET_MODE_BITSIZE (mode))
6244 && ! (GET_MODE (XEXP (x, 1)) != VOIDmode
6245 && (nonzero_bits (XEXP (x, 1), GET_MODE (XEXP (x, 1)))
6246 < (unsigned HOST_WIDE_INT) GET_MODE_BITSIZE (mode))))
6247 break;
6249 /* If the shift count is a constant and we can do arithmetic in
6250 the mode of the shift, refine which bits we need. Otherwise, use the
6251 conservative form of the mask. */
6252 if (GET_CODE (XEXP (x, 1)) == CONST_INT
6253 && INTVAL (XEXP (x, 1)) >= 0
6254 && INTVAL (XEXP (x, 1)) < GET_MODE_BITSIZE (op_mode)
6255 && GET_MODE_BITSIZE (op_mode) <= HOST_BITS_PER_WIDE_INT)
6256 mask >>= INTVAL (XEXP (x, 1));
6257 else
6258 mask = fuller_mask;
6260 op0 = gen_lowpart_for_combine (op_mode,
6261 force_to_mode (XEXP (x, 0), op_mode,
6262 mask, reg, next_select));
6264 if (op_mode != GET_MODE (x) || op0 != XEXP (x, 0))
6265 x = gen_binary (code, op_mode, op0, XEXP (x, 1));
6266 break;
6268 case LSHIFTRT:
6269 /* Here we can only do something if the shift count is a constant,
6270 this shift constant is valid for the host, and we can do arithmetic
6271 in OP_MODE. */
6273 if (GET_CODE (XEXP (x, 1)) == CONST_INT
6274 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT
6275 && GET_MODE_BITSIZE (op_mode) <= HOST_BITS_PER_WIDE_INT)
6277 rtx inner = XEXP (x, 0);
6279 /* Select the mask of the bits we need for the shift operand. */
6280 mask <<= INTVAL (XEXP (x, 1));
6282 /* We can only change the mode of the shift if we can do arithmetic
6283 in the mode of the shift and MASK is no wider than the width of
6284 OP_MODE. */
6285 if (GET_MODE_BITSIZE (op_mode) > HOST_BITS_PER_WIDE_INT
6286 || (mask & ~ GET_MODE_MASK (op_mode)) != 0)
6287 op_mode = GET_MODE (x);
6289 inner = force_to_mode (inner, op_mode, mask, reg, next_select);
6291 if (GET_MODE (x) != op_mode || inner != XEXP (x, 0))
6292 x = gen_binary (LSHIFTRT, op_mode, inner, XEXP (x, 1));
6295 /* If we have (and (lshiftrt FOO C1) C2) where the combination of the
6296 shift and AND produces only copies of the sign bit (C2 is one less
6297 than a power of two), we can do this with just a shift. */
6299 if (GET_CODE (x) == LSHIFTRT
6300 && GET_CODE (XEXP (x, 1)) == CONST_INT
6301 && ((INTVAL (XEXP (x, 1))
6302 + num_sign_bit_copies (XEXP (x, 0), GET_MODE (XEXP (x, 0))))
6303 >= GET_MODE_BITSIZE (GET_MODE (x)))
6304 && exact_log2 (mask + 1) >= 0
6305 && (num_sign_bit_copies (XEXP (x, 0), GET_MODE (XEXP (x, 0)))
6306 >= exact_log2 (mask + 1)))
6307 x = gen_binary (LSHIFTRT, GET_MODE (x), XEXP (x, 0),
6308 GEN_INT (GET_MODE_BITSIZE (GET_MODE (x))
6309 - exact_log2 (mask + 1)));
6310 break;
6312 case ASHIFTRT:
6313 /* If we are just looking for the sign bit, we don't need this shift at
6314 all, even if it has a variable count. */
6315 if (GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT
6316 && (mask == ((HOST_WIDE_INT) 1
6317 << (GET_MODE_BITSIZE (GET_MODE (x)) - 1))))
6318 return force_to_mode (XEXP (x, 0), mode, mask, reg, next_select);
6320 /* If this is a shift by a constant, get a mask that contains those bits
6321 that are not copies of the sign bit. We then have two cases: If
6322 MASK only includes those bits, this can be a logical shift, which may
6323 allow simplifications. If MASK is a single-bit field not within
6324 those bits, we are requesting a copy of the sign bit and hence can
6325 shift the sign bit to the appropriate location. */
6327 if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) >= 0
6328 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT)
6330 int i = -1;
6332 /* If the considered data is wider then HOST_WIDE_INT, we can't
6333 represent a mask for all its bits in a single scalar.
6334 But we only care about the lower bits, so calculate these. */
6336 if (GET_MODE_BITSIZE (GET_MODE (x)) > HOST_BITS_PER_WIDE_INT)
6338 nonzero = ~ (HOST_WIDE_INT) 0;
6340 /* GET_MODE_BITSIZE (GET_MODE (x)) - INTVAL (XEXP (x, 1))
6341 is the number of bits a full-width mask would have set.
6342 We need only shift if these are fewer than nonzero can
6343 hold. If not, we must keep all bits set in nonzero. */
6345 if (GET_MODE_BITSIZE (GET_MODE (x)) - INTVAL (XEXP (x, 1))
6346 < HOST_BITS_PER_WIDE_INT)
6347 nonzero >>= INTVAL (XEXP (x, 1))
6348 + HOST_BITS_PER_WIDE_INT
6349 - GET_MODE_BITSIZE (GET_MODE (x)) ;
6351 else
6353 nonzero = GET_MODE_MASK (GET_MODE (x));
6354 nonzero >>= INTVAL (XEXP (x, 1));
6357 if ((mask & ~ nonzero) == 0
6358 || (i = exact_log2 (mask)) >= 0)
6360 x = simplify_shift_const
6361 (x, LSHIFTRT, GET_MODE (x), XEXP (x, 0),
6362 i < 0 ? INTVAL (XEXP (x, 1))
6363 : GET_MODE_BITSIZE (GET_MODE (x)) - 1 - i);
6365 if (GET_CODE (x) != ASHIFTRT)
6366 return force_to_mode (x, mode, mask, reg, next_select);
6370 /* If MASK is 1, convert this to a LSHIFTRT. This can be done
6371 even if the shift count isn't a constant. */
6372 if (mask == 1)
6373 x = gen_binary (LSHIFTRT, GET_MODE (x), XEXP (x, 0), XEXP (x, 1));
6375 /* If this is a sign-extension operation that just affects bits
6376 we don't care about, remove it. Be sure the call above returned
6377 something that is still a shift. */
6379 if ((GET_CODE (x) == LSHIFTRT || GET_CODE (x) == ASHIFTRT)
6380 && GET_CODE (XEXP (x, 1)) == CONST_INT
6381 && INTVAL (XEXP (x, 1)) >= 0
6382 && (INTVAL (XEXP (x, 1))
6383 <= GET_MODE_BITSIZE (GET_MODE (x)) - (floor_log2 (mask) + 1))
6384 && GET_CODE (XEXP (x, 0)) == ASHIFT
6385 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
6386 && INTVAL (XEXP (XEXP (x, 0), 1)) == INTVAL (XEXP (x, 1)))
6387 return force_to_mode (XEXP (XEXP (x, 0), 0), mode, mask,
6388 reg, next_select);
6390 break;
6392 case ROTATE:
6393 case ROTATERT:
6394 /* If the shift count is constant and we can do computations
6395 in the mode of X, compute where the bits we care about are.
6396 Otherwise, we can't do anything. Don't change the mode of
6397 the shift or propagate MODE into the shift, though. */
6398 if (GET_CODE (XEXP (x, 1)) == CONST_INT
6399 && INTVAL (XEXP (x, 1)) >= 0)
6401 temp = simplify_binary_operation (code == ROTATE ? ROTATERT : ROTATE,
6402 GET_MODE (x), GEN_INT (mask),
6403 XEXP (x, 1));
6404 if (temp && GET_CODE(temp) == CONST_INT)
6405 SUBST (XEXP (x, 0),
6406 force_to_mode (XEXP (x, 0), GET_MODE (x),
6407 INTVAL (temp), reg, next_select));
6409 break;
6411 case NEG:
6412 /* If we just want the low-order bit, the NEG isn't needed since it
6413 won't change the low-order bit. */
6414 if (mask == 1)
6415 return force_to_mode (XEXP (x, 0), mode, mask, reg, just_select);
6417 /* We need any bits less significant than the most significant bit in
6418 MASK since carries from those bits will affect the bits we are
6419 interested in. */
6420 mask = fuller_mask;
6421 goto unop;
6423 case NOT:
6424 /* (not FOO) is (xor FOO CONST), so if FOO is an LSHIFTRT, we can do the
6425 same as the XOR case above. Ensure that the constant we form is not
6426 wider than the mode of X. */
6428 if (GET_CODE (XEXP (x, 0)) == LSHIFTRT
6429 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
6430 && INTVAL (XEXP (XEXP (x, 0), 1)) >= 0
6431 && (INTVAL (XEXP (XEXP (x, 0), 1)) + floor_log2 (mask)
6432 < GET_MODE_BITSIZE (GET_MODE (x)))
6433 && INTVAL (XEXP (XEXP (x, 0), 1)) < HOST_BITS_PER_WIDE_INT)
6435 temp = GEN_INT (mask << INTVAL (XEXP (XEXP (x, 0), 1)));
6436 temp = gen_binary (XOR, GET_MODE (x), XEXP (XEXP (x, 0), 0), temp);
6437 x = gen_binary (LSHIFTRT, GET_MODE (x), temp, XEXP (XEXP (x, 0), 1));
6439 return force_to_mode (x, mode, mask, reg, next_select);
6442 /* (and (not FOO) CONST) is (not (or FOO (not CONST))), so we must
6443 use the full mask inside the NOT. */
6444 mask = fuller_mask;
6446 unop:
6447 op0 = gen_lowpart_for_combine (op_mode,
6448 force_to_mode (XEXP (x, 0), mode, mask,
6449 reg, next_select));
6450 if (op_mode != GET_MODE (x) || op0 != XEXP (x, 0))
6451 x = gen_unary (code, op_mode, op_mode, op0);
6452 break;
6454 case NE:
6455 /* (and (ne FOO 0) CONST) can be (and FOO CONST) if CONST is included
6456 in STORE_FLAG_VALUE and FOO has a single bit that might be nonzero,
6457 which is equal to STORE_FLAG_VALUE. */
6458 if ((mask & ~ STORE_FLAG_VALUE) == 0 && XEXP (x, 1) == const0_rtx
6459 && exact_log2 (nonzero_bits (XEXP (x, 0), mode)) >= 0
6460 && nonzero_bits (XEXP (x, 0), mode) == STORE_FLAG_VALUE)
6461 return force_to_mode (XEXP (x, 0), mode, mask, reg, next_select);
6463 break;
6465 case IF_THEN_ELSE:
6466 /* We have no way of knowing if the IF_THEN_ELSE can itself be
6467 written in a narrower mode. We play it safe and do not do so. */
6469 SUBST (XEXP (x, 1),
6470 gen_lowpart_for_combine (GET_MODE (x),
6471 force_to_mode (XEXP (x, 1), mode,
6472 mask, reg, next_select)));
6473 SUBST (XEXP (x, 2),
6474 gen_lowpart_for_combine (GET_MODE (x),
6475 force_to_mode (XEXP (x, 2), mode,
6476 mask, reg,next_select)));
6477 break;
6480 /* Ensure we return a value of the proper mode. */
6481 return gen_lowpart_for_combine (mode, x);
6484 /* Return nonzero if X is an expression that has one of two values depending on
6485 whether some other value is zero or nonzero. In that case, we return the
6486 value that is being tested, *PTRUE is set to the value if the rtx being
6487 returned has a nonzero value, and *PFALSE is set to the other alternative.
6489 If we return zero, we set *PTRUE and *PFALSE to X. */
6491 static rtx
6492 if_then_else_cond (x, ptrue, pfalse)
6493 rtx x;
6494 rtx *ptrue, *pfalse;
6496 enum machine_mode mode = GET_MODE (x);
6497 enum rtx_code code = GET_CODE (x);
6498 int size = GET_MODE_BITSIZE (mode);
6499 rtx cond0, cond1, true0, true1, false0, false1;
6500 unsigned HOST_WIDE_INT nz;
6502 /* If this is a unary operation whose operand has one of two values, apply
6503 our opcode to compute those values. */
6504 if (GET_RTX_CLASS (code) == '1'
6505 && (cond0 = if_then_else_cond (XEXP (x, 0), &true0, &false0)) != 0)
6507 *ptrue = gen_unary (code, mode, GET_MODE (XEXP (x, 0)), true0);
6508 *pfalse = gen_unary (code, mode, GET_MODE (XEXP (x, 0)), false0);
6509 return cond0;
6512 /* If this is a COMPARE, do nothing, since the IF_THEN_ELSE we would
6513 make can't possibly match and would suppress other optimizations. */
6514 else if (code == COMPARE)
6517 /* If this is a binary operation, see if either side has only one of two
6518 values. If either one does or if both do and they are conditional on
6519 the same value, compute the new true and false values. */
6520 else if (GET_RTX_CLASS (code) == 'c' || GET_RTX_CLASS (code) == '2'
6521 || GET_RTX_CLASS (code) == '<')
6523 cond0 = if_then_else_cond (XEXP (x, 0), &true0, &false0);
6524 cond1 = if_then_else_cond (XEXP (x, 1), &true1, &false1);
6526 if ((cond0 != 0 || cond1 != 0)
6527 && ! (cond0 != 0 && cond1 != 0 && ! rtx_equal_p (cond0, cond1)))
6529 /* If if_then_else_cond returned zero, then true/false are the
6530 same rtl. We must copy one of them to prevent invalid rtl
6531 sharing. */
6532 if (cond0 == 0)
6533 true0 = copy_rtx (true0);
6534 else if (cond1 == 0)
6535 true1 = copy_rtx (true1);
6537 *ptrue = gen_binary (code, mode, true0, true1);
6538 *pfalse = gen_binary (code, mode, false0, false1);
6539 return cond0 ? cond0 : cond1;
6542 /* See if we have PLUS, IOR, XOR, MINUS or UMAX, where one of the
6543 operands is zero when the other is non-zero, and vice-versa,
6544 and STORE_FLAG_VALUE is 1 or -1. */
6546 if ((STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1)
6547 && (code == PLUS || code == IOR || code == XOR || code == MINUS
6548 || code == UMAX)
6549 && GET_CODE (XEXP (x, 0)) == MULT && GET_CODE (XEXP (x, 1)) == MULT)
6551 rtx op0 = XEXP (XEXP (x, 0), 1);
6552 rtx op1 = XEXP (XEXP (x, 1), 1);
6554 cond0 = XEXP (XEXP (x, 0), 0);
6555 cond1 = XEXP (XEXP (x, 1), 0);
6557 if (GET_RTX_CLASS (GET_CODE (cond0)) == '<'
6558 && GET_RTX_CLASS (GET_CODE (cond1)) == '<'
6559 && reversible_comparison_p (cond1)
6560 && ((GET_CODE (cond0) == reverse_condition (GET_CODE (cond1))
6561 && rtx_equal_p (XEXP (cond0, 0), XEXP (cond1, 0))
6562 && rtx_equal_p (XEXP (cond0, 1), XEXP (cond1, 1)))
6563 || ((swap_condition (GET_CODE (cond0))
6564 == reverse_condition (GET_CODE (cond1)))
6565 && rtx_equal_p (XEXP (cond0, 0), XEXP (cond1, 1))
6566 && rtx_equal_p (XEXP (cond0, 1), XEXP (cond1, 0))))
6567 && ! side_effects_p (x))
6569 *ptrue = gen_binary (MULT, mode, op0, const_true_rtx);
6570 *pfalse = gen_binary (MULT, mode,
6571 (code == MINUS
6572 ? gen_unary (NEG, mode, mode, op1) : op1),
6573 const_true_rtx);
6574 return cond0;
6578 /* Similarly for MULT, AND and UMIN, execpt that for these the result
6579 is always zero. */
6580 if ((STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1)
6581 && (code == MULT || code == AND || code == UMIN)
6582 && GET_CODE (XEXP (x, 0)) == MULT && GET_CODE (XEXP (x, 1)) == MULT)
6584 cond0 = XEXP (XEXP (x, 0), 0);
6585 cond1 = XEXP (XEXP (x, 1), 0);
6587 if (GET_RTX_CLASS (GET_CODE (cond0)) == '<'
6588 && GET_RTX_CLASS (GET_CODE (cond1)) == '<'
6589 && reversible_comparison_p (cond1)
6590 && ((GET_CODE (cond0) == reverse_condition (GET_CODE (cond1))
6591 && rtx_equal_p (XEXP (cond0, 0), XEXP (cond1, 0))
6592 && rtx_equal_p (XEXP (cond0, 1), XEXP (cond1, 1)))
6593 || ((swap_condition (GET_CODE (cond0))
6594 == reverse_condition (GET_CODE (cond1)))
6595 && rtx_equal_p (XEXP (cond0, 0), XEXP (cond1, 1))
6596 && rtx_equal_p (XEXP (cond0, 1), XEXP (cond1, 0))))
6597 && ! side_effects_p (x))
6599 *ptrue = *pfalse = const0_rtx;
6600 return cond0;
6605 else if (code == IF_THEN_ELSE)
6607 /* If we have IF_THEN_ELSE already, extract the condition and
6608 canonicalize it if it is NE or EQ. */
6609 cond0 = XEXP (x, 0);
6610 *ptrue = XEXP (x, 1), *pfalse = XEXP (x, 2);
6611 if (GET_CODE (cond0) == NE && XEXP (cond0, 1) == const0_rtx)
6612 return XEXP (cond0, 0);
6613 else if (GET_CODE (cond0) == EQ && XEXP (cond0, 1) == const0_rtx)
6615 *ptrue = XEXP (x, 2), *pfalse = XEXP (x, 1);
6616 return XEXP (cond0, 0);
6618 else
6619 return cond0;
6622 /* If X is a normal SUBREG with both inner and outer modes integral,
6623 we can narrow both the true and false values of the inner expression,
6624 if there is a condition. */
6625 else if (code == SUBREG && GET_MODE_CLASS (mode) == MODE_INT
6626 && GET_MODE_CLASS (GET_MODE (SUBREG_REG (x))) == MODE_INT
6627 && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (GET_MODE (SUBREG_REG (x)))
6628 && 0 != (cond0 = if_then_else_cond (SUBREG_REG (x),
6629 &true0, &false0)))
6631 *ptrue = force_to_mode (true0, mode, GET_MODE_MASK (mode), NULL_RTX, 0);
6632 *pfalse
6633 = force_to_mode (false0, mode, GET_MODE_MASK (mode), NULL_RTX, 0);
6635 return cond0;
6638 /* If X is a constant, this isn't special and will cause confusions
6639 if we treat it as such. Likewise if it is equivalent to a constant. */
6640 else if (CONSTANT_P (x)
6641 || ((cond0 = get_last_value (x)) != 0 && CONSTANT_P (cond0)))
6644 /* If X is known to be either 0 or -1, those are the true and
6645 false values when testing X. */
6646 else if (num_sign_bit_copies (x, mode) == size)
6648 *ptrue = constm1_rtx, *pfalse = const0_rtx;
6649 return x;
6652 /* Likewise for 0 or a single bit. */
6653 else if (exact_log2 (nz = nonzero_bits (x, mode)) >= 0)
6655 *ptrue = GEN_INT (nz), *pfalse = const0_rtx;
6656 return x;
6659 /* Otherwise fail; show no condition with true and false values the same. */
6660 *ptrue = *pfalse = x;
6661 return 0;
6664 /* Return the value of expression X given the fact that condition COND
6665 is known to be true when applied to REG as its first operand and VAL
6666 as its second. X is known to not be shared and so can be modified in
6667 place.
6669 We only handle the simplest cases, and specifically those cases that
6670 arise with IF_THEN_ELSE expressions. */
6672 static rtx
6673 known_cond (x, cond, reg, val)
6674 rtx x;
6675 enum rtx_code cond;
6676 rtx reg, val;
6678 enum rtx_code code = GET_CODE (x);
6679 rtx temp;
6680 char *fmt;
6681 int i, j;
6683 if (side_effects_p (x))
6684 return x;
6686 if (cond == EQ && rtx_equal_p (x, reg))
6687 return val;
6689 /* If X is (abs REG) and we know something about REG's relationship
6690 with zero, we may be able to simplify this. */
6692 if (code == ABS && rtx_equal_p (XEXP (x, 0), reg) && val == const0_rtx)
6693 switch (cond)
6695 case GE: case GT: case EQ:
6696 return XEXP (x, 0);
6697 case LT: case LE:
6698 return gen_unary (NEG, GET_MODE (XEXP (x, 0)), GET_MODE (XEXP (x, 0)),
6699 XEXP (x, 0));
6702 /* The only other cases we handle are MIN, MAX, and comparisons if the
6703 operands are the same as REG and VAL. */
6705 else if (GET_RTX_CLASS (code) == '<' || GET_RTX_CLASS (code) == 'c')
6707 if (rtx_equal_p (XEXP (x, 0), val))
6708 cond = swap_condition (cond), temp = val, val = reg, reg = temp;
6710 if (rtx_equal_p (XEXP (x, 0), reg) && rtx_equal_p (XEXP (x, 1), val))
6712 if (GET_RTX_CLASS (code) == '<')
6713 return (comparison_dominates_p (cond, code) ? const_true_rtx
6714 : (comparison_dominates_p (cond,
6715 reverse_condition (code))
6716 ? const0_rtx : x));
6718 else if (code == SMAX || code == SMIN
6719 || code == UMIN || code == UMAX)
6721 int unsignedp = (code == UMIN || code == UMAX);
6723 if (code == SMAX || code == UMAX)
6724 cond = reverse_condition (cond);
6726 switch (cond)
6728 case GE: case GT:
6729 return unsignedp ? x : XEXP (x, 1);
6730 case LE: case LT:
6731 return unsignedp ? x : XEXP (x, 0);
6732 case GEU: case GTU:
6733 return unsignedp ? XEXP (x, 1) : x;
6734 case LEU: case LTU:
6735 return unsignedp ? XEXP (x, 0) : x;
6741 fmt = GET_RTX_FORMAT (code);
6742 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
6744 if (fmt[i] == 'e')
6745 SUBST (XEXP (x, i), known_cond (XEXP (x, i), cond, reg, val));
6746 else if (fmt[i] == 'E')
6747 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
6748 SUBST (XVECEXP (x, i, j), known_cond (XVECEXP (x, i, j),
6749 cond, reg, val));
6752 return x;
6755 /* See if X and Y are equal for the purposes of seeing if we can rewrite an
6756 assignment as a field assignment. */
6758 static int
6759 rtx_equal_for_field_assignment_p (x, y)
6760 rtx x;
6761 rtx y;
6763 rtx last_x, last_y;
6765 if (x == y || rtx_equal_p (x, y))
6766 return 1;
6768 if (x == 0 || y == 0 || GET_MODE (x) != GET_MODE (y))
6769 return 0;
6771 /* Check for a paradoxical SUBREG of a MEM compared with the MEM.
6772 Note that all SUBREGs of MEM are paradoxical; otherwise they
6773 would have been rewritten. */
6774 if (GET_CODE (x) == MEM && GET_CODE (y) == SUBREG
6775 && GET_CODE (SUBREG_REG (y)) == MEM
6776 && rtx_equal_p (SUBREG_REG (y),
6777 gen_lowpart_for_combine (GET_MODE (SUBREG_REG (y)), x)))
6778 return 1;
6780 if (GET_CODE (y) == MEM && GET_CODE (x) == SUBREG
6781 && GET_CODE (SUBREG_REG (x)) == MEM
6782 && rtx_equal_p (SUBREG_REG (x),
6783 gen_lowpart_for_combine (GET_MODE (SUBREG_REG (x)), y)))
6784 return 1;
6786 last_x = get_last_value (x);
6787 last_y = get_last_value (y);
6789 return ((last_x != 0
6790 && GET_CODE (last_x) != CLOBBER
6791 && rtx_equal_for_field_assignment_p (last_x, y))
6792 || (last_y != 0
6793 && GET_CODE (last_y) != CLOBBER
6794 && rtx_equal_for_field_assignment_p (x, last_y))
6795 || (last_x != 0 && last_y != 0
6796 && GET_CODE (last_x) != CLOBBER
6797 && GET_CODE (last_y) != CLOBBER
6798 && rtx_equal_for_field_assignment_p (last_x, last_y)));
6801 /* See if X, a SET operation, can be rewritten as a bit-field assignment.
6802 Return that assignment if so.
6804 We only handle the most common cases. */
6806 static rtx
6807 make_field_assignment (x)
6808 rtx x;
6810 rtx dest = SET_DEST (x);
6811 rtx src = SET_SRC (x);
6812 rtx assign;
6813 rtx rhs, lhs;
6814 HOST_WIDE_INT c1;
6815 int pos, len;
6816 rtx other;
6817 enum machine_mode mode;
6819 /* If SRC was (and (not (ashift (const_int 1) POS)) DEST), this is
6820 a clear of a one-bit field. We will have changed it to
6821 (and (rotate (const_int -2) POS) DEST), so check for that. Also check
6822 for a SUBREG. */
6824 if (GET_CODE (src) == AND && GET_CODE (XEXP (src, 0)) == ROTATE
6825 && GET_CODE (XEXP (XEXP (src, 0), 0)) == CONST_INT
6826 && INTVAL (XEXP (XEXP (src, 0), 0)) == -2
6827 && rtx_equal_for_field_assignment_p (dest, XEXP (src, 1)))
6829 assign = make_extraction (VOIDmode, dest, 0, XEXP (XEXP (src, 0), 1),
6830 1, 1, 1, 0);
6831 if (assign != 0)
6832 return gen_rtx (SET, VOIDmode, assign, const0_rtx);
6833 return x;
6836 else if (GET_CODE (src) == AND && GET_CODE (XEXP (src, 0)) == SUBREG
6837 && subreg_lowpart_p (XEXP (src, 0))
6838 && (GET_MODE_SIZE (GET_MODE (XEXP (src, 0)))
6839 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (XEXP (src, 0)))))
6840 && GET_CODE (SUBREG_REG (XEXP (src, 0))) == ROTATE
6841 && INTVAL (XEXP (SUBREG_REG (XEXP (src, 0)), 0)) == -2
6842 && rtx_equal_for_field_assignment_p (dest, XEXP (src, 1)))
6844 assign = make_extraction (VOIDmode, dest, 0,
6845 XEXP (SUBREG_REG (XEXP (src, 0)), 1),
6846 1, 1, 1, 0);
6847 if (assign != 0)
6848 return gen_rtx (SET, VOIDmode, assign, const0_rtx);
6849 return x;
6852 /* If SRC is (ior (ashift (const_int 1) POS) DEST), this is a set of a
6853 one-bit field. */
6854 else if (GET_CODE (src) == IOR && GET_CODE (XEXP (src, 0)) == ASHIFT
6855 && XEXP (XEXP (src, 0), 0) == const1_rtx
6856 && rtx_equal_for_field_assignment_p (dest, XEXP (src, 1)))
6858 assign = make_extraction (VOIDmode, dest, 0, XEXP (XEXP (src, 0), 1),
6859 1, 1, 1, 0);
6860 if (assign != 0)
6861 return gen_rtx (SET, VOIDmode, assign, const1_rtx);
6862 return x;
6865 /* The other case we handle is assignments into a constant-position
6866 field. They look like (ior/xor (and DEST C1) OTHER). If C1 represents
6867 a mask that has all one bits except for a group of zero bits and
6868 OTHER is known to have zeros where C1 has ones, this is such an
6869 assignment. Compute the position and length from C1. Shift OTHER
6870 to the appropriate position, force it to the required mode, and
6871 make the extraction. Check for the AND in both operands. */
6873 if (GET_CODE (src) != IOR && GET_CODE (src) != XOR)
6874 return x;
6876 rhs = expand_compound_operation (XEXP (src, 0));
6877 lhs = expand_compound_operation (XEXP (src, 1));
6879 if (GET_CODE (rhs) == AND
6880 && GET_CODE (XEXP (rhs, 1)) == CONST_INT
6881 && rtx_equal_for_field_assignment_p (XEXP (rhs, 0), dest))
6882 c1 = INTVAL (XEXP (rhs, 1)), other = lhs;
6883 else if (GET_CODE (lhs) == AND
6884 && GET_CODE (XEXP (lhs, 1)) == CONST_INT
6885 && rtx_equal_for_field_assignment_p (XEXP (lhs, 0), dest))
6886 c1 = INTVAL (XEXP (lhs, 1)), other = rhs;
6887 else
6888 return x;
6890 pos = get_pos_from_mask ((~ c1) & GET_MODE_MASK (GET_MODE (dest)), &len);
6891 if (pos < 0 || pos + len > GET_MODE_BITSIZE (GET_MODE (dest))
6892 || (GET_MODE_BITSIZE (GET_MODE (other)) <= HOST_BITS_PER_WIDE_INT
6893 && (c1 & nonzero_bits (other, GET_MODE (other))) != 0))
6894 return x;
6896 assign = make_extraction (VOIDmode, dest, pos, NULL_RTX, len, 1, 1, 0);
6897 if (assign == 0)
6898 return x;
6900 /* The mode to use for the source is the mode of the assignment, or of
6901 what is inside a possible STRICT_LOW_PART. */
6902 mode = (GET_CODE (assign) == STRICT_LOW_PART
6903 ? GET_MODE (XEXP (assign, 0)) : GET_MODE (assign));
6905 /* Shift OTHER right POS places and make it the source, restricting it
6906 to the proper length and mode. */
6908 src = force_to_mode (simplify_shift_const (NULL_RTX, LSHIFTRT,
6909 GET_MODE (src), other, pos),
6910 mode,
6911 GET_MODE_BITSIZE (mode) >= HOST_BITS_PER_WIDE_INT
6912 ? GET_MODE_MASK (mode)
6913 : ((HOST_WIDE_INT) 1 << len) - 1,
6914 dest, 0);
6916 return gen_rtx_combine (SET, VOIDmode, assign, src);
6919 /* See if X is of the form (+ (* a c) (* b c)) and convert to (* (+ a b) c)
6920 if so. */
6922 static rtx
6923 apply_distributive_law (x)
6924 rtx x;
6926 enum rtx_code code = GET_CODE (x);
6927 rtx lhs, rhs, other;
6928 rtx tem;
6929 enum rtx_code inner_code;
6931 /* Distributivity is not true for floating point.
6932 It can change the value. So don't do it.
6933 -- rms and moshier@world.std.com. */
6934 if (FLOAT_MODE_P (GET_MODE (x)))
6935 return x;
6937 /* The outer operation can only be one of the following: */
6938 if (code != IOR && code != AND && code != XOR
6939 && code != PLUS && code != MINUS)
6940 return x;
6942 lhs = XEXP (x, 0), rhs = XEXP (x, 1);
6944 /* If either operand is a primitive we can't do anything, so get out
6945 fast. */
6946 if (GET_RTX_CLASS (GET_CODE (lhs)) == 'o'
6947 || GET_RTX_CLASS (GET_CODE (rhs)) == 'o')
6948 return x;
6950 lhs = expand_compound_operation (lhs);
6951 rhs = expand_compound_operation (rhs);
6952 inner_code = GET_CODE (lhs);
6953 if (inner_code != GET_CODE (rhs))
6954 return x;
6956 /* See if the inner and outer operations distribute. */
6957 switch (inner_code)
6959 case LSHIFTRT:
6960 case ASHIFTRT:
6961 case AND:
6962 case IOR:
6963 /* These all distribute except over PLUS. */
6964 if (code == PLUS || code == MINUS)
6965 return x;
6966 break;
6968 case MULT:
6969 if (code != PLUS && code != MINUS)
6970 return x;
6971 break;
6973 case ASHIFT:
6974 /* This is also a multiply, so it distributes over everything. */
6975 break;
6977 case SUBREG:
6978 /* Non-paradoxical SUBREGs distributes over all operations, provided
6979 the inner modes and word numbers are the same, this is an extraction
6980 of a low-order part, we don't convert an fp operation to int or
6981 vice versa, and we would not be converting a single-word
6982 operation into a multi-word operation. The latter test is not
6983 required, but it prevents generating unneeded multi-word operations.
6984 Some of the previous tests are redundant given the latter test, but
6985 are retained because they are required for correctness.
6987 We produce the result slightly differently in this case. */
6989 if (GET_MODE (SUBREG_REG (lhs)) != GET_MODE (SUBREG_REG (rhs))
6990 || SUBREG_WORD (lhs) != SUBREG_WORD (rhs)
6991 || ! subreg_lowpart_p (lhs)
6992 || (GET_MODE_CLASS (GET_MODE (lhs))
6993 != GET_MODE_CLASS (GET_MODE (SUBREG_REG (lhs))))
6994 || (GET_MODE_SIZE (GET_MODE (lhs))
6995 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (lhs))))
6996 || GET_MODE_SIZE (GET_MODE (SUBREG_REG (lhs))) > UNITS_PER_WORD)
6997 return x;
6999 tem = gen_binary (code, GET_MODE (SUBREG_REG (lhs)),
7000 SUBREG_REG (lhs), SUBREG_REG (rhs));
7001 return gen_lowpart_for_combine (GET_MODE (x), tem);
7003 default:
7004 return x;
7007 /* Set LHS and RHS to the inner operands (A and B in the example
7008 above) and set OTHER to the common operand (C in the example).
7009 These is only one way to do this unless the inner operation is
7010 commutative. */
7011 if (GET_RTX_CLASS (inner_code) == 'c'
7012 && rtx_equal_p (XEXP (lhs, 0), XEXP (rhs, 0)))
7013 other = XEXP (lhs, 0), lhs = XEXP (lhs, 1), rhs = XEXP (rhs, 1);
7014 else if (GET_RTX_CLASS (inner_code) == 'c'
7015 && rtx_equal_p (XEXP (lhs, 0), XEXP (rhs, 1)))
7016 other = XEXP (lhs, 0), lhs = XEXP (lhs, 1), rhs = XEXP (rhs, 0);
7017 else if (GET_RTX_CLASS (inner_code) == 'c'
7018 && rtx_equal_p (XEXP (lhs, 1), XEXP (rhs, 0)))
7019 other = XEXP (lhs, 1), lhs = XEXP (lhs, 0), rhs = XEXP (rhs, 1);
7020 else if (rtx_equal_p (XEXP (lhs, 1), XEXP (rhs, 1)))
7021 other = XEXP (lhs, 1), lhs = XEXP (lhs, 0), rhs = XEXP (rhs, 0);
7022 else
7023 return x;
7025 /* Form the new inner operation, seeing if it simplifies first. */
7026 tem = gen_binary (code, GET_MODE (x), lhs, rhs);
7028 /* There is one exception to the general way of distributing:
7029 (a ^ b) | (a ^ c) -> (~a) & (b ^ c) */
7030 if (code == XOR && inner_code == IOR)
7032 inner_code = AND;
7033 other = gen_unary (NOT, GET_MODE (x), GET_MODE (x), other);
7036 /* We may be able to continuing distributing the result, so call
7037 ourselves recursively on the inner operation before forming the
7038 outer operation, which we return. */
7039 return gen_binary (inner_code, GET_MODE (x),
7040 apply_distributive_law (tem), other);
7043 /* We have X, a logical `and' of VAROP with the constant CONSTOP, to be done
7044 in MODE.
7046 Return an equivalent form, if different from X. Otherwise, return X. If
7047 X is zero, we are to always construct the equivalent form. */
7049 static rtx
7050 simplify_and_const_int (x, mode, varop, constop)
7051 rtx x;
7052 enum machine_mode mode;
7053 rtx varop;
7054 unsigned HOST_WIDE_INT constop;
7056 unsigned HOST_WIDE_INT nonzero;
7057 int width = GET_MODE_BITSIZE (mode);
7058 int i;
7060 /* Simplify VAROP knowing that we will be only looking at some of the
7061 bits in it. */
7062 varop = force_to_mode (varop, mode, constop, NULL_RTX, 0);
7064 /* If VAROP is a CLOBBER, we will fail so return it; if it is a
7065 CONST_INT, we are done. */
7066 if (GET_CODE (varop) == CLOBBER || GET_CODE (varop) == CONST_INT)
7067 return varop;
7069 /* See what bits may be nonzero in VAROP. Unlike the general case of
7070 a call to nonzero_bits, here we don't care about bits outside
7071 MODE. */
7073 nonzero = nonzero_bits (varop, mode) & GET_MODE_MASK (mode);
7075 /* If this would be an entire word for the target, but is not for
7076 the host, then sign-extend on the host so that the number will look
7077 the same way on the host that it would on the target.
7079 For example, when building a 64 bit alpha hosted 32 bit sparc
7080 targeted compiler, then we want the 32 bit unsigned value -1 to be
7081 represented as a 64 bit value -1, and not as 0x00000000ffffffff.
7082 The later confuses the sparc backend. */
7084 if (BITS_PER_WORD < HOST_BITS_PER_WIDE_INT && BITS_PER_WORD == width
7085 && (nonzero & ((HOST_WIDE_INT) 1 << (width - 1))))
7086 nonzero |= ((HOST_WIDE_INT) (-1) << width);
7088 /* Turn off all bits in the constant that are known to already be zero.
7089 Thus, if the AND isn't needed at all, we will have CONSTOP == NONZERO_BITS
7090 which is tested below. */
7092 constop &= nonzero;
7094 /* If we don't have any bits left, return zero. */
7095 if (constop == 0)
7096 return const0_rtx;
7098 /* If VAROP is a NEG of something known to be zero or 1 and CONSTOP is
7099 a power of two, we can replace this with a ASHIFT. */
7100 if (GET_CODE (varop) == NEG && nonzero_bits (XEXP (varop, 0), mode) == 1
7101 && (i = exact_log2 (constop)) >= 0)
7102 return simplify_shift_const (NULL_RTX, ASHIFT, mode, XEXP (varop, 0), i);
7104 /* If VAROP is an IOR or XOR, apply the AND to both branches of the IOR
7105 or XOR, then try to apply the distributive law. This may eliminate
7106 operations if either branch can be simplified because of the AND.
7107 It may also make some cases more complex, but those cases probably
7108 won't match a pattern either with or without this. */
7110 if (GET_CODE (varop) == IOR || GET_CODE (varop) == XOR)
7111 return
7112 gen_lowpart_for_combine
7113 (mode,
7114 apply_distributive_law
7115 (gen_binary (GET_CODE (varop), GET_MODE (varop),
7116 simplify_and_const_int (NULL_RTX, GET_MODE (varop),
7117 XEXP (varop, 0), constop),
7118 simplify_and_const_int (NULL_RTX, GET_MODE (varop),
7119 XEXP (varop, 1), constop))));
7121 /* Get VAROP in MODE. Try to get a SUBREG if not. Don't make a new SUBREG
7122 if we already had one (just check for the simplest cases). */
7123 if (x && GET_CODE (XEXP (x, 0)) == SUBREG
7124 && GET_MODE (XEXP (x, 0)) == mode
7125 && SUBREG_REG (XEXP (x, 0)) == varop)
7126 varop = XEXP (x, 0);
7127 else
7128 varop = gen_lowpart_for_combine (mode, varop);
7130 /* If we can't make the SUBREG, try to return what we were given. */
7131 if (GET_CODE (varop) == CLOBBER)
7132 return x ? x : varop;
7134 /* If we are only masking insignificant bits, return VAROP. */
7135 if (constop == nonzero)
7136 x = varop;
7138 /* Otherwise, return an AND. See how much, if any, of X we can use. */
7139 else if (x == 0 || GET_CODE (x) != AND || GET_MODE (x) != mode)
7140 x = gen_binary (AND, mode, varop, GEN_INT (constop));
7142 else
7144 if (GET_CODE (XEXP (x, 1)) != CONST_INT
7145 || INTVAL (XEXP (x, 1)) != constop)
7146 SUBST (XEXP (x, 1), GEN_INT (constop));
7148 SUBST (XEXP (x, 0), varop);
7151 return x;
7154 /* We let num_sign_bit_copies recur into nonzero_bits as that is useful.
7155 We don't let nonzero_bits recur into num_sign_bit_copies, because that
7156 is less useful. We can't allow both, because that results in exponential
7157 run time recusion. There is a nullstone testcase that triggered
7158 this. This macro avoids accidental uses of num_sign_bit_copies. */
7159 #define num_sign_bit_copies()
7161 /* Given an expression, X, compute which bits in X can be non-zero.
7162 We don't care about bits outside of those defined in MODE.
7164 For most X this is simply GET_MODE_MASK (GET_MODE (MODE)), but if X is
7165 a shift, AND, or zero_extract, we can do better. */
7167 static unsigned HOST_WIDE_INT
7168 nonzero_bits (x, mode)
7169 rtx x;
7170 enum machine_mode mode;
7172 unsigned HOST_WIDE_INT nonzero = GET_MODE_MASK (mode);
7173 unsigned HOST_WIDE_INT inner_nz;
7174 enum rtx_code code;
7175 int mode_width = GET_MODE_BITSIZE (mode);
7176 rtx tem;
7178 /* For floating-point values, assume all bits are needed. */
7179 if (FLOAT_MODE_P (GET_MODE (x)) || FLOAT_MODE_P (mode))
7180 return nonzero;
7182 /* If X is wider than MODE, use its mode instead. */
7183 if (GET_MODE_BITSIZE (GET_MODE (x)) > mode_width)
7185 mode = GET_MODE (x);
7186 nonzero = GET_MODE_MASK (mode);
7187 mode_width = GET_MODE_BITSIZE (mode);
7190 if (mode_width > HOST_BITS_PER_WIDE_INT)
7191 /* Our only callers in this case look for single bit values. So
7192 just return the mode mask. Those tests will then be false. */
7193 return nonzero;
7195 #ifndef WORD_REGISTER_OPERATIONS
7196 /* If MODE is wider than X, but both are a single word for both the host
7197 and target machines, we can compute this from which bits of the
7198 object might be nonzero in its own mode, taking into account the fact
7199 that on many CISC machines, accessing an object in a wider mode
7200 causes the high-order bits to become undefined. So they are
7201 not known to be zero. */
7203 if (GET_MODE (x) != VOIDmode && GET_MODE (x) != mode
7204 && GET_MODE_BITSIZE (GET_MODE (x)) <= BITS_PER_WORD
7205 && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT
7206 && GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (GET_MODE (x)))
7208 nonzero &= nonzero_bits (x, GET_MODE (x));
7209 nonzero |= GET_MODE_MASK (mode) & ~ GET_MODE_MASK (GET_MODE (x));
7210 return nonzero;
7212 #endif
7214 code = GET_CODE (x);
7215 switch (code)
7217 case REG:
7218 #ifdef POINTERS_EXTEND_UNSIGNED
7219 /* If pointers extend unsigned and this is a pointer in Pmode, say that
7220 all the bits above ptr_mode are known to be zero. */
7221 if (POINTERS_EXTEND_UNSIGNED && GET_MODE (x) == Pmode
7222 && REGNO_POINTER_FLAG (REGNO (x)))
7223 nonzero &= GET_MODE_MASK (ptr_mode);
7224 #endif
7226 #ifdef STACK_BOUNDARY
7227 /* If this is the stack pointer, we may know something about its
7228 alignment. If PUSH_ROUNDING is defined, it is possible for the
7229 stack to be momentarily aligned only to that amount, so we pick
7230 the least alignment. */
7232 /* We can't check for arg_pointer_rtx here, because it is not
7233 guaranteed to have as much alignment as the stack pointer.
7234 In particular, in the Irix6 n64 ABI, the stack has 128 bit
7235 alignment but the argument pointer has only 64 bit alignment. */
7237 if (x == stack_pointer_rtx || x == frame_pointer_rtx
7238 || x == hard_frame_pointer_rtx
7239 || (REGNO (x) >= FIRST_VIRTUAL_REGISTER
7240 && REGNO (x) <= LAST_VIRTUAL_REGISTER))
7242 int sp_alignment = STACK_BOUNDARY / BITS_PER_UNIT;
7244 #ifdef PUSH_ROUNDING
7245 if (REGNO (x) == STACK_POINTER_REGNUM)
7246 sp_alignment = MIN (PUSH_ROUNDING (1), sp_alignment);
7247 #endif
7249 /* We must return here, otherwise we may get a worse result from
7250 one of the choices below. There is nothing useful below as
7251 far as the stack pointer is concerned. */
7252 return nonzero &= ~ (sp_alignment - 1);
7254 #endif
7256 /* If X is a register whose nonzero bits value is current, use it.
7257 Otherwise, if X is a register whose value we can find, use that
7258 value. Otherwise, use the previously-computed global nonzero bits
7259 for this register. */
7261 if (reg_last_set_value[REGNO (x)] != 0
7262 && reg_last_set_mode[REGNO (x)] == mode
7263 && (REG_N_SETS (REGNO (x)) == 1
7264 || reg_last_set_label[REGNO (x)] == label_tick)
7265 && INSN_CUID (reg_last_set[REGNO (x)]) < subst_low_cuid)
7266 return reg_last_set_nonzero_bits[REGNO (x)];
7268 tem = get_last_value (x);
7270 if (tem)
7272 #ifdef SHORT_IMMEDIATES_SIGN_EXTEND
7273 /* If X is narrower than MODE and TEM is a non-negative
7274 constant that would appear negative in the mode of X,
7275 sign-extend it for use in reg_nonzero_bits because some
7276 machines (maybe most) will actually do the sign-extension
7277 and this is the conservative approach.
7279 ??? For 2.5, try to tighten up the MD files in this regard
7280 instead of this kludge. */
7282 if (GET_MODE_BITSIZE (GET_MODE (x)) < mode_width
7283 && GET_CODE (tem) == CONST_INT
7284 && INTVAL (tem) > 0
7285 && 0 != (INTVAL (tem)
7286 & ((HOST_WIDE_INT) 1
7287 << (GET_MODE_BITSIZE (GET_MODE (x)) - 1))))
7288 tem = GEN_INT (INTVAL (tem)
7289 | ((HOST_WIDE_INT) (-1)
7290 << GET_MODE_BITSIZE (GET_MODE (x))));
7291 #endif
7292 return nonzero_bits (tem, mode);
7294 else if (nonzero_sign_valid && reg_nonzero_bits[REGNO (x)])
7295 return reg_nonzero_bits[REGNO (x)] & nonzero;
7296 else
7297 return nonzero;
7299 case CONST_INT:
7300 #ifdef SHORT_IMMEDIATES_SIGN_EXTEND
7301 /* If X is negative in MODE, sign-extend the value. */
7302 if (INTVAL (x) > 0 && mode_width < BITS_PER_WORD
7303 && 0 != (INTVAL (x) & ((HOST_WIDE_INT) 1 << (mode_width - 1))))
7304 return (INTVAL (x) | ((HOST_WIDE_INT) (-1) << mode_width));
7305 #endif
7307 return INTVAL (x);
7309 case MEM:
7310 #ifdef LOAD_EXTEND_OP
7311 /* In many, if not most, RISC machines, reading a byte from memory
7312 zeros the rest of the register. Noticing that fact saves a lot
7313 of extra zero-extends. */
7314 if (LOAD_EXTEND_OP (GET_MODE (x)) == ZERO_EXTEND)
7315 nonzero &= GET_MODE_MASK (GET_MODE (x));
7316 #endif
7317 break;
7319 case EQ: case NE:
7320 case GT: case GTU:
7321 case LT: case LTU:
7322 case GE: case GEU:
7323 case LE: case LEU:
7325 /* If this produces an integer result, we know which bits are set.
7326 Code here used to clear bits outside the mode of X, but that is
7327 now done above. */
7329 if (GET_MODE_CLASS (mode) == MODE_INT
7330 && mode_width <= HOST_BITS_PER_WIDE_INT)
7331 nonzero = STORE_FLAG_VALUE;
7332 break;
7334 case NEG:
7335 #if 0
7336 /* Disabled to avoid exponential mutual recursion between nonzero_bits
7337 and num_sign_bit_copies. */
7338 if (num_sign_bit_copies (XEXP (x, 0), GET_MODE (x))
7339 == GET_MODE_BITSIZE (GET_MODE (x)))
7340 nonzero = 1;
7341 #endif
7343 if (GET_MODE_SIZE (GET_MODE (x)) < mode_width)
7344 nonzero |= (GET_MODE_MASK (mode) & ~ GET_MODE_MASK (GET_MODE (x)));
7345 break;
7347 case ABS:
7348 #if 0
7349 /* Disabled to avoid exponential mutual recursion between nonzero_bits
7350 and num_sign_bit_copies. */
7351 if (num_sign_bit_copies (XEXP (x, 0), GET_MODE (x))
7352 == GET_MODE_BITSIZE (GET_MODE (x)))
7353 nonzero = 1;
7354 #endif
7355 break;
7357 case TRUNCATE:
7358 nonzero &= (nonzero_bits (XEXP (x, 0), mode) & GET_MODE_MASK (mode));
7359 break;
7361 case ZERO_EXTEND:
7362 nonzero &= nonzero_bits (XEXP (x, 0), mode);
7363 if (GET_MODE (XEXP (x, 0)) != VOIDmode)
7364 nonzero &= GET_MODE_MASK (GET_MODE (XEXP (x, 0)));
7365 break;
7367 case SIGN_EXTEND:
7368 /* If the sign bit is known clear, this is the same as ZERO_EXTEND.
7369 Otherwise, show all the bits in the outer mode but not the inner
7370 may be non-zero. */
7371 inner_nz = nonzero_bits (XEXP (x, 0), mode);
7372 if (GET_MODE (XEXP (x, 0)) != VOIDmode)
7374 inner_nz &= GET_MODE_MASK (GET_MODE (XEXP (x, 0)));
7375 if (inner_nz
7376 & (((HOST_WIDE_INT) 1
7377 << (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) - 1))))
7378 inner_nz |= (GET_MODE_MASK (mode)
7379 & ~ GET_MODE_MASK (GET_MODE (XEXP (x, 0))));
7382 nonzero &= inner_nz;
7383 break;
7385 case AND:
7386 nonzero &= (nonzero_bits (XEXP (x, 0), mode)
7387 & nonzero_bits (XEXP (x, 1), mode));
7388 break;
7390 case XOR: case IOR:
7391 case UMIN: case UMAX: case SMIN: case SMAX:
7392 nonzero &= (nonzero_bits (XEXP (x, 0), mode)
7393 | nonzero_bits (XEXP (x, 1), mode));
7394 break;
7396 case PLUS: case MINUS:
7397 case MULT:
7398 case DIV: case UDIV:
7399 case MOD: case UMOD:
7400 /* We can apply the rules of arithmetic to compute the number of
7401 high- and low-order zero bits of these operations. We start by
7402 computing the width (position of the highest-order non-zero bit)
7403 and the number of low-order zero bits for each value. */
7405 unsigned HOST_WIDE_INT nz0 = nonzero_bits (XEXP (x, 0), mode);
7406 unsigned HOST_WIDE_INT nz1 = nonzero_bits (XEXP (x, 1), mode);
7407 int width0 = floor_log2 (nz0) + 1;
7408 int width1 = floor_log2 (nz1) + 1;
7409 int low0 = floor_log2 (nz0 & -nz0);
7410 int low1 = floor_log2 (nz1 & -nz1);
7411 HOST_WIDE_INT op0_maybe_minusp
7412 = (nz0 & ((HOST_WIDE_INT) 1 << (mode_width - 1)));
7413 HOST_WIDE_INT op1_maybe_minusp
7414 = (nz1 & ((HOST_WIDE_INT) 1 << (mode_width - 1)));
7415 int result_width = mode_width;
7416 int result_low = 0;
7418 switch (code)
7420 case PLUS:
7421 result_width = MAX (width0, width1) + 1;
7422 result_low = MIN (low0, low1);
7423 break;
7424 case MINUS:
7425 result_low = MIN (low0, low1);
7426 break;
7427 case MULT:
7428 result_width = width0 + width1;
7429 result_low = low0 + low1;
7430 break;
7431 case DIV:
7432 if (! op0_maybe_minusp && ! op1_maybe_minusp)
7433 result_width = width0;
7434 break;
7435 case UDIV:
7436 result_width = width0;
7437 break;
7438 case MOD:
7439 if (! op0_maybe_minusp && ! op1_maybe_minusp)
7440 result_width = MIN (width0, width1);
7441 result_low = MIN (low0, low1);
7442 break;
7443 case UMOD:
7444 result_width = MIN (width0, width1);
7445 result_low = MIN (low0, low1);
7446 break;
7449 if (result_width < mode_width)
7450 nonzero &= ((HOST_WIDE_INT) 1 << result_width) - 1;
7452 if (result_low > 0)
7453 nonzero &= ~ (((HOST_WIDE_INT) 1 << result_low) - 1);
7455 break;
7457 case ZERO_EXTRACT:
7458 if (GET_CODE (XEXP (x, 1)) == CONST_INT
7459 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT)
7460 nonzero &= ((HOST_WIDE_INT) 1 << INTVAL (XEXP (x, 1))) - 1;
7461 break;
7463 case SUBREG:
7464 /* If this is a SUBREG formed for a promoted variable that has
7465 been zero-extended, we know that at least the high-order bits
7466 are zero, though others might be too. */
7468 if (SUBREG_PROMOTED_VAR_P (x) && SUBREG_PROMOTED_UNSIGNED_P (x))
7469 nonzero = (GET_MODE_MASK (GET_MODE (x))
7470 & nonzero_bits (SUBREG_REG (x), GET_MODE (x)));
7472 /* If the inner mode is a single word for both the host and target
7473 machines, we can compute this from which bits of the inner
7474 object might be nonzero. */
7475 if (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))) <= BITS_PER_WORD
7476 && (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x)))
7477 <= HOST_BITS_PER_WIDE_INT))
7479 nonzero &= nonzero_bits (SUBREG_REG (x), mode);
7481 #ifndef WORD_REGISTER_OPERATIONS
7482 /* On many CISC machines, accessing an object in a wider mode
7483 causes the high-order bits to become undefined. So they are
7484 not known to be zero. */
7485 if (GET_MODE_SIZE (GET_MODE (x))
7486 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
7487 nonzero |= (GET_MODE_MASK (GET_MODE (x))
7488 & ~ GET_MODE_MASK (GET_MODE (SUBREG_REG (x))));
7489 #endif
7491 break;
7493 case ASHIFTRT:
7494 case LSHIFTRT:
7495 case ASHIFT:
7496 case ROTATE:
7497 /* The nonzero bits are in two classes: any bits within MODE
7498 that aren't in GET_MODE (x) are always significant. The rest of the
7499 nonzero bits are those that are significant in the operand of
7500 the shift when shifted the appropriate number of bits. This
7501 shows that high-order bits are cleared by the right shift and
7502 low-order bits by left shifts. */
7503 if (GET_CODE (XEXP (x, 1)) == CONST_INT
7504 && INTVAL (XEXP (x, 1)) >= 0
7505 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT)
7507 enum machine_mode inner_mode = GET_MODE (x);
7508 int width = GET_MODE_BITSIZE (inner_mode);
7509 int count = INTVAL (XEXP (x, 1));
7510 unsigned HOST_WIDE_INT mode_mask = GET_MODE_MASK (inner_mode);
7511 unsigned HOST_WIDE_INT op_nonzero = nonzero_bits (XEXP (x, 0), mode);
7512 unsigned HOST_WIDE_INT inner = op_nonzero & mode_mask;
7513 unsigned HOST_WIDE_INT outer = 0;
7515 if (mode_width > width)
7516 outer = (op_nonzero & nonzero & ~ mode_mask);
7518 if (code == LSHIFTRT)
7519 inner >>= count;
7520 else if (code == ASHIFTRT)
7522 inner >>= count;
7524 /* If the sign bit may have been nonzero before the shift, we
7525 need to mark all the places it could have been copied to
7526 by the shift as possibly nonzero. */
7527 if (inner & ((HOST_WIDE_INT) 1 << (width - 1 - count)))
7528 inner |= (((HOST_WIDE_INT) 1 << count) - 1) << (width - count);
7530 else if (code == ASHIFT)
7531 inner <<= count;
7532 else
7533 inner = ((inner << (count % width)
7534 | (inner >> (width - (count % width)))) & mode_mask);
7536 nonzero &= (outer | inner);
7538 break;
7540 case FFS:
7541 /* This is at most the number of bits in the mode. */
7542 nonzero = ((HOST_WIDE_INT) 1 << (floor_log2 (mode_width) + 1)) - 1;
7543 break;
7545 case IF_THEN_ELSE:
7546 nonzero &= (nonzero_bits (XEXP (x, 1), mode)
7547 | nonzero_bits (XEXP (x, 2), mode));
7548 break;
7551 return nonzero;
7554 /* See the macro definition above. */
7555 #undef num_sign_bit_copies
7557 /* Return the number of bits at the high-order end of X that are known to
7558 be equal to the sign bit. X will be used in mode MODE; if MODE is
7559 VOIDmode, X will be used in its own mode. The returned value will always
7560 be between 1 and the number of bits in MODE. */
7562 static int
7563 num_sign_bit_copies (x, mode)
7564 rtx x;
7565 enum machine_mode mode;
7567 enum rtx_code code = GET_CODE (x);
7568 int bitwidth;
7569 int num0, num1, result;
7570 unsigned HOST_WIDE_INT nonzero;
7571 rtx tem;
7573 /* If we weren't given a mode, use the mode of X. If the mode is still
7574 VOIDmode, we don't know anything. Likewise if one of the modes is
7575 floating-point. */
7577 if (mode == VOIDmode)
7578 mode = GET_MODE (x);
7580 if (mode == VOIDmode || FLOAT_MODE_P (mode) || FLOAT_MODE_P (GET_MODE (x)))
7581 return 1;
7583 bitwidth = GET_MODE_BITSIZE (mode);
7585 /* For a smaller object, just ignore the high bits. */
7586 if (bitwidth < GET_MODE_BITSIZE (GET_MODE (x)))
7587 return MAX (1, (num_sign_bit_copies (x, GET_MODE (x))
7588 - (GET_MODE_BITSIZE (GET_MODE (x)) - bitwidth)));
7590 #ifndef WORD_REGISTER_OPERATIONS
7591 /* If this machine does not do all register operations on the entire
7592 register and MODE is wider than the mode of X, we can say nothing
7593 at all about the high-order bits. */
7594 if (GET_MODE (x) != VOIDmode && bitwidth > GET_MODE_BITSIZE (GET_MODE (x)))
7595 return 1;
7596 #endif
7598 switch (code)
7600 case REG:
7602 #ifdef POINTERS_EXTEND_UNSIGNED
7603 /* If pointers extend signed and this is a pointer in Pmode, say that
7604 all the bits above ptr_mode are known to be sign bit copies. */
7605 if (! POINTERS_EXTEND_UNSIGNED && GET_MODE (x) == Pmode && mode == Pmode
7606 && REGNO_POINTER_FLAG (REGNO (x)))
7607 return GET_MODE_BITSIZE (Pmode) - GET_MODE_BITSIZE (ptr_mode) + 1;
7608 #endif
7610 if (reg_last_set_value[REGNO (x)] != 0
7611 && reg_last_set_mode[REGNO (x)] == mode
7612 && (REG_N_SETS (REGNO (x)) == 1
7613 || reg_last_set_label[REGNO (x)] == label_tick)
7614 && INSN_CUID (reg_last_set[REGNO (x)]) < subst_low_cuid)
7615 return reg_last_set_sign_bit_copies[REGNO (x)];
7617 tem = get_last_value (x);
7618 if (tem != 0)
7619 return num_sign_bit_copies (tem, mode);
7621 if (nonzero_sign_valid && reg_sign_bit_copies[REGNO (x)] != 0)
7622 return reg_sign_bit_copies[REGNO (x)];
7623 break;
7625 case MEM:
7626 #ifdef LOAD_EXTEND_OP
7627 /* Some RISC machines sign-extend all loads of smaller than a word. */
7628 if (LOAD_EXTEND_OP (GET_MODE (x)) == SIGN_EXTEND)
7629 return MAX (1, bitwidth - GET_MODE_BITSIZE (GET_MODE (x)) + 1);
7630 #endif
7631 break;
7633 case CONST_INT:
7634 /* If the constant is negative, take its 1's complement and remask.
7635 Then see how many zero bits we have. */
7636 nonzero = INTVAL (x) & GET_MODE_MASK (mode);
7637 if (bitwidth <= HOST_BITS_PER_WIDE_INT
7638 && (nonzero & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)
7639 nonzero = (~ nonzero) & GET_MODE_MASK (mode);
7641 return (nonzero == 0 ? bitwidth : bitwidth - floor_log2 (nonzero) - 1);
7643 case SUBREG:
7644 /* If this is a SUBREG for a promoted object that is sign-extended
7645 and we are looking at it in a wider mode, we know that at least the
7646 high-order bits are known to be sign bit copies. */
7648 if (SUBREG_PROMOTED_VAR_P (x) && ! SUBREG_PROMOTED_UNSIGNED_P (x))
7649 return MAX (bitwidth - GET_MODE_BITSIZE (GET_MODE (x)) + 1,
7650 num_sign_bit_copies (SUBREG_REG (x), mode));
7652 /* For a smaller object, just ignore the high bits. */
7653 if (bitwidth <= GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))))
7655 num0 = num_sign_bit_copies (SUBREG_REG (x), VOIDmode);
7656 return MAX (1, (num0
7657 - (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x)))
7658 - bitwidth)));
7661 #ifdef WORD_REGISTER_OPERATIONS
7662 #ifdef LOAD_EXTEND_OP
7663 /* For paradoxical SUBREGs on machines where all register operations
7664 affect the entire register, just look inside. Note that we are
7665 passing MODE to the recursive call, so the number of sign bit copies
7666 will remain relative to that mode, not the inner mode. */
7668 /* This works only if loads sign extend. Otherwise, if we get a
7669 reload for the inner part, it may be loaded from the stack, and
7670 then we lose all sign bit copies that existed before the store
7671 to the stack. */
7673 if ((GET_MODE_SIZE (GET_MODE (x))
7674 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
7675 && LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (x))) == SIGN_EXTEND)
7676 return num_sign_bit_copies (SUBREG_REG (x), mode);
7677 #endif
7678 #endif
7679 break;
7681 case SIGN_EXTRACT:
7682 if (GET_CODE (XEXP (x, 1)) == CONST_INT)
7683 return MAX (1, bitwidth - INTVAL (XEXP (x, 1)));
7684 break;
7686 case SIGN_EXTEND:
7687 return (bitwidth - GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
7688 + num_sign_bit_copies (XEXP (x, 0), VOIDmode));
7690 case TRUNCATE:
7691 /* For a smaller object, just ignore the high bits. */
7692 num0 = num_sign_bit_copies (XEXP (x, 0), VOIDmode);
7693 return MAX (1, (num0 - (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0)))
7694 - bitwidth)));
7696 case NOT:
7697 return num_sign_bit_copies (XEXP (x, 0), mode);
7699 case ROTATE: case ROTATERT:
7700 /* If we are rotating left by a number of bits less than the number
7701 of sign bit copies, we can just subtract that amount from the
7702 number. */
7703 if (GET_CODE (XEXP (x, 1)) == CONST_INT
7704 && INTVAL (XEXP (x, 1)) >= 0 && INTVAL (XEXP (x, 1)) < bitwidth)
7706 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7707 return MAX (1, num0 - (code == ROTATE ? INTVAL (XEXP (x, 1))
7708 : bitwidth - INTVAL (XEXP (x, 1))));
7710 break;
7712 case NEG:
7713 /* In general, this subtracts one sign bit copy. But if the value
7714 is known to be positive, the number of sign bit copies is the
7715 same as that of the input. Finally, if the input has just one bit
7716 that might be nonzero, all the bits are copies of the sign bit. */
7717 nonzero = nonzero_bits (XEXP (x, 0), mode);
7718 if (nonzero == 1)
7719 return bitwidth;
7721 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7722 if (num0 > 1
7723 && bitwidth <= HOST_BITS_PER_WIDE_INT
7724 && (((HOST_WIDE_INT) 1 << (bitwidth - 1)) & nonzero))
7725 num0--;
7727 return num0;
7729 case IOR: case AND: case XOR:
7730 case SMIN: case SMAX: case UMIN: case UMAX:
7731 /* Logical operations will preserve the number of sign-bit copies.
7732 MIN and MAX operations always return one of the operands. */
7733 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7734 num1 = num_sign_bit_copies (XEXP (x, 1), mode);
7735 return MIN (num0, num1);
7737 case PLUS: case MINUS:
7738 /* For addition and subtraction, we can have a 1-bit carry. However,
7739 if we are subtracting 1 from a positive number, there will not
7740 be such a carry. Furthermore, if the positive number is known to
7741 be 0 or 1, we know the result is either -1 or 0. */
7743 if (code == PLUS && XEXP (x, 1) == constm1_rtx
7744 && bitwidth <= HOST_BITS_PER_WIDE_INT)
7746 nonzero = nonzero_bits (XEXP (x, 0), mode);
7747 if ((((HOST_WIDE_INT) 1 << (bitwidth - 1)) & nonzero) == 0)
7748 return (nonzero == 1 || nonzero == 0 ? bitwidth
7749 : bitwidth - floor_log2 (nonzero) - 1);
7752 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7753 num1 = num_sign_bit_copies (XEXP (x, 1), mode);
7754 return MAX (1, MIN (num0, num1) - 1);
7756 case MULT:
7757 /* The number of bits of the product is the sum of the number of
7758 bits of both terms. However, unless one of the terms if known
7759 to be positive, we must allow for an additional bit since negating
7760 a negative number can remove one sign bit copy. */
7762 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7763 num1 = num_sign_bit_copies (XEXP (x, 1), mode);
7765 result = bitwidth - (bitwidth - num0) - (bitwidth - num1);
7766 if (result > 0
7767 && bitwidth <= HOST_BITS_PER_WIDE_INT
7768 && ((nonzero_bits (XEXP (x, 0), mode)
7769 & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)
7770 && ((nonzero_bits (XEXP (x, 1), mode)
7771 & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0))
7772 result--;
7774 return MAX (1, result);
7776 case UDIV:
7777 /* The result must be <= the first operand. */
7778 return num_sign_bit_copies (XEXP (x, 0), mode);
7780 case UMOD:
7781 /* The result must be <= the scond operand. */
7782 return num_sign_bit_copies (XEXP (x, 1), mode);
7784 case DIV:
7785 /* Similar to unsigned division, except that we have to worry about
7786 the case where the divisor is negative, in which case we have
7787 to add 1. */
7788 result = num_sign_bit_copies (XEXP (x, 0), mode);
7789 if (result > 1
7790 && bitwidth <= HOST_BITS_PER_WIDE_INT
7791 && (nonzero_bits (XEXP (x, 1), mode)
7792 & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)
7793 result --;
7795 return result;
7797 case MOD:
7798 result = num_sign_bit_copies (XEXP (x, 1), mode);
7799 if (result > 1
7800 && bitwidth <= HOST_BITS_PER_WIDE_INT
7801 && (nonzero_bits (XEXP (x, 1), mode)
7802 & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)
7803 result --;
7805 return result;
7807 case ASHIFTRT:
7808 /* Shifts by a constant add to the number of bits equal to the
7809 sign bit. */
7810 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7811 if (GET_CODE (XEXP (x, 1)) == CONST_INT
7812 && INTVAL (XEXP (x, 1)) > 0)
7813 num0 = MIN (bitwidth, num0 + INTVAL (XEXP (x, 1)));
7815 return num0;
7817 case ASHIFT:
7818 /* Left shifts destroy copies. */
7819 if (GET_CODE (XEXP (x, 1)) != CONST_INT
7820 || INTVAL (XEXP (x, 1)) < 0
7821 || INTVAL (XEXP (x, 1)) >= bitwidth)
7822 return 1;
7824 num0 = num_sign_bit_copies (XEXP (x, 0), mode);
7825 return MAX (1, num0 - INTVAL (XEXP (x, 1)));
7827 case IF_THEN_ELSE:
7828 num0 = num_sign_bit_copies (XEXP (x, 1), mode);
7829 num1 = num_sign_bit_copies (XEXP (x, 2), mode);
7830 return MIN (num0, num1);
7832 case EQ: case NE: case GE: case GT: case LE: case LT:
7833 case GEU: case GTU: case LEU: case LTU:
7834 if (STORE_FLAG_VALUE == -1)
7835 return bitwidth;
7838 /* If we haven't been able to figure it out by one of the above rules,
7839 see if some of the high-order bits are known to be zero. If so,
7840 count those bits and return one less than that amount. If we can't
7841 safely compute the mask for this mode, always return BITWIDTH. */
7843 if (bitwidth > HOST_BITS_PER_WIDE_INT)
7844 return 1;
7846 nonzero = nonzero_bits (x, mode);
7847 return (nonzero & ((HOST_WIDE_INT) 1 << (bitwidth - 1))
7848 ? 1 : bitwidth - floor_log2 (nonzero) - 1);
7851 /* Return the number of "extended" bits there are in X, when interpreted
7852 as a quantity in MODE whose signedness is indicated by UNSIGNEDP. For
7853 unsigned quantities, this is the number of high-order zero bits.
7854 For signed quantities, this is the number of copies of the sign bit
7855 minus 1. In both case, this function returns the number of "spare"
7856 bits. For example, if two quantities for which this function returns
7857 at least 1 are added, the addition is known not to overflow.
7859 This function will always return 0 unless called during combine, which
7860 implies that it must be called from a define_split. */
7863 extended_count (x, mode, unsignedp)
7864 rtx x;
7865 enum machine_mode mode;
7866 int unsignedp;
7868 if (nonzero_sign_valid == 0)
7869 return 0;
7871 return (unsignedp
7872 ? (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT
7873 && (GET_MODE_BITSIZE (mode) - 1
7874 - floor_log2 (nonzero_bits (x, mode))))
7875 : num_sign_bit_copies (x, mode) - 1);
7878 /* This function is called from `simplify_shift_const' to merge two
7879 outer operations. Specifically, we have already found that we need
7880 to perform operation *POP0 with constant *PCONST0 at the outermost
7881 position. We would now like to also perform OP1 with constant CONST1
7882 (with *POP0 being done last).
7884 Return 1 if we can do the operation and update *POP0 and *PCONST0 with
7885 the resulting operation. *PCOMP_P is set to 1 if we would need to
7886 complement the innermost operand, otherwise it is unchanged.
7888 MODE is the mode in which the operation will be done. No bits outside
7889 the width of this mode matter. It is assumed that the width of this mode
7890 is smaller than or equal to HOST_BITS_PER_WIDE_INT.
7892 If *POP0 or OP1 are NIL, it means no operation is required. Only NEG, PLUS,
7893 IOR, XOR, and AND are supported. We may set *POP0 to SET if the proper
7894 result is simply *PCONST0.
7896 If the resulting operation cannot be expressed as one operation, we
7897 return 0 and do not change *POP0, *PCONST0, and *PCOMP_P. */
7899 static int
7900 merge_outer_ops (pop0, pconst0, op1, const1, mode, pcomp_p)
7901 enum rtx_code *pop0;
7902 HOST_WIDE_INT *pconst0;
7903 enum rtx_code op1;
7904 HOST_WIDE_INT const1;
7905 enum machine_mode mode;
7906 int *pcomp_p;
7908 enum rtx_code op0 = *pop0;
7909 HOST_WIDE_INT const0 = *pconst0;
7910 int width = GET_MODE_BITSIZE (mode);
7912 const0 &= GET_MODE_MASK (mode);
7913 const1 &= GET_MODE_MASK (mode);
7915 /* If OP0 is an AND, clear unimportant bits in CONST1. */
7916 if (op0 == AND)
7917 const1 &= const0;
7919 /* If OP0 or OP1 is NIL, this is easy. Similarly if they are the same or
7920 if OP0 is SET. */
7922 if (op1 == NIL || op0 == SET)
7923 return 1;
7925 else if (op0 == NIL)
7926 op0 = op1, const0 = const1;
7928 else if (op0 == op1)
7930 switch (op0)
7932 case AND:
7933 const0 &= const1;
7934 break;
7935 case IOR:
7936 const0 |= const1;
7937 break;
7938 case XOR:
7939 const0 ^= const1;
7940 break;
7941 case PLUS:
7942 const0 += const1;
7943 break;
7944 case NEG:
7945 op0 = NIL;
7946 break;
7950 /* Otherwise, if either is a PLUS or NEG, we can't do anything. */
7951 else if (op0 == PLUS || op1 == PLUS || op0 == NEG || op1 == NEG)
7952 return 0;
7954 /* If the two constants aren't the same, we can't do anything. The
7955 remaining six cases can all be done. */
7956 else if (const0 != const1)
7957 return 0;
7959 else
7960 switch (op0)
7962 case IOR:
7963 if (op1 == AND)
7964 /* (a & b) | b == b */
7965 op0 = SET;
7966 else /* op1 == XOR */
7967 /* (a ^ b) | b == a | b */
7969 break;
7971 case XOR:
7972 if (op1 == AND)
7973 /* (a & b) ^ b == (~a) & b */
7974 op0 = AND, *pcomp_p = 1;
7975 else /* op1 == IOR */
7976 /* (a | b) ^ b == a & ~b */
7977 op0 = AND, *pconst0 = ~ const0;
7978 break;
7980 case AND:
7981 if (op1 == IOR)
7982 /* (a | b) & b == b */
7983 op0 = SET;
7984 else /* op1 == XOR */
7985 /* (a ^ b) & b) == (~a) & b */
7986 *pcomp_p = 1;
7987 break;
7990 /* Check for NO-OP cases. */
7991 const0 &= GET_MODE_MASK (mode);
7992 if (const0 == 0
7993 && (op0 == IOR || op0 == XOR || op0 == PLUS))
7994 op0 = NIL;
7995 else if (const0 == 0 && op0 == AND)
7996 op0 = SET;
7997 else if (const0 == GET_MODE_MASK (mode) && op0 == AND)
7998 op0 = NIL;
8000 /* If this would be an entire word for the target, but is not for
8001 the host, then sign-extend on the host so that the number will look
8002 the same way on the host that it would on the target.
8004 For example, when building a 64 bit alpha hosted 32 bit sparc
8005 targeted compiler, then we want the 32 bit unsigned value -1 to be
8006 represented as a 64 bit value -1, and not as 0x00000000ffffffff.
8007 The later confuses the sparc backend. */
8009 if (BITS_PER_WORD < HOST_BITS_PER_WIDE_INT && BITS_PER_WORD == width
8010 && (const0 & ((HOST_WIDE_INT) 1 << (width - 1))))
8011 const0 |= ((HOST_WIDE_INT) (-1) << width);
8013 *pop0 = op0;
8014 *pconst0 = const0;
8016 return 1;
8019 /* Simplify a shift of VAROP by COUNT bits. CODE says what kind of shift.
8020 The result of the shift is RESULT_MODE. X, if non-zero, is an expression
8021 that we started with.
8023 The shift is normally computed in the widest mode we find in VAROP, as
8024 long as it isn't a different number of words than RESULT_MODE. Exceptions
8025 are ASHIFTRT and ROTATE, which are always done in their original mode, */
8027 static rtx
8028 simplify_shift_const (x, code, result_mode, varop, count)
8029 rtx x;
8030 enum rtx_code code;
8031 enum machine_mode result_mode;
8032 rtx varop;
8033 int count;
8035 enum rtx_code orig_code = code;
8036 int orig_count = count;
8037 enum machine_mode mode = result_mode;
8038 enum machine_mode shift_mode, tmode;
8039 int mode_words
8040 = (GET_MODE_SIZE (mode) + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD;
8041 /* We form (outer_op (code varop count) (outer_const)). */
8042 enum rtx_code outer_op = NIL;
8043 HOST_WIDE_INT outer_const = 0;
8044 rtx const_rtx;
8045 int complement_p = 0;
8046 rtx new;
8048 /* If we were given an invalid count, don't do anything except exactly
8049 what was requested. */
8051 if (count < 0 || count > GET_MODE_BITSIZE (mode))
8053 if (x)
8054 return x;
8056 return gen_rtx (code, mode, varop, GEN_INT (count));
8059 /* Unless one of the branches of the `if' in this loop does a `continue',
8060 we will `break' the loop after the `if'. */
8062 while (count != 0)
8064 /* If we have an operand of (clobber (const_int 0)), just return that
8065 value. */
8066 if (GET_CODE (varop) == CLOBBER)
8067 return varop;
8069 /* If we discovered we had to complement VAROP, leave. Making a NOT
8070 here would cause an infinite loop. */
8071 if (complement_p)
8072 break;
8074 /* Convert ROTATERT to ROTATE. */
8075 if (code == ROTATERT)
8076 code = ROTATE, count = GET_MODE_BITSIZE (result_mode) - count;
8078 /* We need to determine what mode we will do the shift in. If the
8079 shift is a right shift or a ROTATE, we must always do it in the mode
8080 it was originally done in. Otherwise, we can do it in MODE, the
8081 widest mode encountered. */
8082 shift_mode
8083 = (code == ASHIFTRT || code == LSHIFTRT || code == ROTATE
8084 ? result_mode : mode);
8086 /* Handle cases where the count is greater than the size of the mode
8087 minus 1. For ASHIFT, use the size minus one as the count (this can
8088 occur when simplifying (lshiftrt (ashiftrt ..))). For rotates,
8089 take the count modulo the size. For other shifts, the result is
8090 zero.
8092 Since these shifts are being produced by the compiler by combining
8093 multiple operations, each of which are defined, we know what the
8094 result is supposed to be. */
8096 if (count > GET_MODE_BITSIZE (shift_mode) - 1)
8098 if (code == ASHIFTRT)
8099 count = GET_MODE_BITSIZE (shift_mode) - 1;
8100 else if (code == ROTATE || code == ROTATERT)
8101 count %= GET_MODE_BITSIZE (shift_mode);
8102 else
8104 /* We can't simply return zero because there may be an
8105 outer op. */
8106 varop = const0_rtx;
8107 count = 0;
8108 break;
8112 /* Negative counts are invalid and should not have been made (a
8113 programmer-specified negative count should have been handled
8114 above). */
8115 else if (count < 0)
8116 abort ();
8118 /* An arithmetic right shift of a quantity known to be -1 or 0
8119 is a no-op. */
8120 if (code == ASHIFTRT
8121 && (num_sign_bit_copies (varop, shift_mode)
8122 == GET_MODE_BITSIZE (shift_mode)))
8124 count = 0;
8125 break;
8128 /* If we are doing an arithmetic right shift and discarding all but
8129 the sign bit copies, this is equivalent to doing a shift by the
8130 bitsize minus one. Convert it into that shift because it will often
8131 allow other simplifications. */
8133 if (code == ASHIFTRT
8134 && (count + num_sign_bit_copies (varop, shift_mode)
8135 >= GET_MODE_BITSIZE (shift_mode)))
8136 count = GET_MODE_BITSIZE (shift_mode) - 1;
8138 /* We simplify the tests below and elsewhere by converting
8139 ASHIFTRT to LSHIFTRT if we know the sign bit is clear.
8140 `make_compound_operation' will convert it to a ASHIFTRT for
8141 those machines (such as Vax) that don't have a LSHIFTRT. */
8142 if (GET_MODE_BITSIZE (shift_mode) <= HOST_BITS_PER_WIDE_INT
8143 && code == ASHIFTRT
8144 && ((nonzero_bits (varop, shift_mode)
8145 & ((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (shift_mode) - 1)))
8146 == 0))
8147 code = LSHIFTRT;
8149 switch (GET_CODE (varop))
8151 case SIGN_EXTEND:
8152 case ZERO_EXTEND:
8153 case SIGN_EXTRACT:
8154 case ZERO_EXTRACT:
8155 new = expand_compound_operation (varop);
8156 if (new != varop)
8158 varop = new;
8159 continue;
8161 break;
8163 case MEM:
8164 /* If we have (xshiftrt (mem ...) C) and C is MODE_WIDTH
8165 minus the width of a smaller mode, we can do this with a
8166 SIGN_EXTEND or ZERO_EXTEND from the narrower memory location. */
8167 if ((code == ASHIFTRT || code == LSHIFTRT)
8168 && ! mode_dependent_address_p (XEXP (varop, 0))
8169 && ! MEM_VOLATILE_P (varop)
8170 && (tmode = mode_for_size (GET_MODE_BITSIZE (mode) - count,
8171 MODE_INT, 1)) != BLKmode)
8173 if (BYTES_BIG_ENDIAN)
8174 new = gen_rtx (MEM, tmode, XEXP (varop, 0));
8175 else
8176 new = gen_rtx (MEM, tmode,
8177 plus_constant (XEXP (varop, 0),
8178 count / BITS_PER_UNIT));
8179 RTX_UNCHANGING_P (new) = RTX_UNCHANGING_P (varop);
8180 MEM_VOLATILE_P (new) = MEM_VOLATILE_P (varop);
8181 MEM_IN_STRUCT_P (new) = MEM_IN_STRUCT_P (varop);
8182 varop = gen_rtx_combine (code == ASHIFTRT ? SIGN_EXTEND
8183 : ZERO_EXTEND, mode, new);
8184 count = 0;
8185 continue;
8187 break;
8189 case USE:
8190 /* Similar to the case above, except that we can only do this if
8191 the resulting mode is the same as that of the underlying
8192 MEM and adjust the address depending on the *bits* endianness
8193 because of the way that bit-field extract insns are defined. */
8194 if ((code == ASHIFTRT || code == LSHIFTRT)
8195 && (tmode = mode_for_size (GET_MODE_BITSIZE (mode) - count,
8196 MODE_INT, 1)) != BLKmode
8197 && tmode == GET_MODE (XEXP (varop, 0)))
8199 if (BITS_BIG_ENDIAN)
8200 new = XEXP (varop, 0);
8201 else
8203 new = copy_rtx (XEXP (varop, 0));
8204 SUBST (XEXP (new, 0),
8205 plus_constant (XEXP (new, 0),
8206 count / BITS_PER_UNIT));
8209 varop = gen_rtx_combine (code == ASHIFTRT ? SIGN_EXTEND
8210 : ZERO_EXTEND, mode, new);
8211 count = 0;
8212 continue;
8214 break;
8216 case SUBREG:
8217 /* If VAROP is a SUBREG, strip it as long as the inner operand has
8218 the same number of words as what we've seen so far. Then store
8219 the widest mode in MODE. */
8220 if (subreg_lowpart_p (varop)
8221 && (GET_MODE_SIZE (GET_MODE (SUBREG_REG (varop)))
8222 > GET_MODE_SIZE (GET_MODE (varop)))
8223 && (((GET_MODE_SIZE (GET_MODE (SUBREG_REG (varop)))
8224 + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD)
8225 == mode_words))
8227 varop = SUBREG_REG (varop);
8228 if (GET_MODE_SIZE (GET_MODE (varop)) > GET_MODE_SIZE (mode))
8229 mode = GET_MODE (varop);
8230 continue;
8232 break;
8234 case MULT:
8235 /* Some machines use MULT instead of ASHIFT because MULT
8236 is cheaper. But it is still better on those machines to
8237 merge two shifts into one. */
8238 if (GET_CODE (XEXP (varop, 1)) == CONST_INT
8239 && exact_log2 (INTVAL (XEXP (varop, 1))) >= 0)
8241 varop = gen_binary (ASHIFT, GET_MODE (varop), XEXP (varop, 0),
8242 GEN_INT (exact_log2 (INTVAL (XEXP (varop, 1)))));;
8243 continue;
8245 break;
8247 case UDIV:
8248 /* Similar, for when divides are cheaper. */
8249 if (GET_CODE (XEXP (varop, 1)) == CONST_INT
8250 && exact_log2 (INTVAL (XEXP (varop, 1))) >= 0)
8252 varop = gen_binary (LSHIFTRT, GET_MODE (varop), XEXP (varop, 0),
8253 GEN_INT (exact_log2 (INTVAL (XEXP (varop, 1)))));
8254 continue;
8256 break;
8258 case ASHIFTRT:
8259 /* If we are extracting just the sign bit of an arithmetic right
8260 shift, that shift is not needed. */
8261 if (code == LSHIFTRT && count == GET_MODE_BITSIZE (result_mode) - 1)
8263 varop = XEXP (varop, 0);
8264 continue;
8267 /* ... fall through ... */
8269 case LSHIFTRT:
8270 case ASHIFT:
8271 case ROTATE:
8272 /* Here we have two nested shifts. The result is usually the
8273 AND of a new shift with a mask. We compute the result below. */
8274 if (GET_CODE (XEXP (varop, 1)) == CONST_INT
8275 && INTVAL (XEXP (varop, 1)) >= 0
8276 && INTVAL (XEXP (varop, 1)) < GET_MODE_BITSIZE (GET_MODE (varop))
8277 && GET_MODE_BITSIZE (result_mode) <= HOST_BITS_PER_WIDE_INT
8278 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
8280 enum rtx_code first_code = GET_CODE (varop);
8281 int first_count = INTVAL (XEXP (varop, 1));
8282 unsigned HOST_WIDE_INT mask;
8283 rtx mask_rtx;
8285 /* We have one common special case. We can't do any merging if
8286 the inner code is an ASHIFTRT of a smaller mode. However, if
8287 we have (ashift:M1 (subreg:M1 (ashiftrt:M2 FOO C1) 0) C2)
8288 with C2 == GET_MODE_BITSIZE (M1) - GET_MODE_BITSIZE (M2),
8289 we can convert it to
8290 (ashiftrt:M1 (ashift:M1 (and:M1 (subreg:M1 FOO 0 C2) C3) C1).
8291 This simplifies certain SIGN_EXTEND operations. */
8292 if (code == ASHIFT && first_code == ASHIFTRT
8293 && (GET_MODE_BITSIZE (result_mode)
8294 - GET_MODE_BITSIZE (GET_MODE (varop))) == count)
8296 /* C3 has the low-order C1 bits zero. */
8298 mask = (GET_MODE_MASK (mode)
8299 & ~ (((HOST_WIDE_INT) 1 << first_count) - 1));
8301 varop = simplify_and_const_int (NULL_RTX, result_mode,
8302 XEXP (varop, 0), mask);
8303 varop = simplify_shift_const (NULL_RTX, ASHIFT, result_mode,
8304 varop, count);
8305 count = first_count;
8306 code = ASHIFTRT;
8307 continue;
8310 /* If this was (ashiftrt (ashift foo C1) C2) and FOO has more
8311 than C1 high-order bits equal to the sign bit, we can convert
8312 this to either an ASHIFT or a ASHIFTRT depending on the
8313 two counts.
8315 We cannot do this if VAROP's mode is not SHIFT_MODE. */
8317 if (code == ASHIFTRT && first_code == ASHIFT
8318 && GET_MODE (varop) == shift_mode
8319 && (num_sign_bit_copies (XEXP (varop, 0), shift_mode)
8320 > first_count))
8322 count -= first_count;
8323 if (count < 0)
8324 count = - count, code = ASHIFT;
8325 varop = XEXP (varop, 0);
8326 continue;
8329 /* There are some cases we can't do. If CODE is ASHIFTRT,
8330 we can only do this if FIRST_CODE is also ASHIFTRT.
8332 We can't do the case when CODE is ROTATE and FIRST_CODE is
8333 ASHIFTRT.
8335 If the mode of this shift is not the mode of the outer shift,
8336 we can't do this if either shift is a right shift or ROTATE.
8338 Finally, we can't do any of these if the mode is too wide
8339 unless the codes are the same.
8341 Handle the case where the shift codes are the same
8342 first. */
8344 if (code == first_code)
8346 if (GET_MODE (varop) != result_mode
8347 && (code == ASHIFTRT || code == LSHIFTRT
8348 || code == ROTATE))
8349 break;
8351 count += first_count;
8352 varop = XEXP (varop, 0);
8353 continue;
8356 if (code == ASHIFTRT
8357 || (code == ROTATE && first_code == ASHIFTRT)
8358 || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT
8359 || (GET_MODE (varop) != result_mode
8360 && (first_code == ASHIFTRT || first_code == LSHIFTRT
8361 || first_code == ROTATE
8362 || code == ROTATE)))
8363 break;
8365 /* To compute the mask to apply after the shift, shift the
8366 nonzero bits of the inner shift the same way the
8367 outer shift will. */
8369 mask_rtx = GEN_INT (nonzero_bits (varop, GET_MODE (varop)));
8371 mask_rtx
8372 = simplify_binary_operation (code, result_mode, mask_rtx,
8373 GEN_INT (count));
8375 /* Give up if we can't compute an outer operation to use. */
8376 if (mask_rtx == 0
8377 || GET_CODE (mask_rtx) != CONST_INT
8378 || ! merge_outer_ops (&outer_op, &outer_const, AND,
8379 INTVAL (mask_rtx),
8380 result_mode, &complement_p))
8381 break;
8383 /* If the shifts are in the same direction, we add the
8384 counts. Otherwise, we subtract them. */
8385 if ((code == ASHIFTRT || code == LSHIFTRT)
8386 == (first_code == ASHIFTRT || first_code == LSHIFTRT))
8387 count += first_count;
8388 else
8389 count -= first_count;
8391 /* If COUNT is positive, the new shift is usually CODE,
8392 except for the two exceptions below, in which case it is
8393 FIRST_CODE. If the count is negative, FIRST_CODE should
8394 always be used */
8395 if (count > 0
8396 && ((first_code == ROTATE && code == ASHIFT)
8397 || (first_code == ASHIFTRT && code == LSHIFTRT)))
8398 code = first_code;
8399 else if (count < 0)
8400 code = first_code, count = - count;
8402 varop = XEXP (varop, 0);
8403 continue;
8406 /* If we have (A << B << C) for any shift, we can convert this to
8407 (A << C << B). This wins if A is a constant. Only try this if
8408 B is not a constant. */
8410 else if (GET_CODE (varop) == code
8411 && GET_CODE (XEXP (varop, 1)) != CONST_INT
8412 && 0 != (new
8413 = simplify_binary_operation (code, mode,
8414 XEXP (varop, 0),
8415 GEN_INT (count))))
8417 varop = gen_rtx_combine (code, mode, new, XEXP (varop, 1));
8418 count = 0;
8419 continue;
8421 break;
8423 case NOT:
8424 /* Make this fit the case below. */
8425 varop = gen_rtx_combine (XOR, mode, XEXP (varop, 0),
8426 GEN_INT (GET_MODE_MASK (mode)));
8427 continue;
8429 case IOR:
8430 case AND:
8431 case XOR:
8432 /* If we have (xshiftrt (ior (plus X (const_int -1)) X) C)
8433 with C the size of VAROP - 1 and the shift is logical if
8434 STORE_FLAG_VALUE is 1 and arithmetic if STORE_FLAG_VALUE is -1,
8435 we have an (le X 0) operation. If we have an arithmetic shift
8436 and STORE_FLAG_VALUE is 1 or we have a logical shift with
8437 STORE_FLAG_VALUE of -1, we have a (neg (le X 0)) operation. */
8439 if (GET_CODE (varop) == IOR && GET_CODE (XEXP (varop, 0)) == PLUS
8440 && XEXP (XEXP (varop, 0), 1) == constm1_rtx
8441 && (STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1)
8442 && (code == LSHIFTRT || code == ASHIFTRT)
8443 && count == GET_MODE_BITSIZE (GET_MODE (varop)) - 1
8444 && rtx_equal_p (XEXP (XEXP (varop, 0), 0), XEXP (varop, 1)))
8446 count = 0;
8447 varop = gen_rtx_combine (LE, GET_MODE (varop), XEXP (varop, 1),
8448 const0_rtx);
8450 if (STORE_FLAG_VALUE == 1 ? code == ASHIFTRT : code == LSHIFTRT)
8451 varop = gen_rtx_combine (NEG, GET_MODE (varop), varop);
8453 continue;
8456 /* If we have (shift (logical)), move the logical to the outside
8457 to allow it to possibly combine with another logical and the
8458 shift to combine with another shift. This also canonicalizes to
8459 what a ZERO_EXTRACT looks like. Also, some machines have
8460 (and (shift)) insns. */
8462 if (GET_CODE (XEXP (varop, 1)) == CONST_INT
8463 && (new = simplify_binary_operation (code, result_mode,
8464 XEXP (varop, 1),
8465 GEN_INT (count))) != 0
8466 && GET_CODE(new) == CONST_INT
8467 && merge_outer_ops (&outer_op, &outer_const, GET_CODE (varop),
8468 INTVAL (new), result_mode, &complement_p))
8470 varop = XEXP (varop, 0);
8471 continue;
8474 /* If we can't do that, try to simplify the shift in each arm of the
8475 logical expression, make a new logical expression, and apply
8476 the inverse distributive law. */
8478 rtx lhs = simplify_shift_const (NULL_RTX, code, shift_mode,
8479 XEXP (varop, 0), count);
8480 rtx rhs = simplify_shift_const (NULL_RTX, code, shift_mode,
8481 XEXP (varop, 1), count);
8483 varop = gen_binary (GET_CODE (varop), shift_mode, lhs, rhs);
8484 varop = apply_distributive_law (varop);
8486 count = 0;
8488 break;
8490 case EQ:
8491 /* convert (lshiftrt (eq FOO 0) C) to (xor FOO 1) if STORE_FLAG_VALUE
8492 says that the sign bit can be tested, FOO has mode MODE, C is
8493 GET_MODE_BITSIZE (MODE) - 1, and FOO has only its low-order bit
8494 that may be nonzero. */
8495 if (code == LSHIFTRT
8496 && XEXP (varop, 1) == const0_rtx
8497 && GET_MODE (XEXP (varop, 0)) == result_mode
8498 && count == GET_MODE_BITSIZE (result_mode) - 1
8499 && GET_MODE_BITSIZE (result_mode) <= HOST_BITS_PER_WIDE_INT
8500 && ((STORE_FLAG_VALUE
8501 & ((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (result_mode) - 1))))
8502 && nonzero_bits (XEXP (varop, 0), result_mode) == 1
8503 && merge_outer_ops (&outer_op, &outer_const, XOR,
8504 (HOST_WIDE_INT) 1, result_mode,
8505 &complement_p))
8507 varop = XEXP (varop, 0);
8508 count = 0;
8509 continue;
8511 break;
8513 case NEG:
8514 /* (lshiftrt (neg A) C) where A is either 0 or 1 and C is one less
8515 than the number of bits in the mode is equivalent to A. */
8516 if (code == LSHIFTRT && count == GET_MODE_BITSIZE (result_mode) - 1
8517 && nonzero_bits (XEXP (varop, 0), result_mode) == 1)
8519 varop = XEXP (varop, 0);
8520 count = 0;
8521 continue;
8524 /* NEG commutes with ASHIFT since it is multiplication. Move the
8525 NEG outside to allow shifts to combine. */
8526 if (code == ASHIFT
8527 && merge_outer_ops (&outer_op, &outer_const, NEG,
8528 (HOST_WIDE_INT) 0, result_mode,
8529 &complement_p))
8531 varop = XEXP (varop, 0);
8532 continue;
8534 break;
8536 case PLUS:
8537 /* (lshiftrt (plus A -1) C) where A is either 0 or 1 and C
8538 is one less than the number of bits in the mode is
8539 equivalent to (xor A 1). */
8540 if (code == LSHIFTRT && count == GET_MODE_BITSIZE (result_mode) - 1
8541 && XEXP (varop, 1) == constm1_rtx
8542 && nonzero_bits (XEXP (varop, 0), result_mode) == 1
8543 && merge_outer_ops (&outer_op, &outer_const, XOR,
8544 (HOST_WIDE_INT) 1, result_mode,
8545 &complement_p))
8547 count = 0;
8548 varop = XEXP (varop, 0);
8549 continue;
8552 /* If we have (xshiftrt (plus FOO BAR) C), and the only bits
8553 that might be nonzero in BAR are those being shifted out and those
8554 bits are known zero in FOO, we can replace the PLUS with FOO.
8555 Similarly in the other operand order. This code occurs when
8556 we are computing the size of a variable-size array. */
8558 if ((code == ASHIFTRT || code == LSHIFTRT)
8559 && count < HOST_BITS_PER_WIDE_INT
8560 && nonzero_bits (XEXP (varop, 1), result_mode) >> count == 0
8561 && (nonzero_bits (XEXP (varop, 1), result_mode)
8562 & nonzero_bits (XEXP (varop, 0), result_mode)) == 0)
8564 varop = XEXP (varop, 0);
8565 continue;
8567 else if ((code == ASHIFTRT || code == LSHIFTRT)
8568 && count < HOST_BITS_PER_WIDE_INT
8569 && GET_MODE_BITSIZE (result_mode) <= HOST_BITS_PER_WIDE_INT
8570 && 0 == (nonzero_bits (XEXP (varop, 0), result_mode)
8571 >> count)
8572 && 0 == (nonzero_bits (XEXP (varop, 0), result_mode)
8573 & nonzero_bits (XEXP (varop, 1),
8574 result_mode)))
8576 varop = XEXP (varop, 1);
8577 continue;
8580 /* (ashift (plus foo C) N) is (plus (ashift foo N) C'). */
8581 if (code == ASHIFT
8582 && GET_CODE (XEXP (varop, 1)) == CONST_INT
8583 && (new = simplify_binary_operation (ASHIFT, result_mode,
8584 XEXP (varop, 1),
8585 GEN_INT (count))) != 0
8586 && GET_CODE(new) == CONST_INT
8587 && merge_outer_ops (&outer_op, &outer_const, PLUS,
8588 INTVAL (new), result_mode, &complement_p))
8590 varop = XEXP (varop, 0);
8591 continue;
8593 break;
8595 case MINUS:
8596 /* If we have (xshiftrt (minus (ashiftrt X C)) X) C)
8597 with C the size of VAROP - 1 and the shift is logical if
8598 STORE_FLAG_VALUE is 1 and arithmetic if STORE_FLAG_VALUE is -1,
8599 we have a (gt X 0) operation. If the shift is arithmetic with
8600 STORE_FLAG_VALUE of 1 or logical with STORE_FLAG_VALUE == -1,
8601 we have a (neg (gt X 0)) operation. */
8603 if ((STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1)
8604 && GET_CODE (XEXP (varop, 0)) == ASHIFTRT
8605 && count == GET_MODE_BITSIZE (GET_MODE (varop)) - 1
8606 && (code == LSHIFTRT || code == ASHIFTRT)
8607 && GET_CODE (XEXP (XEXP (varop, 0), 1)) == CONST_INT
8608 && INTVAL (XEXP (XEXP (varop, 0), 1)) == count
8609 && rtx_equal_p (XEXP (XEXP (varop, 0), 0), XEXP (varop, 1)))
8611 count = 0;
8612 varop = gen_rtx_combine (GT, GET_MODE (varop), XEXP (varop, 1),
8613 const0_rtx);
8615 if (STORE_FLAG_VALUE == 1 ? code == ASHIFTRT : code == LSHIFTRT)
8616 varop = gen_rtx_combine (NEG, GET_MODE (varop), varop);
8618 continue;
8620 break;
8623 break;
8626 /* We need to determine what mode to do the shift in. If the shift is
8627 a right shift or ROTATE, we must always do it in the mode it was
8628 originally done in. Otherwise, we can do it in MODE, the widest mode
8629 encountered. The code we care about is that of the shift that will
8630 actually be done, not the shift that was originally requested. */
8631 shift_mode
8632 = (code == ASHIFTRT || code == LSHIFTRT || code == ROTATE
8633 ? result_mode : mode);
8635 /* We have now finished analyzing the shift. The result should be
8636 a shift of type CODE with SHIFT_MODE shifting VAROP COUNT places. If
8637 OUTER_OP is non-NIL, it is an operation that needs to be applied
8638 to the result of the shift. OUTER_CONST is the relevant constant,
8639 but we must turn off all bits turned off in the shift.
8641 If we were passed a value for X, see if we can use any pieces of
8642 it. If not, make new rtx. */
8644 if (x && GET_RTX_CLASS (GET_CODE (x)) == '2'
8645 && GET_CODE (XEXP (x, 1)) == CONST_INT
8646 && INTVAL (XEXP (x, 1)) == count)
8647 const_rtx = XEXP (x, 1);
8648 else
8649 const_rtx = GEN_INT (count);
8651 if (x && GET_CODE (XEXP (x, 0)) == SUBREG
8652 && GET_MODE (XEXP (x, 0)) == shift_mode
8653 && SUBREG_REG (XEXP (x, 0)) == varop)
8654 varop = XEXP (x, 0);
8655 else if (GET_MODE (varop) != shift_mode)
8656 varop = gen_lowpart_for_combine (shift_mode, varop);
8658 /* If we can't make the SUBREG, try to return what we were given. */
8659 if (GET_CODE (varop) == CLOBBER)
8660 return x ? x : varop;
8662 new = simplify_binary_operation (code, shift_mode, varop, const_rtx);
8663 if (new != 0)
8664 x = new;
8665 else
8667 if (x == 0 || GET_CODE (x) != code || GET_MODE (x) != shift_mode)
8668 x = gen_rtx_combine (code, shift_mode, varop, const_rtx);
8670 SUBST (XEXP (x, 0), varop);
8671 SUBST (XEXP (x, 1), const_rtx);
8674 /* If we have an outer operation and we just made a shift, it is
8675 possible that we could have simplified the shift were it not
8676 for the outer operation. So try to do the simplification
8677 recursively. */
8679 if (outer_op != NIL && GET_CODE (x) == code
8680 && GET_CODE (XEXP (x, 1)) == CONST_INT)
8681 x = simplify_shift_const (x, code, shift_mode, XEXP (x, 0),
8682 INTVAL (XEXP (x, 1)));
8684 /* If we were doing a LSHIFTRT in a wider mode than it was originally,
8685 turn off all the bits that the shift would have turned off. */
8686 if (orig_code == LSHIFTRT && result_mode != shift_mode)
8687 x = simplify_and_const_int (NULL_RTX, shift_mode, x,
8688 GET_MODE_MASK (result_mode) >> orig_count);
8690 /* Do the remainder of the processing in RESULT_MODE. */
8691 x = gen_lowpart_for_combine (result_mode, x);
8693 /* If COMPLEMENT_P is set, we have to complement X before doing the outer
8694 operation. */
8695 if (complement_p)
8696 x = gen_unary (NOT, result_mode, result_mode, x);
8698 if (outer_op != NIL)
8700 if (GET_MODE_BITSIZE (result_mode) < HOST_BITS_PER_WIDE_INT)
8702 int width = GET_MODE_BITSIZE (result_mode);
8704 outer_const &= GET_MODE_MASK (result_mode);
8706 /* If this would be an entire word for the target, but is not for
8707 the host, then sign-extend on the host so that the number will
8708 look the same way on the host that it would on the target.
8710 For example, when building a 64 bit alpha hosted 32 bit sparc
8711 targeted compiler, then we want the 32 bit unsigned value -1 to be
8712 represented as a 64 bit value -1, and not as 0x00000000ffffffff.
8713 The later confuses the sparc backend. */
8715 if (BITS_PER_WORD < HOST_BITS_PER_WIDE_INT && BITS_PER_WORD == width
8716 && (outer_const & ((HOST_WIDE_INT) 1 << (width - 1))))
8717 outer_const |= ((HOST_WIDE_INT) (-1) << width);
8720 if (outer_op == AND)
8721 x = simplify_and_const_int (NULL_RTX, result_mode, x, outer_const);
8722 else if (outer_op == SET)
8723 /* This means that we have determined that the result is
8724 equivalent to a constant. This should be rare. */
8725 x = GEN_INT (outer_const);
8726 else if (GET_RTX_CLASS (outer_op) == '1')
8727 x = gen_unary (outer_op, result_mode, result_mode, x);
8728 else
8729 x = gen_binary (outer_op, result_mode, x, GEN_INT (outer_const));
8732 return x;
8735 /* Like recog, but we receive the address of a pointer to a new pattern.
8736 We try to match the rtx that the pointer points to.
8737 If that fails, we may try to modify or replace the pattern,
8738 storing the replacement into the same pointer object.
8740 Modifications include deletion or addition of CLOBBERs.
8742 PNOTES is a pointer to a location where any REG_UNUSED notes added for
8743 the CLOBBERs are placed.
8745 PADDED_SCRATCHES is set to the number of (clobber (scratch)) patterns
8746 we had to add.
8748 The value is the final insn code from the pattern ultimately matched,
8749 or -1. */
8751 static int
8752 recog_for_combine (pnewpat, insn, pnotes, padded_scratches)
8753 rtx *pnewpat;
8754 rtx insn;
8755 rtx *pnotes;
8756 int *padded_scratches;
8758 register rtx pat = *pnewpat;
8759 int insn_code_number;
8760 int num_clobbers_to_add = 0;
8761 int i;
8762 rtx notes = 0;
8764 *padded_scratches = 0;
8766 /* If PAT is a PARALLEL, check to see if it contains the CLOBBER
8767 we use to indicate that something didn't match. If we find such a
8768 thing, force rejection. */
8769 if (GET_CODE (pat) == PARALLEL)
8770 for (i = XVECLEN (pat, 0) - 1; i >= 0; i--)
8771 if (GET_CODE (XVECEXP (pat, 0, i)) == CLOBBER
8772 && XEXP (XVECEXP (pat, 0, i), 0) == const0_rtx)
8773 return -1;
8775 /* Is the result of combination a valid instruction? */
8776 insn_code_number = recog (pat, insn, &num_clobbers_to_add);
8778 /* If it isn't, there is the possibility that we previously had an insn
8779 that clobbered some register as a side effect, but the combined
8780 insn doesn't need to do that. So try once more without the clobbers
8781 unless this represents an ASM insn. */
8783 if (insn_code_number < 0 && ! check_asm_operands (pat)
8784 && GET_CODE (pat) == PARALLEL)
8786 int pos;
8788 for (pos = 0, i = 0; i < XVECLEN (pat, 0); i++)
8789 if (GET_CODE (XVECEXP (pat, 0, i)) != CLOBBER)
8791 if (i != pos)
8792 SUBST (XVECEXP (pat, 0, pos), XVECEXP (pat, 0, i));
8793 pos++;
8796 SUBST_INT (XVECLEN (pat, 0), pos);
8798 if (pos == 1)
8799 pat = XVECEXP (pat, 0, 0);
8801 insn_code_number = recog (pat, insn, &num_clobbers_to_add);
8804 /* If we had any clobbers to add, make a new pattern than contains
8805 them. Then check to make sure that all of them are dead. */
8806 if (num_clobbers_to_add)
8808 rtx newpat = gen_rtx (PARALLEL, VOIDmode,
8809 gen_rtvec (GET_CODE (pat) == PARALLEL
8810 ? XVECLEN (pat, 0) + num_clobbers_to_add
8811 : num_clobbers_to_add + 1));
8813 if (GET_CODE (pat) == PARALLEL)
8814 for (i = 0; i < XVECLEN (pat, 0); i++)
8815 XVECEXP (newpat, 0, i) = XVECEXP (pat, 0, i);
8816 else
8817 XVECEXP (newpat, 0, 0) = pat;
8819 add_clobbers (newpat, insn_code_number);
8821 for (i = XVECLEN (newpat, 0) - num_clobbers_to_add;
8822 i < XVECLEN (newpat, 0); i++)
8824 if (GET_CODE (XEXP (XVECEXP (newpat, 0, i), 0)) == REG
8825 && ! reg_dead_at_p (XEXP (XVECEXP (newpat, 0, i), 0), insn))
8826 return -1;
8827 else if (GET_CODE (XEXP (XVECEXP (newpat, 0, i), 0)) == SCRATCH)
8828 (*padded_scratches)++;
8829 notes = gen_rtx (EXPR_LIST, REG_UNUSED,
8830 XEXP (XVECEXP (newpat, 0, i), 0), notes);
8832 pat = newpat;
8835 *pnewpat = pat;
8836 *pnotes = notes;
8838 return insn_code_number;
8841 /* Like gen_lowpart but for use by combine. In combine it is not possible
8842 to create any new pseudoregs. However, it is safe to create
8843 invalid memory addresses, because combine will try to recognize
8844 them and all they will do is make the combine attempt fail.
8846 If for some reason this cannot do its job, an rtx
8847 (clobber (const_int 0)) is returned.
8848 An insn containing that will not be recognized. */
8850 #undef gen_lowpart
8852 static rtx
8853 gen_lowpart_for_combine (mode, x)
8854 enum machine_mode mode;
8855 register rtx x;
8857 rtx result;
8859 if (GET_MODE (x) == mode)
8860 return x;
8862 /* We can only support MODE being wider than a word if X is a
8863 constant integer or has a mode the same size. */
8865 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
8866 && ! ((GET_MODE (x) == VOIDmode
8867 && (GET_CODE (x) == CONST_INT
8868 || GET_CODE (x) == CONST_DOUBLE))
8869 || GET_MODE_SIZE (GET_MODE (x)) == GET_MODE_SIZE (mode)))
8870 return gen_rtx (CLOBBER, GET_MODE (x), const0_rtx);
8872 /* X might be a paradoxical (subreg (mem)). In that case, gen_lowpart
8873 won't know what to do. So we will strip off the SUBREG here and
8874 process normally. */
8875 if (GET_CODE (x) == SUBREG && GET_CODE (SUBREG_REG (x)) == MEM)
8877 x = SUBREG_REG (x);
8878 if (GET_MODE (x) == mode)
8879 return x;
8882 result = gen_lowpart_common (mode, x);
8883 if (result != 0
8884 && GET_CODE (result) == SUBREG
8885 && GET_CODE (SUBREG_REG (result)) == REG
8886 && REGNO (SUBREG_REG (result)) >= FIRST_PSEUDO_REGISTER
8887 && (GET_MODE_SIZE (GET_MODE (result))
8888 != GET_MODE_SIZE (GET_MODE (SUBREG_REG (result)))))
8889 REG_CHANGES_SIZE (REGNO (SUBREG_REG (result))) = 1;
8891 if (result)
8892 return result;
8894 if (GET_CODE (x) == MEM)
8896 register int offset = 0;
8897 rtx new;
8899 /* Refuse to work on a volatile memory ref or one with a mode-dependent
8900 address. */
8901 if (MEM_VOLATILE_P (x) || mode_dependent_address_p (XEXP (x, 0)))
8902 return gen_rtx (CLOBBER, GET_MODE (x), const0_rtx);
8904 /* If we want to refer to something bigger than the original memref,
8905 generate a perverse subreg instead. That will force a reload
8906 of the original memref X. */
8907 if (GET_MODE_SIZE (GET_MODE (x)) < GET_MODE_SIZE (mode))
8908 return gen_rtx (SUBREG, mode, x, 0);
8910 if (WORDS_BIG_ENDIAN)
8911 offset = (MAX (GET_MODE_SIZE (GET_MODE (x)), UNITS_PER_WORD)
8912 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD));
8913 if (BYTES_BIG_ENDIAN)
8915 /* Adjust the address so that the address-after-the-data is
8916 unchanged. */
8917 offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (mode))
8918 - MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (x))));
8920 new = gen_rtx (MEM, mode, plus_constant (XEXP (x, 0), offset));
8921 RTX_UNCHANGING_P (new) = RTX_UNCHANGING_P (x);
8922 MEM_VOLATILE_P (new) = MEM_VOLATILE_P (x);
8923 MEM_IN_STRUCT_P (new) = MEM_IN_STRUCT_P (x);
8924 return new;
8927 /* If X is a comparison operator, rewrite it in a new mode. This
8928 probably won't match, but may allow further simplifications. */
8929 else if (GET_RTX_CLASS (GET_CODE (x)) == '<')
8930 return gen_rtx_combine (GET_CODE (x), mode, XEXP (x, 0), XEXP (x, 1));
8932 /* If we couldn't simplify X any other way, just enclose it in a
8933 SUBREG. Normally, this SUBREG won't match, but some patterns may
8934 include an explicit SUBREG or we may simplify it further in combine. */
8935 else
8937 int word = 0;
8939 if (WORDS_BIG_ENDIAN && GET_MODE_SIZE (GET_MODE (x)) > UNITS_PER_WORD)
8940 word = ((GET_MODE_SIZE (GET_MODE (x))
8941 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD))
8942 / UNITS_PER_WORD);
8943 return gen_rtx (SUBREG, mode, x, word);
8947 /* Make an rtx expression. This is a subset of gen_rtx and only supports
8948 expressions of 1, 2, or 3 operands, each of which are rtx expressions.
8950 If the identical expression was previously in the insn (in the undobuf),
8951 it will be returned. Only if it is not found will a new expression
8952 be made. */
8954 /*VARARGS2*/
8955 static rtx
8956 gen_rtx_combine VPROTO((enum rtx_code code, enum machine_mode mode, ...))
8958 #ifndef __STDC__
8959 enum rtx_code code;
8960 enum machine_mode mode;
8961 #endif
8962 va_list p;
8963 int n_args;
8964 rtx args[3];
8965 int i, j;
8966 char *fmt;
8967 rtx rt;
8968 struct undo *undo;
8970 VA_START (p, mode);
8972 #ifndef __STDC__
8973 code = va_arg (p, enum rtx_code);
8974 mode = va_arg (p, enum machine_mode);
8975 #endif
8977 n_args = GET_RTX_LENGTH (code);
8978 fmt = GET_RTX_FORMAT (code);
8980 if (n_args == 0 || n_args > 3)
8981 abort ();
8983 /* Get each arg and verify that it is supposed to be an expression. */
8984 for (j = 0; j < n_args; j++)
8986 if (*fmt++ != 'e')
8987 abort ();
8989 args[j] = va_arg (p, rtx);
8992 /* See if this is in undobuf. Be sure we don't use objects that came
8993 from another insn; this could produce circular rtl structures. */
8995 for (undo = undobuf.undos; undo != undobuf.previous_undos; undo = undo->next)
8996 if (!undo->is_int
8997 && GET_CODE (undo->old_contents.r) == code
8998 && GET_MODE (undo->old_contents.r) == mode)
9000 for (j = 0; j < n_args; j++)
9001 if (XEXP (undo->old_contents.r, j) != args[j])
9002 break;
9004 if (j == n_args)
9005 return undo->old_contents.r;
9008 /* Otherwise make a new rtx. We know we have 1, 2, or 3 args.
9009 Use rtx_alloc instead of gen_rtx because it's faster on RISC. */
9010 rt = rtx_alloc (code);
9011 PUT_MODE (rt, mode);
9012 XEXP (rt, 0) = args[0];
9013 if (n_args > 1)
9015 XEXP (rt, 1) = args[1];
9016 if (n_args > 2)
9017 XEXP (rt, 2) = args[2];
9019 return rt;
9022 /* These routines make binary and unary operations by first seeing if they
9023 fold; if not, a new expression is allocated. */
9025 static rtx
9026 gen_binary (code, mode, op0, op1)
9027 enum rtx_code code;
9028 enum machine_mode mode;
9029 rtx op0, op1;
9031 rtx result;
9032 rtx tem;
9034 if (GET_RTX_CLASS (code) == 'c'
9035 && (GET_CODE (op0) == CONST_INT
9036 || (CONSTANT_P (op0) && GET_CODE (op1) != CONST_INT)))
9037 tem = op0, op0 = op1, op1 = tem;
9039 if (GET_RTX_CLASS (code) == '<')
9041 enum machine_mode op_mode = GET_MODE (op0);
9043 /* Strip the COMPARE from (REL_OP (compare X Y) 0) to get
9044 just (REL_OP X Y). */
9045 if (GET_CODE (op0) == COMPARE && op1 == const0_rtx)
9047 op1 = XEXP (op0, 1);
9048 op0 = XEXP (op0, 0);
9049 op_mode = GET_MODE (op0);
9052 if (op_mode == VOIDmode)
9053 op_mode = GET_MODE (op1);
9054 result = simplify_relational_operation (code, op_mode, op0, op1);
9056 else
9057 result = simplify_binary_operation (code, mode, op0, op1);
9059 if (result)
9060 return result;
9062 /* Put complex operands first and constants second. */
9063 if (GET_RTX_CLASS (code) == 'c'
9064 && ((CONSTANT_P (op0) && GET_CODE (op1) != CONST_INT)
9065 || (GET_RTX_CLASS (GET_CODE (op0)) == 'o'
9066 && GET_RTX_CLASS (GET_CODE (op1)) != 'o')
9067 || (GET_CODE (op0) == SUBREG
9068 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (op0))) == 'o'
9069 && GET_RTX_CLASS (GET_CODE (op1)) != 'o')))
9070 return gen_rtx_combine (code, mode, op1, op0);
9072 return gen_rtx_combine (code, mode, op0, op1);
9075 static rtx
9076 gen_unary (code, mode, op0_mode, op0)
9077 enum rtx_code code;
9078 enum machine_mode mode, op0_mode;
9079 rtx op0;
9081 rtx result = simplify_unary_operation (code, mode, op0, op0_mode);
9083 if (result)
9084 return result;
9086 return gen_rtx_combine (code, mode, op0);
9089 /* Simplify a comparison between *POP0 and *POP1 where CODE is the
9090 comparison code that will be tested.
9092 The result is a possibly different comparison code to use. *POP0 and
9093 *POP1 may be updated.
9095 It is possible that we might detect that a comparison is either always
9096 true or always false. However, we do not perform general constant
9097 folding in combine, so this knowledge isn't useful. Such tautologies
9098 should have been detected earlier. Hence we ignore all such cases. */
9100 static enum rtx_code
9101 simplify_comparison (code, pop0, pop1)
9102 enum rtx_code code;
9103 rtx *pop0;
9104 rtx *pop1;
9106 rtx op0 = *pop0;
9107 rtx op1 = *pop1;
9108 rtx tem, tem1;
9109 int i;
9110 enum machine_mode mode, tmode;
9112 /* Try a few ways of applying the same transformation to both operands. */
9113 while (1)
9115 #ifndef WORD_REGISTER_OPERATIONS
9116 /* The test below this one won't handle SIGN_EXTENDs on these machines,
9117 so check specially. */
9118 if (code != GTU && code != GEU && code != LTU && code != LEU
9119 && GET_CODE (op0) == ASHIFTRT && GET_CODE (op1) == ASHIFTRT
9120 && GET_CODE (XEXP (op0, 0)) == ASHIFT
9121 && GET_CODE (XEXP (op1, 0)) == ASHIFT
9122 && GET_CODE (XEXP (XEXP (op0, 0), 0)) == SUBREG
9123 && GET_CODE (XEXP (XEXP (op1, 0), 0)) == SUBREG
9124 && (GET_MODE (SUBREG_REG (XEXP (XEXP (op0, 0), 0)))
9125 == GET_MODE (SUBREG_REG (XEXP (XEXP (op1, 0), 0))))
9126 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9127 && GET_CODE (XEXP (op1, 1)) == CONST_INT
9128 && GET_CODE (XEXP (XEXP (op0, 0), 1)) == CONST_INT
9129 && GET_CODE (XEXP (XEXP (op1, 0), 1)) == CONST_INT
9130 && INTVAL (XEXP (op0, 1)) == INTVAL (XEXP (op1, 1))
9131 && INTVAL (XEXP (op0, 1)) == INTVAL (XEXP (XEXP (op0, 0), 1))
9132 && INTVAL (XEXP (op0, 1)) == INTVAL (XEXP (XEXP (op1, 0), 1))
9133 && (INTVAL (XEXP (op0, 1))
9134 == (GET_MODE_BITSIZE (GET_MODE (op0))
9135 - (GET_MODE_BITSIZE
9136 (GET_MODE (SUBREG_REG (XEXP (XEXP (op0, 0), 0))))))))
9138 op0 = SUBREG_REG (XEXP (XEXP (op0, 0), 0));
9139 op1 = SUBREG_REG (XEXP (XEXP (op1, 0), 0));
9141 #endif
9143 /* If both operands are the same constant shift, see if we can ignore the
9144 shift. We can if the shift is a rotate or if the bits shifted out of
9145 this shift are known to be zero for both inputs and if the type of
9146 comparison is compatible with the shift. */
9147 if (GET_CODE (op0) == GET_CODE (op1)
9148 && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT
9149 && ((GET_CODE (op0) == ROTATE && (code == NE || code == EQ))
9150 || ((GET_CODE (op0) == LSHIFTRT || GET_CODE (op0) == ASHIFT)
9151 && (code != GT && code != LT && code != GE && code != LE))
9152 || (GET_CODE (op0) == ASHIFTRT
9153 && (code != GTU && code != LTU
9154 && code != GEU && code != GEU)))
9155 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9156 && INTVAL (XEXP (op0, 1)) >= 0
9157 && INTVAL (XEXP (op0, 1)) < HOST_BITS_PER_WIDE_INT
9158 && XEXP (op0, 1) == XEXP (op1, 1))
9160 enum machine_mode mode = GET_MODE (op0);
9161 unsigned HOST_WIDE_INT mask = GET_MODE_MASK (mode);
9162 int shift_count = INTVAL (XEXP (op0, 1));
9164 if (GET_CODE (op0) == LSHIFTRT || GET_CODE (op0) == ASHIFTRT)
9165 mask &= (mask >> shift_count) << shift_count;
9166 else if (GET_CODE (op0) == ASHIFT)
9167 mask = (mask & (mask << shift_count)) >> shift_count;
9169 if ((nonzero_bits (XEXP (op0, 0), mode) & ~ mask) == 0
9170 && (nonzero_bits (XEXP (op1, 0), mode) & ~ mask) == 0)
9171 op0 = XEXP (op0, 0), op1 = XEXP (op1, 0);
9172 else
9173 break;
9176 /* If both operands are AND's of a paradoxical SUBREG by constant, the
9177 SUBREGs are of the same mode, and, in both cases, the AND would
9178 be redundant if the comparison was done in the narrower mode,
9179 do the comparison in the narrower mode (e.g., we are AND'ing with 1
9180 and the operand's possibly nonzero bits are 0xffffff01; in that case
9181 if we only care about QImode, we don't need the AND). This case
9182 occurs if the output mode of an scc insn is not SImode and
9183 STORE_FLAG_VALUE == 1 (e.g., the 386).
9185 Similarly, check for a case where the AND's are ZERO_EXTEND
9186 operations from some narrower mode even though a SUBREG is not
9187 present. */
9189 else if (GET_CODE (op0) == AND && GET_CODE (op1) == AND
9190 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9191 && GET_CODE (XEXP (op1, 1)) == CONST_INT)
9193 rtx inner_op0 = XEXP (op0, 0);
9194 rtx inner_op1 = XEXP (op1, 0);
9195 HOST_WIDE_INT c0 = INTVAL (XEXP (op0, 1));
9196 HOST_WIDE_INT c1 = INTVAL (XEXP (op1, 1));
9197 int changed = 0;
9199 if (GET_CODE (inner_op0) == SUBREG && GET_CODE (inner_op1) == SUBREG
9200 && (GET_MODE_SIZE (GET_MODE (inner_op0))
9201 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (inner_op0))))
9202 && (GET_MODE (SUBREG_REG (inner_op0))
9203 == GET_MODE (SUBREG_REG (inner_op1)))
9204 && (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (op0)))
9205 <= HOST_BITS_PER_WIDE_INT)
9206 && (0 == ((~c0) & nonzero_bits (SUBREG_REG (inner_op0),
9207 GET_MODE (SUBREG_REG (op0)))))
9208 && (0 == ((~c1) & nonzero_bits (SUBREG_REG (inner_op1),
9209 GET_MODE (SUBREG_REG (inner_op1))))))
9211 op0 = SUBREG_REG (inner_op0);
9212 op1 = SUBREG_REG (inner_op1);
9214 /* The resulting comparison is always unsigned since we masked
9215 off the original sign bit. */
9216 code = unsigned_condition (code);
9218 changed = 1;
9221 else if (c0 == c1)
9222 for (tmode = GET_CLASS_NARROWEST_MODE
9223 (GET_MODE_CLASS (GET_MODE (op0)));
9224 tmode != GET_MODE (op0); tmode = GET_MODE_WIDER_MODE (tmode))
9225 if (c0 == GET_MODE_MASK (tmode))
9227 op0 = gen_lowpart_for_combine (tmode, inner_op0);
9228 op1 = gen_lowpart_for_combine (tmode, inner_op1);
9229 code = unsigned_condition (code);
9230 changed = 1;
9231 break;
9234 if (! changed)
9235 break;
9238 /* If both operands are NOT, we can strip off the outer operation
9239 and adjust the comparison code for swapped operands; similarly for
9240 NEG, except that this must be an equality comparison. */
9241 else if ((GET_CODE (op0) == NOT && GET_CODE (op1) == NOT)
9242 || (GET_CODE (op0) == NEG && GET_CODE (op1) == NEG
9243 && (code == EQ || code == NE)))
9244 op0 = XEXP (op0, 0), op1 = XEXP (op1, 0), code = swap_condition (code);
9246 else
9247 break;
9250 /* If the first operand is a constant, swap the operands and adjust the
9251 comparison code appropriately, but don't do this if the second operand
9252 is already a constant integer. */
9253 if (CONSTANT_P (op0) && GET_CODE (op1) != CONST_INT)
9255 tem = op0, op0 = op1, op1 = tem;
9256 code = swap_condition (code);
9259 /* We now enter a loop during which we will try to simplify the comparison.
9260 For the most part, we only are concerned with comparisons with zero,
9261 but some things may really be comparisons with zero but not start
9262 out looking that way. */
9264 while (GET_CODE (op1) == CONST_INT)
9266 enum machine_mode mode = GET_MODE (op0);
9267 int mode_width = GET_MODE_BITSIZE (mode);
9268 unsigned HOST_WIDE_INT mask = GET_MODE_MASK (mode);
9269 int equality_comparison_p;
9270 int sign_bit_comparison_p;
9271 int unsigned_comparison_p;
9272 HOST_WIDE_INT const_op;
9274 /* We only want to handle integral modes. This catches VOIDmode,
9275 CCmode, and the floating-point modes. An exception is that we
9276 can handle VOIDmode if OP0 is a COMPARE or a comparison
9277 operation. */
9279 if (GET_MODE_CLASS (mode) != MODE_INT
9280 && ! (mode == VOIDmode
9281 && (GET_CODE (op0) == COMPARE
9282 || GET_RTX_CLASS (GET_CODE (op0)) == '<')))
9283 break;
9285 /* Get the constant we are comparing against and turn off all bits
9286 not on in our mode. */
9287 const_op = INTVAL (op1);
9288 if (mode_width <= HOST_BITS_PER_WIDE_INT)
9289 const_op &= mask;
9291 /* If we are comparing against a constant power of two and the value
9292 being compared can only have that single bit nonzero (e.g., it was
9293 `and'ed with that bit), we can replace this with a comparison
9294 with zero. */
9295 if (const_op
9296 && (code == EQ || code == NE || code == GE || code == GEU
9297 || code == LT || code == LTU)
9298 && mode_width <= HOST_BITS_PER_WIDE_INT
9299 && exact_log2 (const_op) >= 0
9300 && nonzero_bits (op0, mode) == const_op)
9302 code = (code == EQ || code == GE || code == GEU ? NE : EQ);
9303 op1 = const0_rtx, const_op = 0;
9306 /* Similarly, if we are comparing a value known to be either -1 or
9307 0 with -1, change it to the opposite comparison against zero. */
9309 if (const_op == -1
9310 && (code == EQ || code == NE || code == GT || code == LE
9311 || code == GEU || code == LTU)
9312 && num_sign_bit_copies (op0, mode) == mode_width)
9314 code = (code == EQ || code == LE || code == GEU ? NE : EQ);
9315 op1 = const0_rtx, const_op = 0;
9318 /* Do some canonicalizations based on the comparison code. We prefer
9319 comparisons against zero and then prefer equality comparisons.
9320 If we can reduce the size of a constant, we will do that too. */
9322 switch (code)
9324 case LT:
9325 /* < C is equivalent to <= (C - 1) */
9326 if (const_op > 0)
9328 const_op -= 1;
9329 op1 = GEN_INT (const_op);
9330 code = LE;
9331 /* ... fall through to LE case below. */
9333 else
9334 break;
9336 case LE:
9337 /* <= C is equivalent to < (C + 1); we do this for C < 0 */
9338 if (const_op < 0)
9340 const_op += 1;
9341 op1 = GEN_INT (const_op);
9342 code = LT;
9345 /* If we are doing a <= 0 comparison on a value known to have
9346 a zero sign bit, we can replace this with == 0. */
9347 else if (const_op == 0
9348 && mode_width <= HOST_BITS_PER_WIDE_INT
9349 && (nonzero_bits (op0, mode)
9350 & ((HOST_WIDE_INT) 1 << (mode_width - 1))) == 0)
9351 code = EQ;
9352 break;
9354 case GE:
9355 /* >= C is equivalent to > (C - 1). */
9356 if (const_op > 0)
9358 const_op -= 1;
9359 op1 = GEN_INT (const_op);
9360 code = GT;
9361 /* ... fall through to GT below. */
9363 else
9364 break;
9366 case GT:
9367 /* > C is equivalent to >= (C + 1); we do this for C < 0*/
9368 if (const_op < 0)
9370 const_op += 1;
9371 op1 = GEN_INT (const_op);
9372 code = GE;
9375 /* If we are doing a > 0 comparison on a value known to have
9376 a zero sign bit, we can replace this with != 0. */
9377 else if (const_op == 0
9378 && mode_width <= HOST_BITS_PER_WIDE_INT
9379 && (nonzero_bits (op0, mode)
9380 & ((HOST_WIDE_INT) 1 << (mode_width - 1))) == 0)
9381 code = NE;
9382 break;
9384 case LTU:
9385 /* < C is equivalent to <= (C - 1). */
9386 if (const_op > 0)
9388 const_op -= 1;
9389 op1 = GEN_INT (const_op);
9390 code = LEU;
9391 /* ... fall through ... */
9394 /* (unsigned) < 0x80000000 is equivalent to >= 0. */
9395 else if ((mode_width <= HOST_BITS_PER_WIDE_INT)
9396 && (const_op == (HOST_WIDE_INT) 1 << (mode_width - 1)))
9398 const_op = 0, op1 = const0_rtx;
9399 code = GE;
9400 break;
9402 else
9403 break;
9405 case LEU:
9406 /* unsigned <= 0 is equivalent to == 0 */
9407 if (const_op == 0)
9408 code = EQ;
9410 /* (unsigned) <= 0x7fffffff is equivalent to >= 0. */
9411 else if ((mode_width <= HOST_BITS_PER_WIDE_INT)
9412 && (const_op == ((HOST_WIDE_INT) 1 << (mode_width - 1)) - 1))
9414 const_op = 0, op1 = const0_rtx;
9415 code = GE;
9417 break;
9419 case GEU:
9420 /* >= C is equivalent to < (C - 1). */
9421 if (const_op > 1)
9423 const_op -= 1;
9424 op1 = GEN_INT (const_op);
9425 code = GTU;
9426 /* ... fall through ... */
9429 /* (unsigned) >= 0x80000000 is equivalent to < 0. */
9430 else if ((mode_width <= HOST_BITS_PER_WIDE_INT)
9431 && (const_op == (HOST_WIDE_INT) 1 << (mode_width - 1)))
9433 const_op = 0, op1 = const0_rtx;
9434 code = LT;
9435 break;
9437 else
9438 break;
9440 case GTU:
9441 /* unsigned > 0 is equivalent to != 0 */
9442 if (const_op == 0)
9443 code = NE;
9445 /* (unsigned) > 0x7fffffff is equivalent to < 0. */
9446 else if ((mode_width <= HOST_BITS_PER_WIDE_INT)
9447 && (const_op == ((HOST_WIDE_INT) 1 << (mode_width - 1)) - 1))
9449 const_op = 0, op1 = const0_rtx;
9450 code = LT;
9452 break;
9455 /* Compute some predicates to simplify code below. */
9457 equality_comparison_p = (code == EQ || code == NE);
9458 sign_bit_comparison_p = ((code == LT || code == GE) && const_op == 0);
9459 unsigned_comparison_p = (code == LTU || code == LEU || code == GTU
9460 || code == LEU);
9462 /* If this is a sign bit comparison and we can do arithmetic in
9463 MODE, say that we will only be needing the sign bit of OP0. */
9464 if (sign_bit_comparison_p
9465 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
9466 op0 = force_to_mode (op0, mode,
9467 ((HOST_WIDE_INT) 1
9468 << (GET_MODE_BITSIZE (mode) - 1)),
9469 NULL_RTX, 0);
9471 /* Now try cases based on the opcode of OP0. If none of the cases
9472 does a "continue", we exit this loop immediately after the
9473 switch. */
9475 switch (GET_CODE (op0))
9477 case ZERO_EXTRACT:
9478 /* If we are extracting a single bit from a variable position in
9479 a constant that has only a single bit set and are comparing it
9480 with zero, we can convert this into an equality comparison
9481 between the position and the location of the single bit. */
9483 if (GET_CODE (XEXP (op0, 0)) == CONST_INT
9484 && XEXP (op0, 1) == const1_rtx
9485 && equality_comparison_p && const_op == 0
9486 && (i = exact_log2 (INTVAL (XEXP (op0, 0)))) >= 0)
9488 if (BITS_BIG_ENDIAN)
9489 #ifdef HAVE_extzv
9490 i = (GET_MODE_BITSIZE
9491 (insn_operand_mode[(int) CODE_FOR_extzv][1]) - 1 - i);
9492 #else
9493 i = BITS_PER_WORD - 1 - i;
9494 #endif
9496 op0 = XEXP (op0, 2);
9497 op1 = GEN_INT (i);
9498 const_op = i;
9500 /* Result is nonzero iff shift count is equal to I. */
9501 code = reverse_condition (code);
9502 continue;
9505 /* ... fall through ... */
9507 case SIGN_EXTRACT:
9508 tem = expand_compound_operation (op0);
9509 if (tem != op0)
9511 op0 = tem;
9512 continue;
9514 break;
9516 case NOT:
9517 /* If testing for equality, we can take the NOT of the constant. */
9518 if (equality_comparison_p
9519 && (tem = simplify_unary_operation (NOT, mode, op1, mode)) != 0)
9521 op0 = XEXP (op0, 0);
9522 op1 = tem;
9523 continue;
9526 /* If just looking at the sign bit, reverse the sense of the
9527 comparison. */
9528 if (sign_bit_comparison_p)
9530 op0 = XEXP (op0, 0);
9531 code = (code == GE ? LT : GE);
9532 continue;
9534 break;
9536 case NEG:
9537 /* If testing for equality, we can take the NEG of the constant. */
9538 if (equality_comparison_p
9539 && (tem = simplify_unary_operation (NEG, mode, op1, mode)) != 0)
9541 op0 = XEXP (op0, 0);
9542 op1 = tem;
9543 continue;
9546 /* The remaining cases only apply to comparisons with zero. */
9547 if (const_op != 0)
9548 break;
9550 /* When X is ABS or is known positive,
9551 (neg X) is < 0 if and only if X != 0. */
9553 if (sign_bit_comparison_p
9554 && (GET_CODE (XEXP (op0, 0)) == ABS
9555 || (mode_width <= HOST_BITS_PER_WIDE_INT
9556 && (nonzero_bits (XEXP (op0, 0), mode)
9557 & ((HOST_WIDE_INT) 1 << (mode_width - 1))) == 0)))
9559 op0 = XEXP (op0, 0);
9560 code = (code == LT ? NE : EQ);
9561 continue;
9564 /* If we have NEG of something whose two high-order bits are the
9565 same, we know that "(-a) < 0" is equivalent to "a > 0". */
9566 if (num_sign_bit_copies (op0, mode) >= 2)
9568 op0 = XEXP (op0, 0);
9569 code = swap_condition (code);
9570 continue;
9572 break;
9574 case ROTATE:
9575 /* If we are testing equality and our count is a constant, we
9576 can perform the inverse operation on our RHS. */
9577 if (equality_comparison_p && GET_CODE (XEXP (op0, 1)) == CONST_INT
9578 && (tem = simplify_binary_operation (ROTATERT, mode,
9579 op1, XEXP (op0, 1))) != 0)
9581 op0 = XEXP (op0, 0);
9582 op1 = tem;
9583 continue;
9586 /* If we are doing a < 0 or >= 0 comparison, it means we are testing
9587 a particular bit. Convert it to an AND of a constant of that
9588 bit. This will be converted into a ZERO_EXTRACT. */
9589 if (const_op == 0 && sign_bit_comparison_p
9590 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9591 && mode_width <= HOST_BITS_PER_WIDE_INT)
9593 op0 = simplify_and_const_int (NULL_RTX, mode, XEXP (op0, 0),
9594 ((HOST_WIDE_INT) 1
9595 << (mode_width - 1
9596 - INTVAL (XEXP (op0, 1)))));
9597 code = (code == LT ? NE : EQ);
9598 continue;
9601 /* ... fall through ... */
9603 case ABS:
9604 /* ABS is ignorable inside an equality comparison with zero. */
9605 if (const_op == 0 && equality_comparison_p)
9607 op0 = XEXP (op0, 0);
9608 continue;
9610 break;
9613 case SIGN_EXTEND:
9614 /* Can simplify (compare (zero/sign_extend FOO) CONST)
9615 to (compare FOO CONST) if CONST fits in FOO's mode and we
9616 are either testing inequality or have an unsigned comparison
9617 with ZERO_EXTEND or a signed comparison with SIGN_EXTEND. */
9618 if (! unsigned_comparison_p
9619 && (GET_MODE_BITSIZE (GET_MODE (XEXP (op0, 0)))
9620 <= HOST_BITS_PER_WIDE_INT)
9621 && ((unsigned HOST_WIDE_INT) const_op
9622 < (((HOST_WIDE_INT) 1
9623 << (GET_MODE_BITSIZE (GET_MODE (XEXP (op0, 0))) - 1)))))
9625 op0 = XEXP (op0, 0);
9626 continue;
9628 break;
9630 case SUBREG:
9631 /* Check for the case where we are comparing A - C1 with C2,
9632 both constants are smaller than 1/2 the maximum positive
9633 value in MODE, and the comparison is equality or unsigned.
9634 In that case, if A is either zero-extended to MODE or has
9635 sufficient sign bits so that the high-order bit in MODE
9636 is a copy of the sign in the inner mode, we can prove that it is
9637 safe to do the operation in the wider mode. This simplifies
9638 many range checks. */
9640 if (mode_width <= HOST_BITS_PER_WIDE_INT
9641 && subreg_lowpart_p (op0)
9642 && GET_CODE (SUBREG_REG (op0)) == PLUS
9643 && GET_CODE (XEXP (SUBREG_REG (op0), 1)) == CONST_INT
9644 && INTVAL (XEXP (SUBREG_REG (op0), 1)) < 0
9645 && (- INTVAL (XEXP (SUBREG_REG (op0), 1))
9646 < GET_MODE_MASK (mode) / 2)
9647 && (unsigned HOST_WIDE_INT) const_op < GET_MODE_MASK (mode) / 2
9648 && (0 == (nonzero_bits (XEXP (SUBREG_REG (op0), 0),
9649 GET_MODE (SUBREG_REG (op0)))
9650 & ~ GET_MODE_MASK (mode))
9651 || (num_sign_bit_copies (XEXP (SUBREG_REG (op0), 0),
9652 GET_MODE (SUBREG_REG (op0)))
9653 > (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (op0)))
9654 - GET_MODE_BITSIZE (mode)))))
9656 op0 = SUBREG_REG (op0);
9657 continue;
9660 /* If the inner mode is narrower and we are extracting the low part,
9661 we can treat the SUBREG as if it were a ZERO_EXTEND. */
9662 if (subreg_lowpart_p (op0)
9663 && GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (op0))) < mode_width)
9664 /* Fall through */ ;
9665 else
9666 break;
9668 /* ... fall through ... */
9670 case ZERO_EXTEND:
9671 if ((unsigned_comparison_p || equality_comparison_p)
9672 && (GET_MODE_BITSIZE (GET_MODE (XEXP (op0, 0)))
9673 <= HOST_BITS_PER_WIDE_INT)
9674 && ((unsigned HOST_WIDE_INT) const_op
9675 < GET_MODE_MASK (GET_MODE (XEXP (op0, 0)))))
9677 op0 = XEXP (op0, 0);
9678 continue;
9680 break;
9682 case PLUS:
9683 /* (eq (plus X A) B) -> (eq X (minus B A)). We can only do
9684 this for equality comparisons due to pathological cases involving
9685 overflows. */
9686 if (equality_comparison_p
9687 && 0 != (tem = simplify_binary_operation (MINUS, mode,
9688 op1, XEXP (op0, 1))))
9690 op0 = XEXP (op0, 0);
9691 op1 = tem;
9692 continue;
9695 /* (plus (abs X) (const_int -1)) is < 0 if and only if X == 0. */
9696 if (const_op == 0 && XEXP (op0, 1) == constm1_rtx
9697 && GET_CODE (XEXP (op0, 0)) == ABS && sign_bit_comparison_p)
9699 op0 = XEXP (XEXP (op0, 0), 0);
9700 code = (code == LT ? EQ : NE);
9701 continue;
9703 break;
9705 case MINUS:
9706 /* (eq (minus A B) C) -> (eq A (plus B C)) or
9707 (eq B (minus A C)), whichever simplifies. We can only do
9708 this for equality comparisons due to pathological cases involving
9709 overflows. */
9710 if (equality_comparison_p
9711 && 0 != (tem = simplify_binary_operation (PLUS, mode,
9712 XEXP (op0, 1), op1)))
9714 op0 = XEXP (op0, 0);
9715 op1 = tem;
9716 continue;
9719 if (equality_comparison_p
9720 && 0 != (tem = simplify_binary_operation (MINUS, mode,
9721 XEXP (op0, 0), op1)))
9723 op0 = XEXP (op0, 1);
9724 op1 = tem;
9725 continue;
9728 /* The sign bit of (minus (ashiftrt X C) X), where C is the number
9729 of bits in X minus 1, is one iff X > 0. */
9730 if (sign_bit_comparison_p && GET_CODE (XEXP (op0, 0)) == ASHIFTRT
9731 && GET_CODE (XEXP (XEXP (op0, 0), 1)) == CONST_INT
9732 && INTVAL (XEXP (XEXP (op0, 0), 1)) == mode_width - 1
9733 && rtx_equal_p (XEXP (XEXP (op0, 0), 0), XEXP (op0, 1)))
9735 op0 = XEXP (op0, 1);
9736 code = (code == GE ? LE : GT);
9737 continue;
9739 break;
9741 case XOR:
9742 /* (eq (xor A B) C) -> (eq A (xor B C)). This is a simplification
9743 if C is zero or B is a constant. */
9744 if (equality_comparison_p
9745 && 0 != (tem = simplify_binary_operation (XOR, mode,
9746 XEXP (op0, 1), op1)))
9748 op0 = XEXP (op0, 0);
9749 op1 = tem;
9750 continue;
9752 break;
9754 case EQ: case NE:
9755 case LT: case LTU: case LE: case LEU:
9756 case GT: case GTU: case GE: case GEU:
9757 /* We can't do anything if OP0 is a condition code value, rather
9758 than an actual data value. */
9759 if (const_op != 0
9760 #ifdef HAVE_cc0
9761 || XEXP (op0, 0) == cc0_rtx
9762 #endif
9763 || GET_MODE_CLASS (GET_MODE (XEXP (op0, 0))) == MODE_CC)
9764 break;
9766 /* Get the two operands being compared. */
9767 if (GET_CODE (XEXP (op0, 0)) == COMPARE)
9768 tem = XEXP (XEXP (op0, 0), 0), tem1 = XEXP (XEXP (op0, 0), 1);
9769 else
9770 tem = XEXP (op0, 0), tem1 = XEXP (op0, 1);
9772 /* Check for the cases where we simply want the result of the
9773 earlier test or the opposite of that result. */
9774 if (code == NE
9775 || (code == EQ && reversible_comparison_p (op0))
9776 || (GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT
9777 && GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT
9778 && (STORE_FLAG_VALUE
9779 & (((HOST_WIDE_INT) 1
9780 << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
9781 && (code == LT
9782 || (code == GE && reversible_comparison_p (op0)))))
9784 code = (code == LT || code == NE
9785 ? GET_CODE (op0) : reverse_condition (GET_CODE (op0)));
9786 op0 = tem, op1 = tem1;
9787 continue;
9789 break;
9791 case IOR:
9792 /* The sign bit of (ior (plus X (const_int -1)) X) is non-zero
9793 iff X <= 0. */
9794 if (sign_bit_comparison_p && GET_CODE (XEXP (op0, 0)) == PLUS
9795 && XEXP (XEXP (op0, 0), 1) == constm1_rtx
9796 && rtx_equal_p (XEXP (XEXP (op0, 0), 0), XEXP (op0, 1)))
9798 op0 = XEXP (op0, 1);
9799 code = (code == GE ? GT : LE);
9800 continue;
9802 break;
9804 case AND:
9805 /* Convert (and (xshift 1 X) Y) to (and (lshiftrt Y X) 1). This
9806 will be converted to a ZERO_EXTRACT later. */
9807 if (const_op == 0 && equality_comparison_p
9808 && GET_CODE (XEXP (op0, 0)) == ASHIFT
9809 && XEXP (XEXP (op0, 0), 0) == const1_rtx)
9811 op0 = simplify_and_const_int
9812 (op0, mode, gen_rtx_combine (LSHIFTRT, mode,
9813 XEXP (op0, 1),
9814 XEXP (XEXP (op0, 0), 1)),
9815 (HOST_WIDE_INT) 1);
9816 continue;
9819 /* If we are comparing (and (lshiftrt X C1) C2) for equality with
9820 zero and X is a comparison and C1 and C2 describe only bits set
9821 in STORE_FLAG_VALUE, we can compare with X. */
9822 if (const_op == 0 && equality_comparison_p
9823 && mode_width <= HOST_BITS_PER_WIDE_INT
9824 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9825 && GET_CODE (XEXP (op0, 0)) == LSHIFTRT
9826 && GET_CODE (XEXP (XEXP (op0, 0), 1)) == CONST_INT
9827 && INTVAL (XEXP (XEXP (op0, 0), 1)) >= 0
9828 && INTVAL (XEXP (XEXP (op0, 0), 1)) < HOST_BITS_PER_WIDE_INT)
9830 mask = ((INTVAL (XEXP (op0, 1)) & GET_MODE_MASK (mode))
9831 << INTVAL (XEXP (XEXP (op0, 0), 1)));
9832 if ((~ STORE_FLAG_VALUE & mask) == 0
9833 && (GET_RTX_CLASS (GET_CODE (XEXP (XEXP (op0, 0), 0))) == '<'
9834 || ((tem = get_last_value (XEXP (XEXP (op0, 0), 0))) != 0
9835 && GET_RTX_CLASS (GET_CODE (tem)) == '<')))
9837 op0 = XEXP (XEXP (op0, 0), 0);
9838 continue;
9842 /* If we are doing an equality comparison of an AND of a bit equal
9843 to the sign bit, replace this with a LT or GE comparison of
9844 the underlying value. */
9845 if (equality_comparison_p
9846 && const_op == 0
9847 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9848 && mode_width <= HOST_BITS_PER_WIDE_INT
9849 && ((INTVAL (XEXP (op0, 1)) & GET_MODE_MASK (mode))
9850 == (HOST_WIDE_INT) 1 << (mode_width - 1)))
9852 op0 = XEXP (op0, 0);
9853 code = (code == EQ ? GE : LT);
9854 continue;
9857 /* If this AND operation is really a ZERO_EXTEND from a narrower
9858 mode, the constant fits within that mode, and this is either an
9859 equality or unsigned comparison, try to do this comparison in
9860 the narrower mode. */
9861 if ((equality_comparison_p || unsigned_comparison_p)
9862 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9863 && (i = exact_log2 ((INTVAL (XEXP (op0, 1))
9864 & GET_MODE_MASK (mode))
9865 + 1)) >= 0
9866 && const_op >> i == 0
9867 && (tmode = mode_for_size (i, MODE_INT, 1)) != BLKmode)
9869 op0 = gen_lowpart_for_combine (tmode, XEXP (op0, 0));
9870 continue;
9872 break;
9874 case ASHIFT:
9875 /* If we have (compare (ashift FOO N) (const_int C)) and
9876 the high order N bits of FOO (N+1 if an inequality comparison)
9877 are known to be zero, we can do this by comparing FOO with C
9878 shifted right N bits so long as the low-order N bits of C are
9879 zero. */
9880 if (GET_CODE (XEXP (op0, 1)) == CONST_INT
9881 && INTVAL (XEXP (op0, 1)) >= 0
9882 && ((INTVAL (XEXP (op0, 1)) + ! equality_comparison_p)
9883 < HOST_BITS_PER_WIDE_INT)
9884 && ((const_op
9885 & (((HOST_WIDE_INT) 1 << INTVAL (XEXP (op0, 1))) - 1)) == 0)
9886 && mode_width <= HOST_BITS_PER_WIDE_INT
9887 && (nonzero_bits (XEXP (op0, 0), mode)
9888 & ~ (mask >> (INTVAL (XEXP (op0, 1))
9889 + ! equality_comparison_p))) == 0)
9891 const_op >>= INTVAL (XEXP (op0, 1));
9892 op1 = GEN_INT (const_op);
9893 op0 = XEXP (op0, 0);
9894 continue;
9897 /* If we are doing a sign bit comparison, it means we are testing
9898 a particular bit. Convert it to the appropriate AND. */
9899 if (sign_bit_comparison_p && GET_CODE (XEXP (op0, 1)) == CONST_INT
9900 && mode_width <= HOST_BITS_PER_WIDE_INT)
9902 op0 = simplify_and_const_int (NULL_RTX, mode, XEXP (op0, 0),
9903 ((HOST_WIDE_INT) 1
9904 << (mode_width - 1
9905 - INTVAL (XEXP (op0, 1)))));
9906 code = (code == LT ? NE : EQ);
9907 continue;
9910 /* If this an equality comparison with zero and we are shifting
9911 the low bit to the sign bit, we can convert this to an AND of the
9912 low-order bit. */
9913 if (const_op == 0 && equality_comparison_p
9914 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9915 && INTVAL (XEXP (op0, 1)) == mode_width - 1)
9917 op0 = simplify_and_const_int (NULL_RTX, mode, XEXP (op0, 0),
9918 (HOST_WIDE_INT) 1);
9919 continue;
9921 break;
9923 case ASHIFTRT:
9924 /* If this is an equality comparison with zero, we can do this
9925 as a logical shift, which might be much simpler. */
9926 if (equality_comparison_p && const_op == 0
9927 && GET_CODE (XEXP (op0, 1)) == CONST_INT)
9929 op0 = simplify_shift_const (NULL_RTX, LSHIFTRT, mode,
9930 XEXP (op0, 0),
9931 INTVAL (XEXP (op0, 1)));
9932 continue;
9935 /* If OP0 is a sign extension and CODE is not an unsigned comparison,
9936 do the comparison in a narrower mode. */
9937 if (! unsigned_comparison_p
9938 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9939 && GET_CODE (XEXP (op0, 0)) == ASHIFT
9940 && XEXP (op0, 1) == XEXP (XEXP (op0, 0), 1)
9941 && (tmode = mode_for_size (mode_width - INTVAL (XEXP (op0, 1)),
9942 MODE_INT, 1)) != BLKmode
9943 && ((unsigned HOST_WIDE_INT) const_op <= GET_MODE_MASK (tmode)
9944 || ((unsigned HOST_WIDE_INT) - const_op
9945 <= GET_MODE_MASK (tmode))))
9947 op0 = gen_lowpart_for_combine (tmode, XEXP (XEXP (op0, 0), 0));
9948 continue;
9951 /* ... fall through ... */
9952 case LSHIFTRT:
9953 /* If we have (compare (xshiftrt FOO N) (const_int C)) and
9954 the low order N bits of FOO are known to be zero, we can do this
9955 by comparing FOO with C shifted left N bits so long as no
9956 overflow occurs. */
9957 if (GET_CODE (XEXP (op0, 1)) == CONST_INT
9958 && INTVAL (XEXP (op0, 1)) >= 0
9959 && INTVAL (XEXP (op0, 1)) < HOST_BITS_PER_WIDE_INT
9960 && mode_width <= HOST_BITS_PER_WIDE_INT
9961 && (nonzero_bits (XEXP (op0, 0), mode)
9962 & (((HOST_WIDE_INT) 1 << INTVAL (XEXP (op0, 1))) - 1)) == 0
9963 && (const_op == 0
9964 || (floor_log2 (const_op) + INTVAL (XEXP (op0, 1))
9965 < mode_width)))
9967 const_op <<= INTVAL (XEXP (op0, 1));
9968 op1 = GEN_INT (const_op);
9969 op0 = XEXP (op0, 0);
9970 continue;
9973 /* If we are using this shift to extract just the sign bit, we
9974 can replace this with an LT or GE comparison. */
9975 if (const_op == 0
9976 && (equality_comparison_p || sign_bit_comparison_p)
9977 && GET_CODE (XEXP (op0, 1)) == CONST_INT
9978 && INTVAL (XEXP (op0, 1)) == mode_width - 1)
9980 op0 = XEXP (op0, 0);
9981 code = (code == NE || code == GT ? LT : GE);
9982 continue;
9984 break;
9987 break;
9990 /* Now make any compound operations involved in this comparison. Then,
9991 check for an outmost SUBREG on OP0 that isn't doing anything or is
9992 paradoxical. The latter case can only occur when it is known that the
9993 "extra" bits will be zero. Therefore, it is safe to remove the SUBREG.
9994 We can never remove a SUBREG for a non-equality comparison because the
9995 sign bit is in a different place in the underlying object. */
9997 op0 = make_compound_operation (op0, op1 == const0_rtx ? COMPARE : SET);
9998 op1 = make_compound_operation (op1, SET);
10000 if (GET_CODE (op0) == SUBREG && subreg_lowpart_p (op0)
10001 && GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT
10002 && (code == NE || code == EQ)
10003 && ((GET_MODE_SIZE (GET_MODE (op0))
10004 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0))))))
10006 op0 = SUBREG_REG (op0);
10007 op1 = gen_lowpart_for_combine (GET_MODE (op0), op1);
10010 else if (GET_CODE (op0) == SUBREG && subreg_lowpart_p (op0)
10011 && GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT
10012 && (code == NE || code == EQ)
10013 && (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (op0)))
10014 <= HOST_BITS_PER_WIDE_INT)
10015 && (nonzero_bits (SUBREG_REG (op0), GET_MODE (SUBREG_REG (op0)))
10016 & ~ GET_MODE_MASK (GET_MODE (op0))) == 0
10017 && (tem = gen_lowpart_for_combine (GET_MODE (SUBREG_REG (op0)),
10018 op1),
10019 (nonzero_bits (tem, GET_MODE (SUBREG_REG (op0)))
10020 & ~ GET_MODE_MASK (GET_MODE (op0))) == 0))
10021 op0 = SUBREG_REG (op0), op1 = tem;
10023 /* We now do the opposite procedure: Some machines don't have compare
10024 insns in all modes. If OP0's mode is an integer mode smaller than a
10025 word and we can't do a compare in that mode, see if there is a larger
10026 mode for which we can do the compare. There are a number of cases in
10027 which we can use the wider mode. */
10029 mode = GET_MODE (op0);
10030 if (mode != VOIDmode && GET_MODE_CLASS (mode) == MODE_INT
10031 && GET_MODE_SIZE (mode) < UNITS_PER_WORD
10032 && cmp_optab->handlers[(int) mode].insn_code == CODE_FOR_nothing)
10033 for (tmode = GET_MODE_WIDER_MODE (mode);
10034 (tmode != VOIDmode
10035 && GET_MODE_BITSIZE (tmode) <= HOST_BITS_PER_WIDE_INT);
10036 tmode = GET_MODE_WIDER_MODE (tmode))
10037 if (cmp_optab->handlers[(int) tmode].insn_code != CODE_FOR_nothing)
10039 /* If the only nonzero bits in OP0 and OP1 are those in the
10040 narrower mode and this is an equality or unsigned comparison,
10041 we can use the wider mode. Similarly for sign-extended
10042 values, in which case it is true for all comparisons. */
10043 if (((code == EQ || code == NE
10044 || code == GEU || code == GTU || code == LEU || code == LTU)
10045 && (nonzero_bits (op0, tmode) & ~ GET_MODE_MASK (mode)) == 0
10046 && (nonzero_bits (op1, tmode) & ~ GET_MODE_MASK (mode)) == 0)
10047 || ((num_sign_bit_copies (op0, tmode)
10048 > GET_MODE_BITSIZE (tmode) - GET_MODE_BITSIZE (mode))
10049 && (num_sign_bit_copies (op1, tmode)
10050 > GET_MODE_BITSIZE (tmode) - GET_MODE_BITSIZE (mode))))
10052 op0 = gen_lowpart_for_combine (tmode, op0);
10053 op1 = gen_lowpart_for_combine (tmode, op1);
10054 break;
10057 /* If this is a test for negative, we can make an explicit
10058 test of the sign bit. */
10060 if (op1 == const0_rtx && (code == LT || code == GE)
10061 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
10063 op0 = gen_binary (AND, tmode,
10064 gen_lowpart_for_combine (tmode, op0),
10065 GEN_INT ((HOST_WIDE_INT) 1
10066 << (GET_MODE_BITSIZE (mode) - 1)));
10067 code = (code == LT) ? NE : EQ;
10068 break;
10072 #ifdef CANONICALIZE_COMPARISON
10073 /* If this machine only supports a subset of valid comparisons, see if we
10074 can convert an unsupported one into a supported one. */
10075 CANONICALIZE_COMPARISON (code, op0, op1);
10076 #endif
10078 *pop0 = op0;
10079 *pop1 = op1;
10081 return code;
10084 /* Return 1 if we know that X, a comparison operation, is not operating
10085 on a floating-point value or is EQ or NE, meaning that we can safely
10086 reverse it. */
10088 static int
10089 reversible_comparison_p (x)
10090 rtx x;
10092 if (TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
10093 || flag_fast_math
10094 || GET_CODE (x) == NE || GET_CODE (x) == EQ)
10095 return 1;
10097 switch (GET_MODE_CLASS (GET_MODE (XEXP (x, 0))))
10099 case MODE_INT:
10100 case MODE_PARTIAL_INT:
10101 case MODE_COMPLEX_INT:
10102 return 1;
10104 case MODE_CC:
10105 /* If the mode of the condition codes tells us that this is safe,
10106 we need look no further. */
10107 if (REVERSIBLE_CC_MODE (GET_MODE (XEXP (x, 0))))
10108 return 1;
10110 /* Otherwise try and find where the condition codes were last set and
10111 use that. */
10112 x = get_last_value (XEXP (x, 0));
10113 return (x && GET_CODE (x) == COMPARE
10114 && ! FLOAT_MODE_P (GET_MODE (XEXP (x, 0))));
10117 return 0;
10120 /* Utility function for following routine. Called when X is part of a value
10121 being stored into reg_last_set_value. Sets reg_last_set_table_tick
10122 for each register mentioned. Similar to mention_regs in cse.c */
10124 static void
10125 update_table_tick (x)
10126 rtx x;
10128 register enum rtx_code code = GET_CODE (x);
10129 register char *fmt = GET_RTX_FORMAT (code);
10130 register int i;
10132 if (code == REG)
10134 int regno = REGNO (x);
10135 int endregno = regno + (regno < FIRST_PSEUDO_REGISTER
10136 ? HARD_REGNO_NREGS (regno, GET_MODE (x)) : 1);
10138 for (i = regno; i < endregno; i++)
10139 reg_last_set_table_tick[i] = label_tick;
10141 return;
10144 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
10145 /* Note that we can't have an "E" in values stored; see
10146 get_last_value_validate. */
10147 if (fmt[i] == 'e')
10148 update_table_tick (XEXP (x, i));
10151 /* Record that REG is set to VALUE in insn INSN. If VALUE is zero, we
10152 are saying that the register is clobbered and we no longer know its
10153 value. If INSN is zero, don't update reg_last_set; this is only permitted
10154 with VALUE also zero and is used to invalidate the register. */
10156 static void
10157 record_value_for_reg (reg, insn, value)
10158 rtx reg;
10159 rtx insn;
10160 rtx value;
10162 int regno = REGNO (reg);
10163 int endregno = regno + (regno < FIRST_PSEUDO_REGISTER
10164 ? HARD_REGNO_NREGS (regno, GET_MODE (reg)) : 1);
10165 int i;
10167 /* If VALUE contains REG and we have a previous value for REG, substitute
10168 the previous value. */
10169 if (value && insn && reg_overlap_mentioned_p (reg, value))
10171 rtx tem;
10173 /* Set things up so get_last_value is allowed to see anything set up to
10174 our insn. */
10175 subst_low_cuid = INSN_CUID (insn);
10176 tem = get_last_value (reg);
10178 if (tem)
10179 value = replace_rtx (copy_rtx (value), reg, tem);
10182 /* For each register modified, show we don't know its value, that
10183 we don't know about its bitwise content, that its value has been
10184 updated, and that we don't know the location of the death of the
10185 register. */
10186 for (i = regno; i < endregno; i ++)
10188 if (insn)
10189 reg_last_set[i] = insn;
10190 reg_last_set_value[i] = 0;
10191 reg_last_set_mode[i] = 0;
10192 reg_last_set_nonzero_bits[i] = 0;
10193 reg_last_set_sign_bit_copies[i] = 0;
10194 reg_last_death[i] = 0;
10197 /* Mark registers that are being referenced in this value. */
10198 if (value)
10199 update_table_tick (value);
10201 /* Now update the status of each register being set.
10202 If someone is using this register in this block, set this register
10203 to invalid since we will get confused between the two lives in this
10204 basic block. This makes using this register always invalid. In cse, we
10205 scan the table to invalidate all entries using this register, but this
10206 is too much work for us. */
10208 for (i = regno; i < endregno; i++)
10210 reg_last_set_label[i] = label_tick;
10211 if (value && reg_last_set_table_tick[i] == label_tick)
10212 reg_last_set_invalid[i] = 1;
10213 else
10214 reg_last_set_invalid[i] = 0;
10217 /* The value being assigned might refer to X (like in "x++;"). In that
10218 case, we must replace it with (clobber (const_int 0)) to prevent
10219 infinite loops. */
10220 if (value && ! get_last_value_validate (&value, insn,
10221 reg_last_set_label[regno], 0))
10223 value = copy_rtx (value);
10224 if (! get_last_value_validate (&value, insn,
10225 reg_last_set_label[regno], 1))
10226 value = 0;
10229 /* For the main register being modified, update the value, the mode, the
10230 nonzero bits, and the number of sign bit copies. */
10232 reg_last_set_value[regno] = value;
10234 if (value)
10236 subst_low_cuid = INSN_CUID (insn);
10237 reg_last_set_mode[regno] = GET_MODE (reg);
10238 reg_last_set_nonzero_bits[regno] = nonzero_bits (value, GET_MODE (reg));
10239 reg_last_set_sign_bit_copies[regno]
10240 = num_sign_bit_copies (value, GET_MODE (reg));
10244 /* Used for communication between the following two routines. */
10245 static rtx record_dead_insn;
10247 /* Called via note_stores from record_dead_and_set_regs to handle one
10248 SET or CLOBBER in an insn. */
10250 static void
10251 record_dead_and_set_regs_1 (dest, setter)
10252 rtx dest, setter;
10254 if (GET_CODE (dest) == SUBREG)
10255 dest = SUBREG_REG (dest);
10257 if (GET_CODE (dest) == REG)
10259 /* If we are setting the whole register, we know its value. Otherwise
10260 show that we don't know the value. We can handle SUBREG in
10261 some cases. */
10262 if (GET_CODE (setter) == SET && dest == SET_DEST (setter))
10263 record_value_for_reg (dest, record_dead_insn, SET_SRC (setter));
10264 else if (GET_CODE (setter) == SET
10265 && GET_CODE (SET_DEST (setter)) == SUBREG
10266 && SUBREG_REG (SET_DEST (setter)) == dest
10267 && GET_MODE_BITSIZE (GET_MODE (dest)) <= BITS_PER_WORD
10268 && subreg_lowpart_p (SET_DEST (setter)))
10269 record_value_for_reg (dest, record_dead_insn,
10270 gen_lowpart_for_combine (GET_MODE (dest),
10271 SET_SRC (setter)));
10272 else
10273 record_value_for_reg (dest, record_dead_insn, NULL_RTX);
10275 else if (GET_CODE (dest) == MEM
10276 /* Ignore pushes, they clobber nothing. */
10277 && ! push_operand (dest, GET_MODE (dest)))
10278 mem_last_set = INSN_CUID (record_dead_insn);
10281 /* Update the records of when each REG was most recently set or killed
10282 for the things done by INSN. This is the last thing done in processing
10283 INSN in the combiner loop.
10285 We update reg_last_set, reg_last_set_value, reg_last_set_mode,
10286 reg_last_set_nonzero_bits, reg_last_set_sign_bit_copies, reg_last_death,
10287 and also the similar information mem_last_set (which insn most recently
10288 modified memory) and last_call_cuid (which insn was the most recent
10289 subroutine call). */
10291 static void
10292 record_dead_and_set_regs (insn)
10293 rtx insn;
10295 register rtx link;
10296 int i;
10298 for (link = REG_NOTES (insn); link; link = XEXP (link, 1))
10300 if (REG_NOTE_KIND (link) == REG_DEAD
10301 && GET_CODE (XEXP (link, 0)) == REG)
10303 int regno = REGNO (XEXP (link, 0));
10304 int endregno
10305 = regno + (regno < FIRST_PSEUDO_REGISTER
10306 ? HARD_REGNO_NREGS (regno, GET_MODE (XEXP (link, 0)))
10307 : 1);
10309 for (i = regno; i < endregno; i++)
10310 reg_last_death[i] = insn;
10312 else if (REG_NOTE_KIND (link) == REG_INC)
10313 record_value_for_reg (XEXP (link, 0), insn, NULL_RTX);
10316 if (GET_CODE (insn) == CALL_INSN)
10318 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
10319 if (call_used_regs[i])
10321 reg_last_set_value[i] = 0;
10322 reg_last_set_mode[i] = 0;
10323 reg_last_set_nonzero_bits[i] = 0;
10324 reg_last_set_sign_bit_copies[i] = 0;
10325 reg_last_death[i] = 0;
10328 last_call_cuid = mem_last_set = INSN_CUID (insn);
10331 record_dead_insn = insn;
10332 note_stores (PATTERN (insn), record_dead_and_set_regs_1);
10335 /* Utility routine for the following function. Verify that all the registers
10336 mentioned in *LOC are valid when *LOC was part of a value set when
10337 label_tick == TICK. Return 0 if some are not.
10339 If REPLACE is non-zero, replace the invalid reference with
10340 (clobber (const_int 0)) and return 1. This replacement is useful because
10341 we often can get useful information about the form of a value (e.g., if
10342 it was produced by a shift that always produces -1 or 0) even though
10343 we don't know exactly what registers it was produced from. */
10345 static int
10346 get_last_value_validate (loc, insn, tick, replace)
10347 rtx *loc;
10348 rtx insn;
10349 int tick;
10350 int replace;
10352 rtx x = *loc;
10353 char *fmt = GET_RTX_FORMAT (GET_CODE (x));
10354 int len = GET_RTX_LENGTH (GET_CODE (x));
10355 int i;
10357 if (GET_CODE (x) == REG)
10359 int regno = REGNO (x);
10360 int endregno = regno + (regno < FIRST_PSEUDO_REGISTER
10361 ? HARD_REGNO_NREGS (regno, GET_MODE (x)) : 1);
10362 int j;
10364 for (j = regno; j < endregno; j++)
10365 if (reg_last_set_invalid[j]
10366 /* If this is a pseudo-register that was only set once, it is
10367 always valid. */
10368 || (! (regno >= FIRST_PSEUDO_REGISTER && REG_N_SETS (regno) == 1)
10369 && reg_last_set_label[j] > tick))
10371 if (replace)
10372 *loc = gen_rtx (CLOBBER, GET_MODE (x), const0_rtx);
10373 return replace;
10376 return 1;
10378 /* If this is a memory reference, make sure that there were
10379 no stores after it that might have clobbered the value. We don't
10380 have alias info, so we assume any store invalidates it. */
10381 else if (GET_CODE (x) == MEM && ! RTX_UNCHANGING_P (x)
10382 && INSN_CUID (insn) <= mem_last_set)
10384 if (replace)
10385 *loc = gen_rtx (CLOBBER, GET_MODE (x), const0_rtx);
10386 return replace;
10389 for (i = 0; i < len; i++)
10390 if ((fmt[i] == 'e'
10391 && get_last_value_validate (&XEXP (x, i), insn, tick, replace) == 0)
10392 /* Don't bother with these. They shouldn't occur anyway. */
10393 || fmt[i] == 'E')
10394 return 0;
10396 /* If we haven't found a reason for it to be invalid, it is valid. */
10397 return 1;
10400 /* Get the last value assigned to X, if known. Some registers
10401 in the value may be replaced with (clobber (const_int 0)) if their value
10402 is known longer known reliably. */
10404 static rtx
10405 get_last_value (x)
10406 rtx x;
10408 int regno;
10409 rtx value;
10411 /* If this is a non-paradoxical SUBREG, get the value of its operand and
10412 then convert it to the desired mode. If this is a paradoxical SUBREG,
10413 we cannot predict what values the "extra" bits might have. */
10414 if (GET_CODE (x) == SUBREG
10415 && subreg_lowpart_p (x)
10416 && (GET_MODE_SIZE (GET_MODE (x))
10417 <= GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
10418 && (value = get_last_value (SUBREG_REG (x))) != 0)
10419 return gen_lowpart_for_combine (GET_MODE (x), value);
10421 if (GET_CODE (x) != REG)
10422 return 0;
10424 regno = REGNO (x);
10425 value = reg_last_set_value[regno];
10427 /* If we don't have a value or if it isn't for this basic block,
10428 return 0. */
10430 if (value == 0
10431 || (REG_N_SETS (regno) != 1
10432 && reg_last_set_label[regno] != label_tick))
10433 return 0;
10435 /* If the value was set in a later insn than the ones we are processing,
10436 we can't use it even if the register was only set once, but make a quick
10437 check to see if the previous insn set it to something. This is commonly
10438 the case when the same pseudo is used by repeated insns.
10440 This does not work if there exists an instruction which is temporarily
10441 not on the insn chain. */
10443 if (INSN_CUID (reg_last_set[regno]) >= subst_low_cuid)
10445 rtx insn, set;
10447 /* We can not do anything useful in this case, because there is
10448 an instruction which is not on the insn chain. */
10449 if (subst_prev_insn)
10450 return 0;
10452 /* Skip over USE insns. They are not useful here, and they may have
10453 been made by combine, in which case they do not have a INSN_CUID
10454 value. We can't use prev_real_insn, because that would incorrectly
10455 take us backwards across labels. Skip over BARRIERs also, since
10456 they could have been made by combine. If we see one, we must be
10457 optimizing dead code, so it doesn't matter what we do. */
10458 for (insn = prev_nonnote_insn (subst_insn);
10459 insn && ((GET_CODE (insn) == INSN
10460 && GET_CODE (PATTERN (insn)) == USE)
10461 || GET_CODE (insn) == BARRIER
10462 || INSN_CUID (insn) >= subst_low_cuid);
10463 insn = prev_nonnote_insn (insn))
10466 if (insn
10467 && (set = single_set (insn)) != 0
10468 && rtx_equal_p (SET_DEST (set), x))
10470 value = SET_SRC (set);
10472 /* Make sure that VALUE doesn't reference X. Replace any
10473 explicit references with a CLOBBER. If there are any remaining
10474 references (rare), don't use the value. */
10476 if (reg_mentioned_p (x, value))
10477 value = replace_rtx (copy_rtx (value), x,
10478 gen_rtx (CLOBBER, GET_MODE (x), const0_rtx));
10480 if (reg_overlap_mentioned_p (x, value))
10481 return 0;
10483 else
10484 return 0;
10487 /* If the value has all its registers valid, return it. */
10488 if (get_last_value_validate (&value, reg_last_set[regno],
10489 reg_last_set_label[regno], 0))
10490 return value;
10492 /* Otherwise, make a copy and replace any invalid register with
10493 (clobber (const_int 0)). If that fails for some reason, return 0. */
10495 value = copy_rtx (value);
10496 if (get_last_value_validate (&value, reg_last_set[regno],
10497 reg_last_set_label[regno], 1))
10498 return value;
10500 return 0;
10503 /* Return nonzero if expression X refers to a REG or to memory
10504 that is set in an instruction more recent than FROM_CUID. */
10506 static int
10507 use_crosses_set_p (x, from_cuid)
10508 register rtx x;
10509 int from_cuid;
10511 register char *fmt;
10512 register int i;
10513 register enum rtx_code code = GET_CODE (x);
10515 if (code == REG)
10517 register int regno = REGNO (x);
10518 int endreg = regno + (regno < FIRST_PSEUDO_REGISTER
10519 ? HARD_REGNO_NREGS (regno, GET_MODE (x)) : 1);
10521 #ifdef PUSH_ROUNDING
10522 /* Don't allow uses of the stack pointer to be moved,
10523 because we don't know whether the move crosses a push insn. */
10524 if (regno == STACK_POINTER_REGNUM)
10525 return 1;
10526 #endif
10527 for (;regno < endreg; regno++)
10528 if (reg_last_set[regno]
10529 && INSN_CUID (reg_last_set[regno]) > from_cuid)
10530 return 1;
10531 return 0;
10534 if (code == MEM && mem_last_set > from_cuid)
10535 return 1;
10537 fmt = GET_RTX_FORMAT (code);
10539 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
10541 if (fmt[i] == 'E')
10543 register int j;
10544 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10545 if (use_crosses_set_p (XVECEXP (x, i, j), from_cuid))
10546 return 1;
10548 else if (fmt[i] == 'e'
10549 && use_crosses_set_p (XEXP (x, i), from_cuid))
10550 return 1;
10552 return 0;
10555 /* Define three variables used for communication between the following
10556 routines. */
10558 static int reg_dead_regno, reg_dead_endregno;
10559 static int reg_dead_flag;
10561 /* Function called via note_stores from reg_dead_at_p.
10563 If DEST is within [reg_dead_regno, reg_dead_endregno), set
10564 reg_dead_flag to 1 if X is a CLOBBER and to -1 it is a SET. */
10566 static void
10567 reg_dead_at_p_1 (dest, x)
10568 rtx dest;
10569 rtx x;
10571 int regno, endregno;
10573 if (GET_CODE (dest) != REG)
10574 return;
10576 regno = REGNO (dest);
10577 endregno = regno + (regno < FIRST_PSEUDO_REGISTER
10578 ? HARD_REGNO_NREGS (regno, GET_MODE (dest)) : 1);
10580 if (reg_dead_endregno > regno && reg_dead_regno < endregno)
10581 reg_dead_flag = (GET_CODE (x) == CLOBBER) ? 1 : -1;
10584 /* Return non-zero if REG is known to be dead at INSN.
10586 We scan backwards from INSN. If we hit a REG_DEAD note or a CLOBBER
10587 referencing REG, it is dead. If we hit a SET referencing REG, it is
10588 live. Otherwise, see if it is live or dead at the start of the basic
10589 block we are in. Hard regs marked as being live in NEWPAT_USED_REGS
10590 must be assumed to be always live. */
10592 static int
10593 reg_dead_at_p (reg, insn)
10594 rtx reg;
10595 rtx insn;
10597 int block, i;
10599 /* Set variables for reg_dead_at_p_1. */
10600 reg_dead_regno = REGNO (reg);
10601 reg_dead_endregno = reg_dead_regno + (reg_dead_regno < FIRST_PSEUDO_REGISTER
10602 ? HARD_REGNO_NREGS (reg_dead_regno,
10603 GET_MODE (reg))
10604 : 1);
10606 reg_dead_flag = 0;
10608 /* Check that reg isn't mentioned in NEWPAT_USED_REGS. */
10609 if (reg_dead_regno < FIRST_PSEUDO_REGISTER)
10611 for (i = reg_dead_regno; i < reg_dead_endregno; i++)
10612 if (TEST_HARD_REG_BIT (newpat_used_regs, i))
10613 return 0;
10616 /* Scan backwards until we find a REG_DEAD note, SET, CLOBBER, label, or
10617 beginning of function. */
10618 for (; insn && GET_CODE (insn) != CODE_LABEL && GET_CODE (insn) != BARRIER;
10619 insn = prev_nonnote_insn (insn))
10621 note_stores (PATTERN (insn), reg_dead_at_p_1);
10622 if (reg_dead_flag)
10623 return reg_dead_flag == 1 ? 1 : 0;
10625 if (find_regno_note (insn, REG_DEAD, reg_dead_regno))
10626 return 1;
10629 /* Get the basic block number that we were in. */
10630 if (insn == 0)
10631 block = 0;
10632 else
10634 for (block = 0; block < n_basic_blocks; block++)
10635 if (insn == basic_block_head[block])
10636 break;
10638 if (block == n_basic_blocks)
10639 return 0;
10642 for (i = reg_dead_regno; i < reg_dead_endregno; i++)
10643 if (REGNO_REG_SET_P (basic_block_live_at_start[block], i))
10644 return 0;
10646 return 1;
10649 /* Note hard registers in X that are used. This code is similar to
10650 that in flow.c, but much simpler since we don't care about pseudos. */
10652 static void
10653 mark_used_regs_combine (x)
10654 rtx x;
10656 register RTX_CODE code = GET_CODE (x);
10657 register int regno;
10658 int i;
10660 switch (code)
10662 case LABEL_REF:
10663 case SYMBOL_REF:
10664 case CONST_INT:
10665 case CONST:
10666 case CONST_DOUBLE:
10667 case PC:
10668 case ADDR_VEC:
10669 case ADDR_DIFF_VEC:
10670 case ASM_INPUT:
10671 #ifdef HAVE_cc0
10672 /* CC0 must die in the insn after it is set, so we don't need to take
10673 special note of it here. */
10674 case CC0:
10675 #endif
10676 return;
10678 case CLOBBER:
10679 /* If we are clobbering a MEM, mark any hard registers inside the
10680 address as used. */
10681 if (GET_CODE (XEXP (x, 0)) == MEM)
10682 mark_used_regs_combine (XEXP (XEXP (x, 0), 0));
10683 return;
10685 case REG:
10686 regno = REGNO (x);
10687 /* A hard reg in a wide mode may really be multiple registers.
10688 If so, mark all of them just like the first. */
10689 if (regno < FIRST_PSEUDO_REGISTER)
10691 /* None of this applies to the stack, frame or arg pointers */
10692 if (regno == STACK_POINTER_REGNUM
10693 #if FRAME_POINTER_REGNUM != HARD_FRAME_POINTER_REGNUM
10694 || regno == HARD_FRAME_POINTER_REGNUM
10695 #endif
10696 #if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
10697 || (regno == ARG_POINTER_REGNUM && fixed_regs[regno])
10698 #endif
10699 || regno == FRAME_POINTER_REGNUM)
10700 return;
10702 i = HARD_REGNO_NREGS (regno, GET_MODE (x));
10703 while (i-- > 0)
10704 SET_HARD_REG_BIT (newpat_used_regs, regno + i);
10706 return;
10708 case SET:
10710 /* If setting a MEM, or a SUBREG of a MEM, then note any hard regs in
10711 the address. */
10712 register rtx testreg = SET_DEST (x);
10714 while (GET_CODE (testreg) == SUBREG
10715 || GET_CODE (testreg) == ZERO_EXTRACT
10716 || GET_CODE (testreg) == SIGN_EXTRACT
10717 || GET_CODE (testreg) == STRICT_LOW_PART)
10718 testreg = XEXP (testreg, 0);
10720 if (GET_CODE (testreg) == MEM)
10721 mark_used_regs_combine (XEXP (testreg, 0));
10723 mark_used_regs_combine (SET_SRC (x));
10724 return;
10728 /* Recursively scan the operands of this expression. */
10731 register char *fmt = GET_RTX_FORMAT (code);
10733 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
10735 if (fmt[i] == 'e')
10736 mark_used_regs_combine (XEXP (x, i));
10737 else if (fmt[i] == 'E')
10739 register int j;
10741 for (j = 0; j < XVECLEN (x, i); j++)
10742 mark_used_regs_combine (XVECEXP (x, i, j));
10749 /* Remove register number REGNO from the dead registers list of INSN.
10751 Return the note used to record the death, if there was one. */
10754 remove_death (regno, insn)
10755 int regno;
10756 rtx insn;
10758 register rtx note = find_regno_note (insn, REG_DEAD, regno);
10760 if (note)
10762 REG_N_DEATHS (regno)--;
10763 remove_note (insn, note);
10766 return note;
10769 /* For each register (hardware or pseudo) used within expression X, if its
10770 death is in an instruction with cuid between FROM_CUID (inclusive) and
10771 TO_INSN (exclusive), put a REG_DEAD note for that register in the
10772 list headed by PNOTES.
10774 That said, don't move registers killed by maybe_kill_insn.
10776 This is done when X is being merged by combination into TO_INSN. These
10777 notes will then be distributed as needed. */
10779 static void
10780 move_deaths (x, maybe_kill_insn, from_cuid, to_insn, pnotes)
10781 rtx x;
10782 rtx maybe_kill_insn;
10783 int from_cuid;
10784 rtx to_insn;
10785 rtx *pnotes;
10787 register char *fmt;
10788 register int len, i;
10789 register enum rtx_code code = GET_CODE (x);
10791 if (code == REG)
10793 register int regno = REGNO (x);
10794 register rtx where_dead = reg_last_death[regno];
10795 register rtx before_dead, after_dead;
10797 /* Don't move the register if it gets killed in between from and to */
10798 if (maybe_kill_insn && reg_set_p (x, maybe_kill_insn)
10799 && !reg_referenced_p (x, maybe_kill_insn))
10800 return;
10802 /* WHERE_DEAD could be a USE insn made by combine, so first we
10803 make sure that we have insns with valid INSN_CUID values. */
10804 before_dead = where_dead;
10805 while (before_dead && INSN_UID (before_dead) > max_uid_cuid)
10806 before_dead = PREV_INSN (before_dead);
10807 after_dead = where_dead;
10808 while (after_dead && INSN_UID (after_dead) > max_uid_cuid)
10809 after_dead = NEXT_INSN (after_dead);
10811 if (before_dead && after_dead
10812 && INSN_CUID (before_dead) >= from_cuid
10813 && (INSN_CUID (after_dead) < INSN_CUID (to_insn)
10814 || (where_dead != after_dead
10815 && INSN_CUID (after_dead) == INSN_CUID (to_insn))))
10817 rtx note = remove_death (regno, where_dead);
10819 /* It is possible for the call above to return 0. This can occur
10820 when reg_last_death points to I2 or I1 that we combined with.
10821 In that case make a new note.
10823 We must also check for the case where X is a hard register
10824 and NOTE is a death note for a range of hard registers
10825 including X. In that case, we must put REG_DEAD notes for
10826 the remaining registers in place of NOTE. */
10828 if (note != 0 && regno < FIRST_PSEUDO_REGISTER
10829 && (GET_MODE_SIZE (GET_MODE (XEXP (note, 0)))
10830 > GET_MODE_SIZE (GET_MODE (x))))
10832 int deadregno = REGNO (XEXP (note, 0));
10833 int deadend
10834 = (deadregno + HARD_REGNO_NREGS (deadregno,
10835 GET_MODE (XEXP (note, 0))));
10836 int ourend = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
10837 int i;
10839 for (i = deadregno; i < deadend; i++)
10840 if (i < regno || i >= ourend)
10841 REG_NOTES (where_dead)
10842 = gen_rtx (EXPR_LIST, REG_DEAD,
10843 gen_rtx (REG, reg_raw_mode[i], i),
10844 REG_NOTES (where_dead));
10846 /* If we didn't find any note, or if we found a REG_DEAD note that
10847 covers only part of the given reg, and we have a multi-reg hard
10848 register, then to be safe we must check for REG_DEAD notes
10849 for each register other than the first. They could have
10850 their own REG_DEAD notes lying around. */
10851 else if ((note == 0
10852 || (note != 0
10853 && (GET_MODE_SIZE (GET_MODE (XEXP (note, 0)))
10854 < GET_MODE_SIZE (GET_MODE (x)))))
10855 && regno < FIRST_PSEUDO_REGISTER
10856 && HARD_REGNO_NREGS (regno, GET_MODE (x)) > 1)
10858 int ourend = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
10859 int i, offset;
10860 rtx oldnotes = 0;
10862 if (note)
10863 offset = HARD_REGNO_NREGS (regno, GET_MODE (XEXP (note, 0)));
10864 else
10865 offset = 1;
10867 for (i = regno + offset; i < ourend; i++)
10868 move_deaths (gen_rtx (REG, reg_raw_mode[i], i),
10869 maybe_kill_insn, from_cuid, to_insn, &oldnotes);
10872 if (note != 0 && GET_MODE (XEXP (note, 0)) == GET_MODE (x))
10874 XEXP (note, 1) = *pnotes;
10875 *pnotes = note;
10877 else
10878 *pnotes = gen_rtx (EXPR_LIST, REG_DEAD, x, *pnotes);
10880 REG_N_DEATHS (regno)++;
10883 return;
10886 else if (GET_CODE (x) == SET)
10888 rtx dest = SET_DEST (x);
10890 move_deaths (SET_SRC (x), maybe_kill_insn, from_cuid, to_insn, pnotes);
10892 /* In the case of a ZERO_EXTRACT, a STRICT_LOW_PART, or a SUBREG
10893 that accesses one word of a multi-word item, some
10894 piece of everything register in the expression is used by
10895 this insn, so remove any old death. */
10897 if (GET_CODE (dest) == ZERO_EXTRACT
10898 || GET_CODE (dest) == STRICT_LOW_PART
10899 || (GET_CODE (dest) == SUBREG
10900 && (((GET_MODE_SIZE (GET_MODE (dest))
10901 + UNITS_PER_WORD - 1) / UNITS_PER_WORD)
10902 == ((GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest)))
10903 + UNITS_PER_WORD - 1) / UNITS_PER_WORD))))
10905 move_deaths (dest, maybe_kill_insn, from_cuid, to_insn, pnotes);
10906 return;
10909 /* If this is some other SUBREG, we know it replaces the entire
10910 value, so use that as the destination. */
10911 if (GET_CODE (dest) == SUBREG)
10912 dest = SUBREG_REG (dest);
10914 /* If this is a MEM, adjust deaths of anything used in the address.
10915 For a REG (the only other possibility), the entire value is
10916 being replaced so the old value is not used in this insn. */
10918 if (GET_CODE (dest) == MEM)
10919 move_deaths (XEXP (dest, 0), maybe_kill_insn, from_cuid,
10920 to_insn, pnotes);
10921 return;
10924 else if (GET_CODE (x) == CLOBBER)
10925 return;
10927 len = GET_RTX_LENGTH (code);
10928 fmt = GET_RTX_FORMAT (code);
10930 for (i = 0; i < len; i++)
10932 if (fmt[i] == 'E')
10934 register int j;
10935 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10936 move_deaths (XVECEXP (x, i, j), maybe_kill_insn, from_cuid,
10937 to_insn, pnotes);
10939 else if (fmt[i] == 'e')
10940 move_deaths (XEXP (x, i), maybe_kill_insn, from_cuid, to_insn, pnotes);
10944 /* Return 1 if X is the target of a bit-field assignment in BODY, the
10945 pattern of an insn. X must be a REG. */
10947 static int
10948 reg_bitfield_target_p (x, body)
10949 rtx x;
10950 rtx body;
10952 int i;
10954 if (GET_CODE (body) == SET)
10956 rtx dest = SET_DEST (body);
10957 rtx target;
10958 int regno, tregno, endregno, endtregno;
10960 if (GET_CODE (dest) == ZERO_EXTRACT)
10961 target = XEXP (dest, 0);
10962 else if (GET_CODE (dest) == STRICT_LOW_PART)
10963 target = SUBREG_REG (XEXP (dest, 0));
10964 else
10965 return 0;
10967 if (GET_CODE (target) == SUBREG)
10968 target = SUBREG_REG (target);
10970 if (GET_CODE (target) != REG)
10971 return 0;
10973 tregno = REGNO (target), regno = REGNO (x);
10974 if (tregno >= FIRST_PSEUDO_REGISTER || regno >= FIRST_PSEUDO_REGISTER)
10975 return target == x;
10977 endtregno = tregno + HARD_REGNO_NREGS (tregno, GET_MODE (target));
10978 endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
10980 return endregno > tregno && regno < endtregno;
10983 else if (GET_CODE (body) == PARALLEL)
10984 for (i = XVECLEN (body, 0) - 1; i >= 0; i--)
10985 if (reg_bitfield_target_p (x, XVECEXP (body, 0, i)))
10986 return 1;
10988 return 0;
10991 /* Given a chain of REG_NOTES originally from FROM_INSN, try to place them
10992 as appropriate. I3 and I2 are the insns resulting from the combination
10993 insns including FROM (I2 may be zero).
10995 ELIM_I2 and ELIM_I1 are either zero or registers that we know will
10996 not need REG_DEAD notes because they are being substituted for. This
10997 saves searching in the most common cases.
10999 Each note in the list is either ignored or placed on some insns, depending
11000 on the type of note. */
11002 static void
11003 distribute_notes (notes, from_insn, i3, i2, elim_i2, elim_i1)
11004 rtx notes;
11005 rtx from_insn;
11006 rtx i3, i2;
11007 rtx elim_i2, elim_i1;
11009 rtx note, next_note;
11010 rtx tem;
11012 for (note = notes; note; note = next_note)
11014 rtx place = 0, place2 = 0;
11016 /* If this NOTE references a pseudo register, ensure it references
11017 the latest copy of that register. */
11018 if (XEXP (note, 0) && GET_CODE (XEXP (note, 0)) == REG
11019 && REGNO (XEXP (note, 0)) >= FIRST_PSEUDO_REGISTER)
11020 XEXP (note, 0) = regno_reg_rtx[REGNO (XEXP (note, 0))];
11022 next_note = XEXP (note, 1);
11023 switch (REG_NOTE_KIND (note))
11025 case REG_BR_PROB:
11026 case REG_EXEC_COUNT:
11027 /* Doesn't matter much where we put this, as long as it's somewhere.
11028 It is preferable to keep these notes on branches, which is most
11029 likely to be i3. */
11030 place = i3;
11031 break;
11033 case REG_UNUSED:
11034 /* Any clobbers for i3 may still exist, and so we must process
11035 REG_UNUSED notes from that insn.
11037 Any clobbers from i2 or i1 can only exist if they were added by
11038 recog_for_combine. In that case, recog_for_combine created the
11039 necessary REG_UNUSED notes. Trying to keep any original
11040 REG_UNUSED notes from these insns can cause incorrect output
11041 if it is for the same register as the original i3 dest.
11042 In that case, we will notice that the register is set in i3,
11043 and then add a REG_UNUSED note for the destination of i3, which
11044 is wrong. However, it is possible to have REG_UNUSED notes from
11045 i2 or i1 for register which were both used and clobbered, so
11046 we keep notes from i2 or i1 if they will turn into REG_DEAD
11047 notes. */
11049 /* If this register is set or clobbered in I3, put the note there
11050 unless there is one already. */
11051 if (reg_set_p (XEXP (note, 0), PATTERN (i3)))
11053 if (from_insn != i3)
11054 break;
11056 if (! (GET_CODE (XEXP (note, 0)) == REG
11057 ? find_regno_note (i3, REG_UNUSED, REGNO (XEXP (note, 0)))
11058 : find_reg_note (i3, REG_UNUSED, XEXP (note, 0))))
11059 place = i3;
11061 /* Otherwise, if this register is used by I3, then this register
11062 now dies here, so we must put a REG_DEAD note here unless there
11063 is one already. */
11064 else if (reg_referenced_p (XEXP (note, 0), PATTERN (i3))
11065 && ! (GET_CODE (XEXP (note, 0)) == REG
11066 ? find_regno_note (i3, REG_DEAD, REGNO (XEXP (note, 0)))
11067 : find_reg_note (i3, REG_DEAD, XEXP (note, 0))))
11069 PUT_REG_NOTE_KIND (note, REG_DEAD);
11070 place = i3;
11072 break;
11074 case REG_EQUAL:
11075 case REG_EQUIV:
11076 case REG_NONNEG:
11077 case REG_NOALIAS:
11078 /* These notes say something about results of an insn. We can
11079 only support them if they used to be on I3 in which case they
11080 remain on I3. Otherwise they are ignored.
11082 If the note refers to an expression that is not a constant, we
11083 must also ignore the note since we cannot tell whether the
11084 equivalence is still true. It might be possible to do
11085 slightly better than this (we only have a problem if I2DEST
11086 or I1DEST is present in the expression), but it doesn't
11087 seem worth the trouble. */
11089 if (from_insn == i3
11090 && (XEXP (note, 0) == 0 || CONSTANT_P (XEXP (note, 0))))
11091 place = i3;
11092 break;
11094 case REG_INC:
11095 case REG_NO_CONFLICT:
11096 case REG_LABEL:
11097 /* These notes say something about how a register is used. They must
11098 be present on any use of the register in I2 or I3. */
11099 if (reg_mentioned_p (XEXP (note, 0), PATTERN (i3)))
11100 place = i3;
11102 if (i2 && reg_mentioned_p (XEXP (note, 0), PATTERN (i2)))
11104 if (place)
11105 place2 = i2;
11106 else
11107 place = i2;
11109 break;
11111 case REG_WAS_0:
11112 /* It is too much trouble to try to see if this note is still
11113 correct in all situations. It is better to simply delete it. */
11114 break;
11116 case REG_RETVAL:
11117 /* If the insn previously containing this note still exists,
11118 put it back where it was. Otherwise move it to the previous
11119 insn. Adjust the corresponding REG_LIBCALL note. */
11120 if (GET_CODE (from_insn) != NOTE)
11121 place = from_insn;
11122 else
11124 tem = find_reg_note (XEXP (note, 0), REG_LIBCALL, NULL_RTX);
11125 place = prev_real_insn (from_insn);
11126 if (tem && place)
11127 XEXP (tem, 0) = place;
11129 break;
11131 case REG_LIBCALL:
11132 /* This is handled similarly to REG_RETVAL. */
11133 if (GET_CODE (from_insn) != NOTE)
11134 place = from_insn;
11135 else
11137 tem = find_reg_note (XEXP (note, 0), REG_RETVAL, NULL_RTX);
11138 place = next_real_insn (from_insn);
11139 if (tem && place)
11140 XEXP (tem, 0) = place;
11142 break;
11144 case REG_DEAD:
11145 /* If the register is used as an input in I3, it dies there.
11146 Similarly for I2, if it is non-zero and adjacent to I3.
11148 If the register is not used as an input in either I3 or I2
11149 and it is not one of the registers we were supposed to eliminate,
11150 there are two possibilities. We might have a non-adjacent I2
11151 or we might have somehow eliminated an additional register
11152 from a computation. For example, we might have had A & B where
11153 we discover that B will always be zero. In this case we will
11154 eliminate the reference to A.
11156 In both cases, we must search to see if we can find a previous
11157 use of A and put the death note there. */
11159 if (from_insn
11160 && GET_CODE (from_insn) == CALL_INSN
11161 && find_reg_fusage (from_insn, USE, XEXP (note, 0)))
11162 place = from_insn;
11163 else if (reg_referenced_p (XEXP (note, 0), PATTERN (i3)))
11164 place = i3;
11165 else if (i2 != 0 && next_nonnote_insn (i2) == i3
11166 && reg_referenced_p (XEXP (note, 0), PATTERN (i2)))
11167 place = i2;
11169 if (XEXP (note, 0) == elim_i2 || XEXP (note, 0) == elim_i1)
11170 break;
11172 /* If the register is used in both I2 and I3 and it dies in I3,
11173 we might have added another reference to it. If reg_n_refs
11174 was 2, bump it to 3. This has to be correct since the
11175 register must have been set somewhere. The reason this is
11176 done is because local-alloc.c treats 2 references as a
11177 special case. */
11179 if (place == i3 && i2 != 0 && GET_CODE (XEXP (note, 0)) == REG
11180 && REG_N_REFS (REGNO (XEXP (note, 0)))== 2
11181 && reg_referenced_p (XEXP (note, 0), PATTERN (i2)))
11182 REG_N_REFS (REGNO (XEXP (note, 0))) = 3;
11184 if (place == 0)
11186 for (tem = prev_nonnote_insn (i3);
11187 place == 0 && tem
11188 && (GET_CODE (tem) == INSN || GET_CODE (tem) == CALL_INSN);
11189 tem = prev_nonnote_insn (tem))
11191 /* If the register is being set at TEM, see if that is all
11192 TEM is doing. If so, delete TEM. Otherwise, make this
11193 into a REG_UNUSED note instead. */
11194 if (reg_set_p (XEXP (note, 0), PATTERN (tem)))
11196 rtx set = single_set (tem);
11198 /* Verify that it was the set, and not a clobber that
11199 modified the register. */
11201 if (set != 0 && ! side_effects_p (SET_SRC (set))
11202 && (rtx_equal_p (XEXP (note, 0), SET_DEST (set))
11203 || (GET_CODE (SET_DEST (set)) == SUBREG
11204 && rtx_equal_p (XEXP (note, 0),
11205 XEXP (SET_DEST (set), 0)))))
11207 /* Move the notes and links of TEM elsewhere.
11208 This might delete other dead insns recursively.
11209 First set the pattern to something that won't use
11210 any register. */
11212 PATTERN (tem) = pc_rtx;
11214 distribute_notes (REG_NOTES (tem), tem, tem,
11215 NULL_RTX, NULL_RTX, NULL_RTX);
11216 distribute_links (LOG_LINKS (tem));
11218 PUT_CODE (tem, NOTE);
11219 NOTE_LINE_NUMBER (tem) = NOTE_INSN_DELETED;
11220 NOTE_SOURCE_FILE (tem) = 0;
11222 else
11224 PUT_REG_NOTE_KIND (note, REG_UNUSED);
11226 /* If there isn't already a REG_UNUSED note, put one
11227 here. */
11228 if (! find_regno_note (tem, REG_UNUSED,
11229 REGNO (XEXP (note, 0))))
11230 place = tem;
11231 break;
11234 else if (reg_referenced_p (XEXP (note, 0), PATTERN (tem))
11235 || (GET_CODE (tem) == CALL_INSN
11236 && find_reg_fusage (tem, USE, XEXP (note, 0))))
11238 place = tem;
11240 /* If we are doing a 3->2 combination, and we have a
11241 register which formerly died in i3 and was not used
11242 by i2, which now no longer dies in i3 and is used in
11243 i2 but does not die in i2, and place is between i2
11244 and i3, then we may need to move a link from place to
11245 i2. */
11246 if (i2 && INSN_UID (place) <= max_uid_cuid
11247 && INSN_CUID (place) > INSN_CUID (i2)
11248 && from_insn && INSN_CUID (from_insn) > INSN_CUID (i2)
11249 && reg_referenced_p (XEXP (note, 0), PATTERN (i2)))
11251 rtx links = LOG_LINKS (place);
11252 LOG_LINKS (place) = 0;
11253 distribute_links (links);
11255 break;
11259 /* If we haven't found an insn for the death note and it
11260 is still a REG_DEAD note, but we have hit a CODE_LABEL,
11261 insert a USE insn for the register at that label and
11262 put the death node there. This prevents problems with
11263 call-state tracking in caller-save.c. */
11264 if (REG_NOTE_KIND (note) == REG_DEAD && place == 0 && tem != 0)
11266 place
11267 = emit_insn_after (gen_rtx (USE, VOIDmode, XEXP (note, 0)),
11268 tem);
11270 /* If this insn was emitted between blocks, then update
11271 basic_block_head of the current block to include it. */
11272 if (basic_block_end[this_basic_block - 1] == tem)
11273 basic_block_head[this_basic_block] = place;
11277 /* If the register is set or already dead at PLACE, we needn't do
11278 anything with this note if it is still a REG_DEAD note.
11280 Note that we cannot use just `dead_or_set_p' here since we can
11281 convert an assignment to a register into a bit-field assignment.
11282 Therefore, we must also omit the note if the register is the
11283 target of a bitfield assignment. */
11285 if (place && REG_NOTE_KIND (note) == REG_DEAD)
11287 int regno = REGNO (XEXP (note, 0));
11289 if (dead_or_set_p (place, XEXP (note, 0))
11290 || reg_bitfield_target_p (XEXP (note, 0), PATTERN (place)))
11292 /* Unless the register previously died in PLACE, clear
11293 reg_last_death. [I no longer understand why this is
11294 being done.] */
11295 if (reg_last_death[regno] != place)
11296 reg_last_death[regno] = 0;
11297 place = 0;
11299 else
11300 reg_last_death[regno] = place;
11302 /* If this is a death note for a hard reg that is occupying
11303 multiple registers, ensure that we are still using all
11304 parts of the object. If we find a piece of the object
11305 that is unused, we must add a USE for that piece before
11306 PLACE and put the appropriate REG_DEAD note on it.
11308 An alternative would be to put a REG_UNUSED for the pieces
11309 on the insn that set the register, but that can't be done if
11310 it is not in the same block. It is simpler, though less
11311 efficient, to add the USE insns. */
11313 if (place && regno < FIRST_PSEUDO_REGISTER
11314 && HARD_REGNO_NREGS (regno, GET_MODE (XEXP (note, 0))) > 1)
11316 int endregno
11317 = regno + HARD_REGNO_NREGS (regno,
11318 GET_MODE (XEXP (note, 0)));
11319 int all_used = 1;
11320 int i;
11322 for (i = regno; i < endregno; i++)
11323 if (! refers_to_regno_p (i, i + 1, PATTERN (place), 0)
11324 && ! find_regno_fusage (place, USE, i))
11326 rtx piece = gen_rtx (REG, reg_raw_mode[i], i);
11327 rtx p;
11329 /* See if we already placed a USE note for this
11330 register in front of PLACE. */
11331 for (p = place;
11332 GET_CODE (PREV_INSN (p)) == INSN
11333 && GET_CODE (PATTERN (PREV_INSN (p))) == USE;
11334 p = PREV_INSN (p))
11335 if (rtx_equal_p (piece,
11336 XEXP (PATTERN (PREV_INSN (p)), 0)))
11338 p = 0;
11339 break;
11342 if (p)
11344 rtx use_insn
11345 = emit_insn_before (gen_rtx (USE, VOIDmode,
11346 piece),
11348 REG_NOTES (use_insn)
11349 = gen_rtx (EXPR_LIST, REG_DEAD, piece,
11350 REG_NOTES (use_insn));
11353 all_used = 0;
11356 /* Check for the case where the register dying partially
11357 overlaps the register set by this insn. */
11358 if (all_used)
11359 for (i = regno; i < endregno; i++)
11360 if (dead_or_set_regno_p (place, i))
11362 all_used = 0;
11363 break;
11366 if (! all_used)
11368 /* Put only REG_DEAD notes for pieces that are
11369 still used and that are not already dead or set. */
11371 for (i = regno; i < endregno; i++)
11373 rtx piece = gen_rtx (REG, reg_raw_mode[i], i);
11375 if ((reg_referenced_p (piece, PATTERN (place))
11376 || (GET_CODE (place) == CALL_INSN
11377 && find_reg_fusage (place, USE, piece)))
11378 && ! dead_or_set_p (place, piece)
11379 && ! reg_bitfield_target_p (piece,
11380 PATTERN (place)))
11381 REG_NOTES (place) = gen_rtx (EXPR_LIST, REG_DEAD,
11382 piece,
11383 REG_NOTES (place));
11386 place = 0;
11390 break;
11392 default:
11393 /* Any other notes should not be present at this point in the
11394 compilation. */
11395 abort ();
11398 if (place)
11400 XEXP (note, 1) = REG_NOTES (place);
11401 REG_NOTES (place) = note;
11403 else if ((REG_NOTE_KIND (note) == REG_DEAD
11404 || REG_NOTE_KIND (note) == REG_UNUSED)
11405 && GET_CODE (XEXP (note, 0)) == REG)
11406 REG_N_DEATHS (REGNO (XEXP (note, 0)))--;
11408 if (place2)
11410 if ((REG_NOTE_KIND (note) == REG_DEAD
11411 || REG_NOTE_KIND (note) == REG_UNUSED)
11412 && GET_CODE (XEXP (note, 0)) == REG)
11413 REG_N_DEATHS (REGNO (XEXP (note, 0)))++;
11415 REG_NOTES (place2) = gen_rtx (GET_CODE (note), REG_NOTE_KIND (note),
11416 XEXP (note, 0), REG_NOTES (place2));
11421 /* Similarly to above, distribute the LOG_LINKS that used to be present on
11422 I3, I2, and I1 to new locations. This is also called in one case to
11423 add a link pointing at I3 when I3's destination is changed. */
11425 static void
11426 distribute_links (links)
11427 rtx links;
11429 rtx link, next_link;
11431 for (link = links; link; link = next_link)
11433 rtx place = 0;
11434 rtx insn;
11435 rtx set, reg;
11437 next_link = XEXP (link, 1);
11439 /* If the insn that this link points to is a NOTE or isn't a single
11440 set, ignore it. In the latter case, it isn't clear what we
11441 can do other than ignore the link, since we can't tell which
11442 register it was for. Such links wouldn't be used by combine
11443 anyway.
11445 It is not possible for the destination of the target of the link to
11446 have been changed by combine. The only potential of this is if we
11447 replace I3, I2, and I1 by I3 and I2. But in that case the
11448 destination of I2 also remains unchanged. */
11450 if (GET_CODE (XEXP (link, 0)) == NOTE
11451 || (set = single_set (XEXP (link, 0))) == 0)
11452 continue;
11454 reg = SET_DEST (set);
11455 while (GET_CODE (reg) == SUBREG || GET_CODE (reg) == ZERO_EXTRACT
11456 || GET_CODE (reg) == SIGN_EXTRACT
11457 || GET_CODE (reg) == STRICT_LOW_PART)
11458 reg = XEXP (reg, 0);
11460 /* A LOG_LINK is defined as being placed on the first insn that uses
11461 a register and points to the insn that sets the register. Start
11462 searching at the next insn after the target of the link and stop
11463 when we reach a set of the register or the end of the basic block.
11465 Note that this correctly handles the link that used to point from
11466 I3 to I2. Also note that not much searching is typically done here
11467 since most links don't point very far away. */
11469 for (insn = NEXT_INSN (XEXP (link, 0));
11470 (insn && (this_basic_block == n_basic_blocks - 1
11471 || basic_block_head[this_basic_block + 1] != insn));
11472 insn = NEXT_INSN (insn))
11473 if (GET_RTX_CLASS (GET_CODE (insn)) == 'i'
11474 && reg_overlap_mentioned_p (reg, PATTERN (insn)))
11476 if (reg_referenced_p (reg, PATTERN (insn)))
11477 place = insn;
11478 break;
11480 else if (GET_CODE (insn) == CALL_INSN
11481 && find_reg_fusage (insn, USE, reg))
11483 place = insn;
11484 break;
11487 /* If we found a place to put the link, place it there unless there
11488 is already a link to the same insn as LINK at that point. */
11490 if (place)
11492 rtx link2;
11494 for (link2 = LOG_LINKS (place); link2; link2 = XEXP (link2, 1))
11495 if (XEXP (link2, 0) == XEXP (link, 0))
11496 break;
11498 if (link2 == 0)
11500 XEXP (link, 1) = LOG_LINKS (place);
11501 LOG_LINKS (place) = link;
11503 /* Set added_links_insn to the earliest insn we added a
11504 link to. */
11505 if (added_links_insn == 0
11506 || INSN_CUID (added_links_insn) > INSN_CUID (place))
11507 added_links_insn = place;
11513 /* Compute INSN_CUID for INSN, which is an insn made by combine. */
11515 static int
11516 insn_cuid (insn)
11517 rtx insn;
11519 while (insn != 0 && INSN_UID (insn) > max_uid_cuid
11520 && GET_CODE (insn) == INSN && GET_CODE (PATTERN (insn)) == USE)
11521 insn = NEXT_INSN (insn);
11523 if (INSN_UID (insn) > max_uid_cuid)
11524 abort ();
11526 return INSN_CUID (insn);
11529 void
11530 dump_combine_stats (file)
11531 FILE *file;
11533 fprintf
11534 (file,
11535 ";; Combiner statistics: %d attempts, %d substitutions (%d requiring new space),\n;; %d successes.\n\n",
11536 combine_attempts, combine_merges, combine_extras, combine_successes);
11539 void
11540 dump_combine_total_stats (file)
11541 FILE *file;
11543 fprintf
11544 (file,
11545 "\n;; Combiner totals: %d attempts, %d substitutions (%d requiring new space),\n;; %d successes.\n",
11546 total_attempts, total_merges, total_extras, total_successes);