/* RTL simplification functions for GNU compiler.
   Copyright (C) 1987-2019 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
#include "coretypes.h"
#include "diagnostic-core.h"
#include "selftest-rtl.h"
#include "rtx-vector-builder.h"
/* Simplification and canonicalization of RTL.  */

/* Much code operates on (low, high) pairs; the low value is an
   unsigned wide int, the high value a signed wide int.  We
   occasionally need to sign extend from low to high as if low were a
   signed wide int.  */
#define HWI_SIGN_EXTEND(low) \
  ((((HOST_WIDE_INT) low) < 0) ? HOST_WIDE_INT_M1 : HOST_WIDE_INT_0)
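/* Added note (illustrative, not part of the original source): the macro
   computes the high half that a two-word sign extension of LOW would
   have.  For example, HWI_SIGN_EXTEND (HOST_WIDE_INT_M1) evaluates to
   HOST_WIDE_INT_M1, because -1 is negative when viewed as a signed
   HOST_WIDE_INT, while HWI_SIGN_EXTEND (1) evaluates to
   HOST_WIDE_INT_0.  */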
static bool plus_minus_operand_p (const_rtx);
static rtx simplify_plus_minus (enum rtx_code, machine_mode, rtx, rtx);
static rtx simplify_associative_operation (enum rtx_code, machine_mode,
					   rtx, rtx);
static rtx simplify_relational_operation_1 (enum rtx_code, machine_mode,
					    machine_mode, rtx, rtx);
static rtx simplify_unary_operation_1 (enum rtx_code, machine_mode, rtx);
static rtx simplify_binary_operation_1 (enum rtx_code, machine_mode,
					rtx, rtx, rtx, rtx);
/* Negate I, which satisfies poly_int_rtx_p.  MODE is the mode of I.  */

static rtx
neg_poly_int_rtx (machine_mode mode, const_rtx i)
{
  return immed_wide_int_const (-wi::to_poly_wide (i, mode), mode);
}
/* Test whether expression, X, is an immediate constant that represents
   the most significant bit of machine mode MODE.  */

bool
mode_signbit_p (machine_mode mode, const_rtx x)
{
  unsigned HOST_WIDE_INT val;
  unsigned int width;
  scalar_int_mode int_mode;

  if (!is_int_mode (mode, &int_mode))
    return false;

  width = GET_MODE_PRECISION (int_mode);
  if (width == 0)
    return false;

  if (width <= HOST_BITS_PER_WIDE_INT
      && CONST_INT_P (x))
    val = INTVAL (x);
#if TARGET_SUPPORTS_WIDE_INT
  else if (CONST_WIDE_INT_P (x))
    {
      unsigned int i;
      unsigned int elts = CONST_WIDE_INT_NUNITS (x);
      if (elts != (width + HOST_BITS_PER_WIDE_INT - 1) / HOST_BITS_PER_WIDE_INT)
	return false;
      for (i = 0; i < elts - 1; i++)
	if (CONST_WIDE_INT_ELT (x, i) != 0)
	  return false;
      val = CONST_WIDE_INT_ELT (x, elts - 1);
      width %= HOST_BITS_PER_WIDE_INT;
      if (width == 0)
	width = HOST_BITS_PER_WIDE_INT;
    }
#else
  else if (width <= HOST_BITS_PER_DOUBLE_INT
	   && CONST_DOUBLE_AS_INT_P (x)
	   && CONST_DOUBLE_LOW (x) == 0)
    {
      val = CONST_DOUBLE_HIGH (x);
      width -= HOST_BITS_PER_WIDE_INT;
    }
#endif
  else
    /* X is not an integer constant.  */
    return false;

  if (width < HOST_BITS_PER_WIDE_INT)
    val &= (HOST_WIDE_INT_1U << width) - 1;
  return val == (HOST_WIDE_INT_1U << (width - 1));
}
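/* Worked example (illustrative, not part of the original source): for
   SImode, whose precision is 32, the sign bit constant is 1 << 31, so

     mode_signbit_p (SImode, gen_int_mode (HOST_WIDE_INT_1U << 31, SImode))

   is expected to return true, whereas any other value, e.g. 1 << 30,
   yields false.  */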
/* Test whether VAL is equal to the most significant bit of mode MODE
   (after masking with the mode mask of MODE).  Returns false if the
   precision of MODE is too large to handle.  */

bool
val_signbit_p (machine_mode mode, unsigned HOST_WIDE_INT val)
{
  unsigned int width;
  scalar_int_mode int_mode;

  if (!is_int_mode (mode, &int_mode))
    return false;

  width = GET_MODE_PRECISION (int_mode);
  if (width == 0 || width > HOST_BITS_PER_WIDE_INT)
    return false;

  val &= GET_MODE_MASK (int_mode);
  return val == (HOST_WIDE_INT_1U << (width - 1));
}
/* Test whether the most significant bit of mode MODE is set in VAL.
   Returns false if the precision of MODE is too large to handle.  */
bool
val_signbit_known_set_p (machine_mode mode, unsigned HOST_WIDE_INT val)
{
  unsigned int width;

  scalar_int_mode int_mode;
  if (!is_int_mode (mode, &int_mode))
    return false;

  width = GET_MODE_PRECISION (int_mode);
  if (width == 0 || width > HOST_BITS_PER_WIDE_INT)
    return false;

  val &= HOST_WIDE_INT_1U << (width - 1);
  return val != 0;
}
/* Test whether the most significant bit of mode MODE is clear in VAL.
   Returns false if the precision of MODE is too large to handle.  */
bool
val_signbit_known_clear_p (machine_mode mode, unsigned HOST_WIDE_INT val)
{
  unsigned int width;

  scalar_int_mode int_mode;
  if (!is_int_mode (mode, &int_mode))
    return false;

  width = GET_MODE_PRECISION (int_mode);
  if (width == 0 || width > HOST_BITS_PER_WIDE_INT)
    return false;

  val &= HOST_WIDE_INT_1U << (width - 1);
  return val == 0;
}
/* Make a binary operation by properly ordering the operands and
   seeing if the expression folds.  */

rtx
simplify_gen_binary (enum rtx_code code, machine_mode mode, rtx op0,
		     rtx op1)
{
  rtx tem;

  /* If this simplifies, do it.  */
  tem = simplify_binary_operation (code, mode, op0, op1);
  if (tem)
    return tem;

  /* Put complex operands first and constants second if commutative.  */
  if (GET_RTX_CLASS (code) == RTX_COMM_ARITH
      && swap_commutative_operands_p (op0, op1))
    std::swap (op0, op1);

  return gen_rtx_fmt_ee (code, mode, op0, op1);
}
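/* Example (illustrative, not part of the original source): PLUS is
   RTX_COMM_ARITH, so a call such as

     simplify_gen_binary (PLUS, SImode, GEN_INT (4), reg)

   where "reg" is some SImode REG rtx, swaps the operands and produces
   (plus:SI reg (const_int 4)) unless the whole expression folds
   further (e.g. when "reg" is itself a constant).  */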
/* If X is a MEM referencing the constant pool, return the real value.
   Otherwise return X.  */
rtx
avoid_constant_pool_reference (rtx x)
{
  rtx c, tmp, addr;
  machine_mode cmode;
  poly_int64 offset = 0;

  switch (GET_CODE (x))
    {
    case MEM:
      break;

    case FLOAT_EXTEND:
      /* Handle float extensions of constant pool references.  */
      tmp = XEXP (x, 0);
      c = avoid_constant_pool_reference (tmp);
      if (c != tmp && CONST_DOUBLE_AS_FLOAT_P (c))
	return const_double_from_real_value (*CONST_DOUBLE_REAL_VALUE (c),
					     GET_MODE (x));
      return x;

    default:
      return x;
    }

  if (GET_MODE (x) == BLKmode)
    return x;

  addr = XEXP (x, 0);

  /* Call target hook to avoid the effects of -fpic etc....  */
  addr = targetm.delegitimize_address (addr);

  /* Split the address into a base and integer offset.  */
  addr = strip_offset (addr, &offset);

  if (GET_CODE (addr) == LO_SUM)
    addr = XEXP (addr, 1);

  /* If this is a constant pool reference, we can turn it into its
     constant and hope that simplifications happen.  */
  if (GET_CODE (addr) == SYMBOL_REF
      && CONSTANT_POOL_ADDRESS_P (addr))
    {
      c = get_pool_constant (addr);
      cmode = get_pool_mode (addr);

      /* If we're accessing the constant in a different mode than it was
	 originally stored, attempt to fix that up via subreg simplifications.
	 If that fails we have no choice but to return the original memory.  */
      if (known_eq (offset, 0) && cmode == GET_MODE (x))
	return c;
      else if (known_in_range_p (offset, 0, GET_MODE_SIZE (cmode)))
	{
	  rtx tem = simplify_subreg (GET_MODE (x), c, cmode, offset);
	  if (tem && CONSTANT_P (tem))
	    return tem;
	}
    }

  return x;
}
/* Simplify a MEM based on its attributes.  This is the default
   delegitimize_address target hook, and it's recommended that every
   overrider call it.  */

rtx
delegitimize_mem_from_attrs (rtx x)
{
  /* MEMs without MEM_OFFSETs may have been offset, so we can't just
     use their base addresses as equivalent.  */
  if (MEM_P (x)
      && MEM_EXPR (x)
      && MEM_OFFSET_KNOWN_P (x))
    {
      tree decl = MEM_EXPR (x);
      machine_mode mode = GET_MODE (x);
      poly_int64 offset = 0;

      switch (TREE_CODE (decl))
	{
	default:
	  decl = NULL;
	  break;

	case VAR_DECL:
	  break;

	case ARRAY_REF:
	case ARRAY_RANGE_REF:
	case COMPONENT_REF:
	case BIT_FIELD_REF:
	case REALPART_EXPR:
	case IMAGPART_EXPR:
	case VIEW_CONVERT_EXPR:
	  {
	    poly_int64 bitsize, bitpos, bytepos, toffset_val = 0;
	    tree toffset;
	    int unsignedp, reversep, volatilep = 0;

	    decl
	      = get_inner_reference (decl, &bitsize, &bitpos, &toffset, &mode,
				     &unsignedp, &reversep, &volatilep);
	    if (maybe_ne (bitsize, GET_MODE_BITSIZE (mode))
		|| !multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
		|| (toffset && !poly_int_tree_p (toffset, &toffset_val)))
	      decl = NULL;
	    else
	      offset += bytepos + toffset_val;
	    break;
	  }
	}

      if (decl
	  && mode == GET_MODE (x)
	  && VAR_P (decl)
	  && (TREE_STATIC (decl)
	      || DECL_THREAD_LOCAL_P (decl))
	  && DECL_RTL_SET_P (decl)
	  && MEM_P (DECL_RTL (decl)))
	{
	  rtx newx;

	  offset += MEM_OFFSET (x);

	  newx = DECL_RTL (decl);

	  if (MEM_P (newx))
	    {
	      rtx n = XEXP (newx, 0), o = XEXP (x, 0);
	      poly_int64 n_offset, o_offset;

	      /* Avoid creating a new MEM needlessly if we already had
		 the same address.  We do if there's no OFFSET and the
		 old address X is identical to NEWX, or if X is of the
		 form (plus NEWX OFFSET), or the NEWX is of the form
		 (plus Y (const_int Z)) and X is that with the offset
		 added: (plus Y (const_int Z+OFFSET)).  */
	      n = strip_offset (n, &n_offset);
	      o = strip_offset (o, &o_offset);
	      if (!(known_eq (o_offset, n_offset + offset)
		    && rtx_equal_p (o, n)))
		x = adjust_address_nv (newx, mode, offset);
	    }
	  else if (GET_MODE (x) == GET_MODE (newx)
		   && known_eq (offset, 0))
	    x = newx;
	}
    }

  return x;
}
/* Make a unary operation by first seeing if it folds and otherwise making
   the specified operation.  */

rtx
simplify_gen_unary (enum rtx_code code, machine_mode mode, rtx op,
		    machine_mode op_mode)
{
  rtx tem;

  /* If this simplifies, use it.  */
  if ((tem = simplify_unary_operation (code, mode, op, op_mode)) != 0)
    return tem;

  return gen_rtx_fmt_e (code, mode, op);
}
/* Likewise for ternary operations.  */

rtx
simplify_gen_ternary (enum rtx_code code, machine_mode mode,
		      machine_mode op0_mode, rtx op0, rtx op1, rtx op2)
{
  rtx tem;

  /* If this simplifies, use it.  */
  if ((tem = simplify_ternary_operation (code, mode, op0_mode,
					 op0, op1, op2)) != 0)
    return tem;

  return gen_rtx_fmt_eee (code, mode, op0, op1, op2);
}
/* Likewise, for relational operations.
   CMP_MODE specifies mode comparison is done in.  */

rtx
simplify_gen_relational (enum rtx_code code, machine_mode mode,
			 machine_mode cmp_mode, rtx op0, rtx op1)
{
  rtx tem;

  if ((tem = simplify_relational_operation (code, mode, cmp_mode,
					    op0, op1)) != 0)
    return tem;

  return gen_rtx_fmt_ee (code, mode, op0, op1);
}
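/* Usage sketch (illustrative, not part of the original source): a caller
   wanting the folded form of "reg << 2" in SImode, for some SImode REG
   rtx "reg", would write

     rtx x = simplify_gen_binary (ASHIFT, SImode, reg, GEN_INT (2));

   and get back either a simplified rtx (e.g. a CONST_INT when "reg" is
   replaced by a constant) or a fresh (ashift:SI reg (const_int 2)).
   The unary, ternary and relational wrappers above behave the same way
   for their respective arities.  */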
/* If FN is NULL, replace all occurrences of OLD_RTX in X with copy_rtx (DATA)
   and simplify the result.  If FN is non-NULL, call this callback on each
   X, if it returns non-NULL, replace X with its return value and simplify the
   result.  */

rtx
simplify_replace_fn_rtx (rtx x, const_rtx old_rtx,
			 rtx (*fn) (rtx, const_rtx, void *), void *data)
{
  enum rtx_code code = GET_CODE (x);
  machine_mode mode = GET_MODE (x);
  machine_mode op_mode;
  const char *fmt;
  rtx op0, op1, op2, newx, op;
  rtvec vec, newvec;
  int i, j;

  if (__builtin_expect (fn != NULL, 0))
    {
      newx = fn (x, old_rtx, data);
      if (newx)
	return newx;
    }
  else if (rtx_equal_p (x, old_rtx))
    return copy_rtx ((rtx) data);

  switch (GET_RTX_CLASS (code))
    {
    case RTX_UNARY:
      op0 = XEXP (x, 0);
      op_mode = GET_MODE (op0);
      op0 = simplify_replace_fn_rtx (op0, old_rtx, fn, data);
      if (op0 == XEXP (x, 0))
	return x;
      return simplify_gen_unary (code, mode, op0, op_mode);

    case RTX_BIN_ARITH:
    case RTX_COMM_ARITH:
      op0 = simplify_replace_fn_rtx (XEXP (x, 0), old_rtx, fn, data);
      op1 = simplify_replace_fn_rtx (XEXP (x, 1), old_rtx, fn, data);
      if (op0 == XEXP (x, 0) && op1 == XEXP (x, 1))
	return x;
      return simplify_gen_binary (code, mode, op0, op1);

    case RTX_COMPARE:
    case RTX_COMM_COMPARE:
      op0 = XEXP (x, 0);
      op1 = XEXP (x, 1);
      op_mode = GET_MODE (op0) != VOIDmode ? GET_MODE (op0) : GET_MODE (op1);
      op0 = simplify_replace_fn_rtx (op0, old_rtx, fn, data);
      op1 = simplify_replace_fn_rtx (op1, old_rtx, fn, data);
      if (op0 == XEXP (x, 0) && op1 == XEXP (x, 1))
	return x;
      return simplify_gen_relational (code, mode, op_mode, op0, op1);

    case RTX_TERNARY:
    case RTX_BITFIELD_OPS:
      op0 = XEXP (x, 0);
      op_mode = GET_MODE (op0);
      op0 = simplify_replace_fn_rtx (op0, old_rtx, fn, data);
      op1 = simplify_replace_fn_rtx (XEXP (x, 1), old_rtx, fn, data);
      op2 = simplify_replace_fn_rtx (XEXP (x, 2), old_rtx, fn, data);
      if (op0 == XEXP (x, 0) && op1 == XEXP (x, 1) && op2 == XEXP (x, 2))
	return x;
      if (op_mode == VOIDmode)
	op_mode = GET_MODE (op0);
      return simplify_gen_ternary (code, mode, op_mode, op0, op1, op2);

    case RTX_EXTRA:
      if (code == SUBREG)
	{
	  op0 = simplify_replace_fn_rtx (SUBREG_REG (x), old_rtx, fn, data);
	  if (op0 == SUBREG_REG (x))
	    return x;
	  op0 = simplify_gen_subreg (GET_MODE (x), op0,
				     GET_MODE (SUBREG_REG (x)),
				     SUBREG_BYTE (x));
	  return op0 ? op0 : x;
	}
      break;

    case RTX_OBJ:
      if (code == MEM)
	{
	  op0 = simplify_replace_fn_rtx (XEXP (x, 0), old_rtx, fn, data);
	  if (op0 == XEXP (x, 0))
	    return x;
	  return replace_equiv_address_nv (x, op0);
	}
      else if (code == LO_SUM)
	{
	  op0 = simplify_replace_fn_rtx (XEXP (x, 0), old_rtx, fn, data);
	  op1 = simplify_replace_fn_rtx (XEXP (x, 1), old_rtx, fn, data);

	  /* (lo_sum (high x) y) -> y where x and y have the same base.  */
	  if (GET_CODE (op0) == HIGH)
	    {
	      rtx base0, base1, offset0, offset1;
	      split_const (XEXP (op0, 0), &base0, &offset0);
	      split_const (op1, &base1, &offset1);
	      if (rtx_equal_p (base0, base1))
		return op1;
	    }

	  if (op0 == XEXP (x, 0) && op1 == XEXP (x, 1))
	    return x;
	  return gen_rtx_LO_SUM (mode, op0, op1);
	}
      break;

    default:
      break;
    }

  newx = x;
  fmt = GET_RTX_FORMAT (code);
  for (i = 0; fmt[i]; i++)
    switch (fmt[i])
      {
      case 'E':
	vec = XVEC (x, i);
	newvec = XVEC (newx, i);
	for (j = 0; j < GET_NUM_ELEM (vec); j++)
	  {
	    op = simplify_replace_fn_rtx (RTVEC_ELT (vec, j),
					  old_rtx, fn, data);
	    if (op != RTVEC_ELT (vec, j))
	      {
		if (newvec == vec)
		  {
		    newvec = shallow_copy_rtvec (vec);
		    if (x == newx)
		      newx = shallow_copy_rtx (x);
		    XVEC (newx, i) = newvec;
		  }
		RTVEC_ELT (newvec, j) = op;
	      }
	  }
	break;

      case 'e':
	if (XEXP (x, i))
	  {
	    op = simplify_replace_fn_rtx (XEXP (x, i), old_rtx, fn, data);
	    if (op != XEXP (x, i))
	      {
		if (x == newx)
		  newx = shallow_copy_rtx (x);
		XEXP (newx, i) = op;
	      }
	  }
	break;
      }
  return newx;
}
/* Replace all occurrences of OLD_RTX in X with NEW_RTX and try to simplify the
   resulting RTX.  Return a new RTX which is as simplified as possible.  */

rtx
simplify_replace_rtx (rtx x, const_rtx old_rtx, rtx new_rtx)
{
  return simplify_replace_fn_rtx (x, old_rtx, 0, new_rtx);
}
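/* Usage sketch (illustrative, not part of the original source): with
   SImode REG rtxes "r1" and "r2" and exp = (plus:SI r1 (const_int 0)),

     rtx res = simplify_replace_rtx (exp, r1, r2);

   substitutes r2 for r1 and re-simplifies, so res is simply r2, because
   (plus:SI r2 (const_int 0)) folds to r2.  */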
/* Try to simplify a MODE truncation of OP, which has OP_MODE.
   Only handle cases where the truncated value is inherently an rvalue.

   RTL provides two ways of truncating a value:

   1. a lowpart subreg.  This form is only a truncation when both
      the outer and inner modes (here MODE and OP_MODE respectively)
      are scalar integers, and only then when the subreg is used as
      an rvalue.

      It is only valid to form such truncating subregs if the
      truncation requires no action by the target.  The onus for
      proving this is on the creator of the subreg -- e.g. the
      caller to simplify_subreg or simplify_gen_subreg -- and typically
      involves either TRULY_NOOP_TRUNCATION_MODES_P or truncated_to_mode.

   2. a TRUNCATE.  This form handles both scalar and compound integers.

   The first form is preferred where valid.  However, the TRUNCATE
   handling in simplify_unary_operation turns the second form into the
   first form when TRULY_NOOP_TRUNCATION_MODES_P or truncated_to_mode allow,
   so it is generally safe to form rvalue truncations using:

      simplify_gen_unary (TRUNCATE, ...)

   and leave simplify_unary_operation to work out which representation
   should be used.

   Because of the proof requirements on (1), simplify_truncation must
   also use simplify_gen_unary (TRUNCATE, ...) to truncate parts of OP,
   regardless of whether the outer truncation came from a SUBREG or a
   TRUNCATE.  For example, if the caller has proven that an SImode
   truncation of:

      (and:DI X Y)

   is a no-op and can be represented as a subreg, it does not follow
   that SImode truncations of X and Y are also no-ops.  On a target
   like 64-bit MIPS that requires SImode values to be stored in
   sign-extended form, an SImode truncation of:

      (and:DI (reg:DI X) (const_int 63))

   is trivially a no-op because only the lower 6 bits can be set.
   However, X is still an arbitrary 64-bit number and so we cannot
   assume that truncating it too is a no-op.  */
618 simplify_truncation (machine_mode mode
, rtx op
,
619 machine_mode op_mode
)
621 unsigned int precision
= GET_MODE_UNIT_PRECISION (mode
);
622 unsigned int op_precision
= GET_MODE_UNIT_PRECISION (op_mode
);
623 scalar_int_mode int_mode
, int_op_mode
, subreg_mode
;
625 gcc_assert (precision
<= op_precision
);
627 /* Optimize truncations of zero and sign extended values. */
628 if (GET_CODE (op
) == ZERO_EXTEND
629 || GET_CODE (op
) == SIGN_EXTEND
)
631 /* There are three possibilities. If MODE is the same as the
632 origmode, we can omit both the extension and the subreg.
633 If MODE is not larger than the origmode, we can apply the
634 truncation without the extension. Finally, if the outermode
635 is larger than the origmode, we can just extend to the appropriate
637 machine_mode origmode
= GET_MODE (XEXP (op
, 0));
638 if (mode
== origmode
)
640 else if (precision
<= GET_MODE_UNIT_PRECISION (origmode
))
641 return simplify_gen_unary (TRUNCATE
, mode
,
642 XEXP (op
, 0), origmode
);
644 return simplify_gen_unary (GET_CODE (op
), mode
,
645 XEXP (op
, 0), origmode
);
648 /* If the machine can perform operations in the truncated mode, distribute
649 the truncation, i.e. simplify (truncate:QI (op:SI (x:SI) (y:SI))) into
650 (op:QI (truncate:QI (x:SI)) (truncate:QI (y:SI))). */
652 && (!WORD_REGISTER_OPERATIONS
|| precision
>= BITS_PER_WORD
)
653 && (GET_CODE (op
) == PLUS
654 || GET_CODE (op
) == MINUS
655 || GET_CODE (op
) == MULT
))
657 rtx op0
= simplify_gen_unary (TRUNCATE
, mode
, XEXP (op
, 0), op_mode
);
660 rtx op1
= simplify_gen_unary (TRUNCATE
, mode
, XEXP (op
, 1), op_mode
);
662 return simplify_gen_binary (GET_CODE (op
), mode
, op0
, op1
);
666 /* Simplify (truncate:QI (lshiftrt:SI (sign_extend:SI (x:QI)) C)) into
667 to (ashiftrt:QI (x:QI) C), where C is a suitable small constant and
668 the outer subreg is effectively a truncation to the original mode. */
669 if ((GET_CODE (op
) == LSHIFTRT
670 || GET_CODE (op
) == ASHIFTRT
)
671 /* Ensure that OP_MODE is at least twice as wide as MODE
672 to avoid the possibility that an outer LSHIFTRT shifts by more
673 than the sign extension's sign_bit_copies and introduces zeros
674 into the high bits of the result. */
675 && 2 * precision
<= op_precision
676 && CONST_INT_P (XEXP (op
, 1))
677 && GET_CODE (XEXP (op
, 0)) == SIGN_EXTEND
678 && GET_MODE (XEXP (XEXP (op
, 0), 0)) == mode
679 && UINTVAL (XEXP (op
, 1)) < precision
)
680 return simplify_gen_binary (ASHIFTRT
, mode
,
681 XEXP (XEXP (op
, 0), 0), XEXP (op
, 1));
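/* Concrete instance of the transformation above (illustrative, not part
   of the original source): with r a QImode REG,
   (truncate:QI (lshiftrt:SI (sign_extend:SI r) (const_int 3)))
   becomes (ashiftrt:QI r (const_int 3)); the conditions hold because
   SImode is at least twice as wide as QImode and 3 < 8.  */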
683 /* Likewise (truncate:QI (lshiftrt:SI (zero_extend:SI (x:QI)) C)) into
684 to (lshiftrt:QI (x:QI) C), where C is a suitable small constant and
685 the outer subreg is effectively a truncation to the original mode. */
686 if ((GET_CODE (op
) == LSHIFTRT
687 || GET_CODE (op
) == ASHIFTRT
)
688 && CONST_INT_P (XEXP (op
, 1))
689 && GET_CODE (XEXP (op
, 0)) == ZERO_EXTEND
690 && GET_MODE (XEXP (XEXP (op
, 0), 0)) == mode
691 && UINTVAL (XEXP (op
, 1)) < precision
)
692 return simplify_gen_binary (LSHIFTRT
, mode
,
693 XEXP (XEXP (op
, 0), 0), XEXP (op
, 1));
695 /* Likewise (truncate:QI (ashift:SI (zero_extend:SI (x:QI)) C)) into
696 to (ashift:QI (x:QI) C), where C is a suitable small constant and
697 the outer subreg is effectively a truncation to the original mode. */
698 if (GET_CODE (op
) == ASHIFT
699 && CONST_INT_P (XEXP (op
, 1))
700 && (GET_CODE (XEXP (op
, 0)) == ZERO_EXTEND
701 || GET_CODE (XEXP (op
, 0)) == SIGN_EXTEND
)
702 && GET_MODE (XEXP (XEXP (op
, 0), 0)) == mode
703 && UINTVAL (XEXP (op
, 1)) < precision
)
704 return simplify_gen_binary (ASHIFT
, mode
,
705 XEXP (XEXP (op
, 0), 0), XEXP (op
, 1));
707 /* Likewise (truncate:QI (and:SI (lshiftrt:SI (x:SI) C) C2)) into
708 (and:QI (lshiftrt:QI (truncate:QI (x:SI)) C) C2) for suitable C
710 if (GET_CODE (op
) == AND
711 && (GET_CODE (XEXP (op
, 0)) == LSHIFTRT
712 || GET_CODE (XEXP (op
, 0)) == ASHIFTRT
)
713 && CONST_INT_P (XEXP (XEXP (op
, 0), 1))
714 && CONST_INT_P (XEXP (op
, 1)))
716 rtx op0
= (XEXP (XEXP (op
, 0), 0));
717 rtx shift_op
= XEXP (XEXP (op
, 0), 1);
718 rtx mask_op
= XEXP (op
, 1);
719 unsigned HOST_WIDE_INT shift
= UINTVAL (shift_op
);
720 unsigned HOST_WIDE_INT mask
= UINTVAL (mask_op
);
722 if (shift
< precision
723 /* If doing this transform works for an X with all bits set,
724 it works for any X. */
725 && ((GET_MODE_MASK (mode
) >> shift
) & mask
)
726 == ((GET_MODE_MASK (op_mode
) >> shift
) & mask
)
727 && (op0
= simplify_gen_unary (TRUNCATE
, mode
, op0
, op_mode
))
728 && (op0
= simplify_gen_binary (LSHIFTRT
, mode
, op0
, shift_op
)))
730 mask_op
= GEN_INT (trunc_int_for_mode (mask
, mode
));
731 return simplify_gen_binary (AND
, mode
, op0
, mask_op
);
735 /* Turn (truncate:M1 (*_extract:M2 (reg:M2) (len) (pos))) into
736 (*_extract:M1 (truncate:M1 (reg:M2)) (len) (pos')) if possible without
738 if ((GET_CODE (op
) == ZERO_EXTRACT
|| GET_CODE (op
) == SIGN_EXTRACT
)
739 && REG_P (XEXP (op
, 0))
740 && GET_MODE (XEXP (op
, 0)) == GET_MODE (op
)
741 && CONST_INT_P (XEXP (op
, 1))
742 && CONST_INT_P (XEXP (op
, 2)))
744 rtx op0
= XEXP (op
, 0);
745 unsigned HOST_WIDE_INT len
= UINTVAL (XEXP (op
, 1));
746 unsigned HOST_WIDE_INT pos
= UINTVAL (XEXP (op
, 2));
747 if (BITS_BIG_ENDIAN
&& pos
>= op_precision
- precision
)
749 op0
= simplify_gen_unary (TRUNCATE
, mode
, op0
, GET_MODE (op0
));
752 pos
-= op_precision
- precision
;
753 return simplify_gen_ternary (GET_CODE (op
), mode
, mode
, op0
,
754 XEXP (op
, 1), GEN_INT (pos
));
757 else if (!BITS_BIG_ENDIAN
&& precision
>= len
+ pos
)
759 op0
= simplify_gen_unary (TRUNCATE
, mode
, op0
, GET_MODE (op0
));
761 return simplify_gen_ternary (GET_CODE (op
), mode
, mode
, op0
,
762 XEXP (op
, 1), XEXP (op
, 2));
766 /* Recognize a word extraction from a multi-word subreg. */
767 if ((GET_CODE (op
) == LSHIFTRT
768 || GET_CODE (op
) == ASHIFTRT
)
769 && SCALAR_INT_MODE_P (mode
)
770 && SCALAR_INT_MODE_P (op_mode
)
771 && precision
>= BITS_PER_WORD
772 && 2 * precision
<= op_precision
773 && CONST_INT_P (XEXP (op
, 1))
774 && (INTVAL (XEXP (op
, 1)) & (precision
- 1)) == 0
775 && UINTVAL (XEXP (op
, 1)) < op_precision
)
777 poly_int64 byte
= subreg_lowpart_offset (mode
, op_mode
);
778 int shifted_bytes
= INTVAL (XEXP (op
, 1)) / BITS_PER_UNIT
;
779 return simplify_gen_subreg (mode
, XEXP (op
, 0), op_mode
,
781 ? byte
- shifted_bytes
782 : byte
+ shifted_bytes
));
785 /* If we have a TRUNCATE of a right shift of MEM, make a new MEM
786 and try replacing the TRUNCATE and shift with it. Don't do this
787 if the MEM has a mode-dependent address. */
788 if ((GET_CODE (op
) == LSHIFTRT
789 || GET_CODE (op
) == ASHIFTRT
)
790 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
791 && is_a
<scalar_int_mode
> (op_mode
, &int_op_mode
)
792 && MEM_P (XEXP (op
, 0))
793 && CONST_INT_P (XEXP (op
, 1))
794 && INTVAL (XEXP (op
, 1)) % GET_MODE_BITSIZE (int_mode
) == 0
795 && INTVAL (XEXP (op
, 1)) > 0
796 && INTVAL (XEXP (op
, 1)) < GET_MODE_BITSIZE (int_op_mode
)
797 && ! mode_dependent_address_p (XEXP (XEXP (op
, 0), 0),
798 MEM_ADDR_SPACE (XEXP (op
, 0)))
799 && ! MEM_VOLATILE_P (XEXP (op
, 0))
800 && (GET_MODE_SIZE (int_mode
) >= UNITS_PER_WORD
801 || WORDS_BIG_ENDIAN
== BYTES_BIG_ENDIAN
))
803 poly_int64 byte
= subreg_lowpart_offset (int_mode
, int_op_mode
);
804 int shifted_bytes
= INTVAL (XEXP (op
, 1)) / BITS_PER_UNIT
;
805 return adjust_address_nv (XEXP (op
, 0), int_mode
,
807 ? byte
- shifted_bytes
808 : byte
+ shifted_bytes
));
811 /* (truncate:SI (OP:DI ({sign,zero}_extend:DI foo:SI))) is
812 (OP:SI foo:SI) if OP is NEG or ABS. */
813 if ((GET_CODE (op
) == ABS
814 || GET_CODE (op
) == NEG
)
815 && (GET_CODE (XEXP (op
, 0)) == SIGN_EXTEND
816 || GET_CODE (XEXP (op
, 0)) == ZERO_EXTEND
)
817 && GET_MODE (XEXP (XEXP (op
, 0), 0)) == mode
)
818 return simplify_gen_unary (GET_CODE (op
), mode
,
819 XEXP (XEXP (op
, 0), 0), mode
);
821 /* (truncate:A (subreg:B (truncate:C X) 0)) is
823 if (GET_CODE (op
) == SUBREG
824 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
825 && SCALAR_INT_MODE_P (op_mode
)
826 && is_a
<scalar_int_mode
> (GET_MODE (SUBREG_REG (op
)), &subreg_mode
)
827 && GET_CODE (SUBREG_REG (op
)) == TRUNCATE
828 && subreg_lowpart_p (op
))
830 rtx inner
= XEXP (SUBREG_REG (op
), 0);
831 if (GET_MODE_PRECISION (int_mode
) <= GET_MODE_PRECISION (subreg_mode
))
832 return simplify_gen_unary (TRUNCATE
, int_mode
, inner
,
835 /* If subreg above is paradoxical and C is narrower
836 than A, return (subreg:A (truncate:C X) 0). */
837 return simplify_gen_subreg (int_mode
, SUBREG_REG (op
), subreg_mode
, 0);
840 /* (truncate:A (truncate:B X)) is (truncate:A X). */
841 if (GET_CODE (op
) == TRUNCATE
)
842 return simplify_gen_unary (TRUNCATE
, mode
, XEXP (op
, 0),
843 GET_MODE (XEXP (op
, 0)));
845 /* (truncate:A (ior X C)) is (const_int -1) if C is equal to that already,
847 if (GET_CODE (op
) == IOR
848 && SCALAR_INT_MODE_P (mode
)
849 && SCALAR_INT_MODE_P (op_mode
)
850 && CONST_INT_P (XEXP (op
, 1))
851 && trunc_int_for_mode (INTVAL (XEXP (op
, 1)), mode
) == -1)
857 /* Try to simplify a unary operation CODE whose output mode is to be
858 MODE with input operand OP whose mode was originally OP_MODE.
859 Return zero if no simplification can be made. */
861 simplify_unary_operation (enum rtx_code code
, machine_mode mode
,
862 rtx op
, machine_mode op_mode
)
866 trueop
= avoid_constant_pool_reference (op
);
868 tem
= simplify_const_unary_operation (code
, mode
, trueop
, op_mode
);
872 return simplify_unary_operation_1 (code
, mode
, op
);
875 /* Return true if FLOAT or UNSIGNED_FLOAT operation OP is known
879 exact_int_to_float_conversion_p (const_rtx op
)
881 int out_bits
= significand_size (GET_MODE_INNER (GET_MODE (op
)));
882 machine_mode op0_mode
= GET_MODE (XEXP (op
, 0));
883 /* Constants shouldn't reach here. */
884 gcc_assert (op0_mode
!= VOIDmode
);
885 int in_prec
= GET_MODE_UNIT_PRECISION (op0_mode
);
886 int in_bits
= in_prec
;
887 if (HWI_COMPUTABLE_MODE_P (op0_mode
))
889 unsigned HOST_WIDE_INT nonzero
= nonzero_bits (XEXP (op
, 0), op0_mode
);
890 if (GET_CODE (op
) == FLOAT
)
891 in_bits
-= num_sign_bit_copies (XEXP (op
, 0), op0_mode
);
892 else if (GET_CODE (op
) == UNSIGNED_FLOAT
)
893 in_bits
= wi::min_precision (wi::uhwi (nonzero
, in_prec
), UNSIGNED
);
896 in_bits
-= wi::ctz (wi::uhwi (nonzero
, in_prec
));
898 return in_bits
<= out_bits
;
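/* Illustrative note (not part of the original source): SFmode has a
   24-bit significand, so a (float:SF (reg:QI ...)) or
   (float:SF (reg:HI ...)) conversion is always exact here, since at
   most 8 or 16 input bits are significant; a (float:SF (reg:DI ...))
   is only considered exact if nonzero_bits/num_sign_bit_copies prove
   that few enough bits can actually be set.  */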
901 /* Perform some simplifications we can do even if the operands
904 simplify_unary_operation_1 (enum rtx_code code
, machine_mode mode
, rtx op
)
906 enum rtx_code reversed
;
907 rtx temp
, elt
, base
, step
;
908 scalar_int_mode inner
, int_mode
, op_mode
, op0_mode
;
913 /* (not (not X)) == X. */
914 if (GET_CODE (op
) == NOT
)
917 /* (not (eq X Y)) == (ne X Y), etc. if BImode or the result of the
918 comparison is all ones. */
919 if (COMPARISON_P (op
)
920 && (mode
== BImode
|| STORE_FLAG_VALUE
== -1)
921 && ((reversed
= reversed_comparison_code (op
, NULL
)) != UNKNOWN
))
922 return simplify_gen_relational (reversed
, mode
, VOIDmode
,
923 XEXP (op
, 0), XEXP (op
, 1));
925 /* (not (plus X -1)) can become (neg X). */
926 if (GET_CODE (op
) == PLUS
927 && XEXP (op
, 1) == constm1_rtx
)
928 return simplify_gen_unary (NEG
, mode
, XEXP (op
, 0), mode
);
930 /* Similarly, (not (neg X)) is (plus X -1). Only do this for
931 modes that have CONSTM1_RTX, i.e. MODE_INT, MODE_PARTIAL_INT
932 and MODE_VECTOR_INT. */
933 if (GET_CODE (op
) == NEG
&& CONSTM1_RTX (mode
))
934 return simplify_gen_binary (PLUS
, mode
, XEXP (op
, 0),
937 /* (not (xor X C)) for C constant is (xor X D) with D = ~C. */
938 if (GET_CODE (op
) == XOR
939 && CONST_INT_P (XEXP (op
, 1))
940 && (temp
= simplify_unary_operation (NOT
, mode
,
941 XEXP (op
, 1), mode
)) != 0)
942 return simplify_gen_binary (XOR
, mode
, XEXP (op
, 0), temp
);
944 /* (not (plus X C)) for signbit C is (xor X D) with D = ~C. */
945 if (GET_CODE (op
) == PLUS
946 && CONST_INT_P (XEXP (op
, 1))
947 && mode_signbit_p (mode
, XEXP (op
, 1))
948 && (temp
= simplify_unary_operation (NOT
, mode
,
949 XEXP (op
, 1), mode
)) != 0)
950 return simplify_gen_binary (XOR
, mode
, XEXP (op
, 0), temp
);
953 /* (not (ashift 1 X)) is (rotate ~1 X). We used to do this for
954 operands other than 1, but that is not valid. We could do a
955 similar simplification for (not (lshiftrt C X)) where C is
956 just the sign bit, but this doesn't seem common enough to
958 if (GET_CODE (op
) == ASHIFT
959 && XEXP (op
, 0) == const1_rtx
)
961 temp
= simplify_gen_unary (NOT
, mode
, const1_rtx
, mode
);
962 return simplify_gen_binary (ROTATE
, mode
, temp
, XEXP (op
, 1));
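/* Concrete instance (illustrative, not part of the original source):
   (not:SI (ashift:SI (const_int 1) r)) becomes
   (rotate:SI (const_int -2) r), since ~1 folds to -2.  */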
965 /* (not (ashiftrt foo C)) where C is the number of bits in FOO
966 minus 1 is (ge foo (const_int 0)) if STORE_FLAG_VALUE is -1,
967 so we can perform the above simplification. */
968 if (STORE_FLAG_VALUE
== -1
969 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
970 && GET_CODE (op
) == ASHIFTRT
971 && CONST_INT_P (XEXP (op
, 1))
972 && INTVAL (XEXP (op
, 1)) == GET_MODE_PRECISION (int_mode
) - 1)
973 return simplify_gen_relational (GE
, int_mode
, VOIDmode
,
974 XEXP (op
, 0), const0_rtx
);
977 if (partial_subreg_p (op
)
978 && subreg_lowpart_p (op
)
979 && GET_CODE (SUBREG_REG (op
)) == ASHIFT
980 && XEXP (SUBREG_REG (op
), 0) == const1_rtx
)
982 machine_mode inner_mode
= GET_MODE (SUBREG_REG (op
));
985 x
= gen_rtx_ROTATE (inner_mode
,
986 simplify_gen_unary (NOT
, inner_mode
, const1_rtx
,
988 XEXP (SUBREG_REG (op
), 1));
989 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, x
);
994 /* Apply De Morgan's laws to reduce number of patterns for machines
995 with negating logical insns (and-not, nand, etc.). If result has
996 only one NOT, put it first, since that is how the patterns are
998 if (GET_CODE (op
) == IOR
|| GET_CODE (op
) == AND
)
1000 rtx in1
= XEXP (op
, 0), in2
= XEXP (op
, 1);
1001 machine_mode op_mode
;
1003 op_mode
= GET_MODE (in1
);
1004 in1
= simplify_gen_unary (NOT
, op_mode
, in1
, op_mode
);
1006 op_mode
= GET_MODE (in2
);
1007 if (op_mode
== VOIDmode
)
1009 in2
= simplify_gen_unary (NOT
, op_mode
, in2
, op_mode
);
1011 if (GET_CODE (in2
) == NOT
&& GET_CODE (in1
) != NOT
)
1012 std::swap (in1
, in2
);
1014 return gen_rtx_fmt_ee (GET_CODE (op
) == IOR
? AND
: IOR
,
1018 /* (not (bswap x)) -> (bswap (not x)). */
1019 if (GET_CODE (op
) == BSWAP
)
1021 rtx x
= simplify_gen_unary (NOT
, mode
, XEXP (op
, 0), mode
);
1022 return simplify_gen_unary (BSWAP
, mode
, x
, mode
);
1027 /* (neg (neg X)) == X. */
1028 if (GET_CODE (op
) == NEG
)
1029 return XEXP (op
, 0);
1031 /* (neg (x ? (neg y) : y)) == !x ? (neg y) : y.
1032 If comparison is not reversible use
1034 if (GET_CODE (op
) == IF_THEN_ELSE
)
1036 rtx cond
= XEXP (op
, 0);
1037 rtx true_rtx
= XEXP (op
, 1);
1038 rtx false_rtx
= XEXP (op
, 2);
1040 if ((GET_CODE (true_rtx
) == NEG
1041 && rtx_equal_p (XEXP (true_rtx
, 0), false_rtx
))
1042 || (GET_CODE (false_rtx
) == NEG
1043 && rtx_equal_p (XEXP (false_rtx
, 0), true_rtx
)))
1045 if (reversed_comparison_code (cond
, NULL
) != UNKNOWN
)
1046 temp
= reversed_comparison (cond
, mode
);
1050 std::swap (true_rtx
, false_rtx
);
1052 return simplify_gen_ternary (IF_THEN_ELSE
, mode
,
1053 mode
, temp
, true_rtx
, false_rtx
);
1057 /* (neg (plus X 1)) can become (not X). */
1058 if (GET_CODE (op
) == PLUS
1059 && XEXP (op
, 1) == const1_rtx
)
1060 return simplify_gen_unary (NOT
, mode
, XEXP (op
, 0), mode
);
1062 /* Similarly, (neg (not X)) is (plus X 1). */
1063 if (GET_CODE (op
) == NOT
)
1064 return simplify_gen_binary (PLUS
, mode
, XEXP (op
, 0),
1067 /* (neg (minus X Y)) can become (minus Y X). This transformation
1068 isn't safe for modes with signed zeros, since if X and Y are
1069 both +0, (minus Y X) is the same as (minus X Y). If the
1070 rounding mode is towards +infinity (or -infinity) then the two
1071 expressions will be rounded differently. */
1072 if (GET_CODE (op
) == MINUS
1073 && !HONOR_SIGNED_ZEROS (mode
)
1074 && !HONOR_SIGN_DEPENDENT_ROUNDING (mode
))
1075 return simplify_gen_binary (MINUS
, mode
, XEXP (op
, 1), XEXP (op
, 0));
1077 if (GET_CODE (op
) == PLUS
1078 && !HONOR_SIGNED_ZEROS (mode
)
1079 && !HONOR_SIGN_DEPENDENT_ROUNDING (mode
))
1081 /* (neg (plus A C)) is simplified to (minus -C A). */
1082 if (CONST_SCALAR_INT_P (XEXP (op
, 1))
1083 || CONST_DOUBLE_AS_FLOAT_P (XEXP (op
, 1)))
1085 temp
= simplify_unary_operation (NEG
, mode
, XEXP (op
, 1), mode
);
1087 return simplify_gen_binary (MINUS
, mode
, temp
, XEXP (op
, 0));
1090 /* (neg (plus A B)) is canonicalized to (minus (neg A) B). */
1091 temp
= simplify_gen_unary (NEG
, mode
, XEXP (op
, 0), mode
);
1092 return simplify_gen_binary (MINUS
, mode
, temp
, XEXP (op
, 1));
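/* Concrete instance (illustrative, not part of the original source):
   (neg:SI (plus:SI (reg:SI r) (const_int 5))) is rewritten by the
   constant branch above into (minus:SI (const_int -5) (reg:SI r)).  */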
1095 /* (neg (mult A B)) becomes (mult A (neg B)).
1096 This works even for floating-point values. */
1097 if (GET_CODE (op
) == MULT
1098 && !HONOR_SIGN_DEPENDENT_ROUNDING (mode
))
1100 temp
= simplify_gen_unary (NEG
, mode
, XEXP (op
, 1), mode
);
1101 return simplify_gen_binary (MULT
, mode
, XEXP (op
, 0), temp
);
1104 /* NEG commutes with ASHIFT since it is multiplication. Only do
1105 this if we can then eliminate the NEG (e.g., if the operand
1107 if (GET_CODE (op
) == ASHIFT
)
1109 temp
= simplify_unary_operation (NEG
, mode
, XEXP (op
, 0), mode
);
1111 return simplify_gen_binary (ASHIFT
, mode
, temp
, XEXP (op
, 1));
1114 /* (neg (ashiftrt X C)) can be replaced by (lshiftrt X C) when
1115 C is equal to the width of MODE minus 1. */
1116 if (GET_CODE (op
) == ASHIFTRT
1117 && CONST_INT_P (XEXP (op
, 1))
1118 && INTVAL (XEXP (op
, 1)) == GET_MODE_UNIT_PRECISION (mode
) - 1)
1119 return simplify_gen_binary (LSHIFTRT
, mode
,
1120 XEXP (op
, 0), XEXP (op
, 1));
1122 /* (neg (lshiftrt X C)) can be replaced by (ashiftrt X C) when
1123 C is equal to the width of MODE minus 1. */
1124 if (GET_CODE (op
) == LSHIFTRT
1125 && CONST_INT_P (XEXP (op
, 1))
1126 && INTVAL (XEXP (op
, 1)) == GET_MODE_UNIT_PRECISION (mode
) - 1)
1127 return simplify_gen_binary (ASHIFTRT
, mode
,
1128 XEXP (op
, 0), XEXP (op
, 1));
1130 /* (neg (xor A 1)) is (plus A -1) if A is known to be either 0 or 1. */
1131 if (GET_CODE (op
) == XOR
1132 && XEXP (op
, 1) == const1_rtx
1133 && nonzero_bits (XEXP (op
, 0), mode
) == 1)
1134 return plus_constant (mode
, XEXP (op
, 0), -1);
1136 /* (neg (lt x 0)) is (ashiftrt X C) if STORE_FLAG_VALUE is 1. */
1137 /* (neg (lt x 0)) is (lshiftrt X C) if STORE_FLAG_VALUE is -1. */
1138 if (GET_CODE (op
) == LT
1139 && XEXP (op
, 1) == const0_rtx
1140 && is_a
<scalar_int_mode
> (GET_MODE (XEXP (op
, 0)), &inner
))
1142 int_mode
= as_a
<scalar_int_mode
> (mode
);
1143 int isize
= GET_MODE_PRECISION (inner
);
1144 if (STORE_FLAG_VALUE
== 1)
1146 temp
= simplify_gen_binary (ASHIFTRT
, inner
, XEXP (op
, 0),
1147 gen_int_shift_amount (inner
,
1149 if (int_mode
== inner
)
1151 if (GET_MODE_PRECISION (int_mode
) > isize
)
1152 return simplify_gen_unary (SIGN_EXTEND
, int_mode
, temp
, inner
);
1153 return simplify_gen_unary (TRUNCATE
, int_mode
, temp
, inner
);
1155 else if (STORE_FLAG_VALUE
== -1)
1157 temp
= simplify_gen_binary (LSHIFTRT
, inner
, XEXP (op
, 0),
1158 gen_int_shift_amount (inner
,
1160 if (int_mode
== inner
)
1162 if (GET_MODE_PRECISION (int_mode
) > isize
)
1163 return simplify_gen_unary (ZERO_EXTEND
, int_mode
, temp
, inner
);
1164 return simplify_gen_unary (TRUNCATE
, int_mode
, temp
, inner
);
1168 if (vec_series_p (op
, &base
, &step
))
1170 /* Only create a new series if we can simplify both parts. In other
1171 cases this isn't really a simplification, and it's not necessarily
1172 a win to replace a vector operation with a scalar operation. */
1173 scalar_mode inner_mode
= GET_MODE_INNER (mode
);
1174 base
= simplify_unary_operation (NEG
, inner_mode
, base
, inner_mode
);
1177 step
= simplify_unary_operation (NEG
, inner_mode
,
1180 return gen_vec_series (mode
, base
, step
);
1186 /* Don't optimize (lshiftrt (mult ...)) as it would interfere
1187 with the umulXi3_highpart patterns. */
1188 if (GET_CODE (op
) == LSHIFTRT
1189 && GET_CODE (XEXP (op
, 0)) == MULT
)
1192 if (GET_MODE_CLASS (mode
) == MODE_PARTIAL_INT
)
1194 if (TRULY_NOOP_TRUNCATION_MODES_P (mode
, GET_MODE (op
)))
1196 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, op
);
1200 /* We can't handle truncation to a partial integer mode here
1201 because we don't know the real bitsize of the partial
1206 if (GET_MODE (op
) != VOIDmode
)
1208 temp
= simplify_truncation (mode
, op
, GET_MODE (op
));
1213 /* If we know that the value is already truncated, we can
1214 replace the TRUNCATE with a SUBREG. */
1215 if (known_eq (GET_MODE_NUNITS (mode
), 1)
1216 && (TRULY_NOOP_TRUNCATION_MODES_P (mode
, GET_MODE (op
))
1217 || truncated_to_mode (mode
, op
)))
1219 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, op
);
1224 /* A truncate of a comparison can be replaced with a subreg if
1225 STORE_FLAG_VALUE permits. This is like the previous test,
1226 but it works even if the comparison is done in a mode larger
1227 than HOST_BITS_PER_WIDE_INT. */
1228 if (HWI_COMPUTABLE_MODE_P (mode
)
1229 && COMPARISON_P (op
)
1230 && (STORE_FLAG_VALUE
& ~GET_MODE_MASK (mode
)) == 0)
1232 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, op
);
1237 /* A truncate of a memory is just loading the low part of the memory
1238 if we are not changing the meaning of the address. */
1239 if (GET_CODE (op
) == MEM
1240 && !VECTOR_MODE_P (mode
)
1241 && !MEM_VOLATILE_P (op
)
1242 && !mode_dependent_address_p (XEXP (op
, 0), MEM_ADDR_SPACE (op
)))
1244 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, op
);
1251 case FLOAT_TRUNCATE
:
1252 if (DECIMAL_FLOAT_MODE_P (mode
))
1255 /* (float_truncate:SF (float_extend:DF foo:SF)) = foo:SF. */
1256 if (GET_CODE (op
) == FLOAT_EXTEND
1257 && GET_MODE (XEXP (op
, 0)) == mode
)
1258 return XEXP (op
, 0);
1260 /* (float_truncate:SF (float_truncate:DF foo:XF))
1261 = (float_truncate:SF foo:XF).
1262 This may eliminate double rounding, so it is unsafe.
1264 (float_truncate:SF (float_extend:XF foo:DF))
1265 = (float_truncate:SF foo:DF).
1267 (float_truncate:DF (float_extend:XF foo:SF))
1268 = (float_extend:DF foo:SF). */
1269 if ((GET_CODE (op
) == FLOAT_TRUNCATE
1270 && flag_unsafe_math_optimizations
)
1271 || GET_CODE (op
) == FLOAT_EXTEND
)
1272 return simplify_gen_unary (GET_MODE_UNIT_SIZE (GET_MODE (XEXP (op
, 0)))
1273 > GET_MODE_UNIT_SIZE (mode
)
1274 ? FLOAT_TRUNCATE
: FLOAT_EXTEND
,
1276 XEXP (op
, 0), mode
);
1278 /* (float_truncate (float x)) is (float x) */
1279 if ((GET_CODE (op
) == FLOAT
|| GET_CODE (op
) == UNSIGNED_FLOAT
)
1280 && (flag_unsafe_math_optimizations
1281 || exact_int_to_float_conversion_p (op
)))
1282 return simplify_gen_unary (GET_CODE (op
), mode
,
1284 GET_MODE (XEXP (op
, 0)));
1286 /* (float_truncate:SF (OP:DF (float_extend:DF foo:sf))) is
1287 (OP:SF foo:SF) if OP is NEG or ABS. */
1288 if ((GET_CODE (op
) == ABS
1289 || GET_CODE (op
) == NEG
)
1290 && GET_CODE (XEXP (op
, 0)) == FLOAT_EXTEND
1291 && GET_MODE (XEXP (XEXP (op
, 0), 0)) == mode
)
1292 return simplify_gen_unary (GET_CODE (op
), mode
,
1293 XEXP (XEXP (op
, 0), 0), mode
);
1295 /* (float_truncate:SF (subreg:DF (float_truncate:SF X) 0))
1296 is (float_truncate:SF x). */
1297 if (GET_CODE (op
) == SUBREG
1298 && subreg_lowpart_p (op
)
1299 && GET_CODE (SUBREG_REG (op
)) == FLOAT_TRUNCATE
)
1300 return SUBREG_REG (op
);
1304 if (DECIMAL_FLOAT_MODE_P (mode
))
1307 /* (float_extend (float_extend x)) is (float_extend x)
1309 (float_extend (float x)) is (float x) assuming that double
1310 rounding can't happen.
1312 if (GET_CODE (op
) == FLOAT_EXTEND
1313 || ((GET_CODE (op
) == FLOAT
|| GET_CODE (op
) == UNSIGNED_FLOAT
)
1314 && exact_int_to_float_conversion_p (op
)))
1315 return simplify_gen_unary (GET_CODE (op
), mode
,
1317 GET_MODE (XEXP (op
, 0)));
1322 /* (abs (neg <foo>)) -> (abs <foo>) */
1323 if (GET_CODE (op
) == NEG
)
1324 return simplify_gen_unary (ABS
, mode
, XEXP (op
, 0),
1325 GET_MODE (XEXP (op
, 0)));
1327 /* If the mode of the operand is VOIDmode (i.e. if it is ASM_OPERANDS),
1329 if (GET_MODE (op
) == VOIDmode
)
1332 /* If operand is something known to be positive, ignore the ABS. */
1333 if (GET_CODE (op
) == FFS
|| GET_CODE (op
) == ABS
1334 || val_signbit_known_clear_p (GET_MODE (op
),
1335 nonzero_bits (op
, GET_MODE (op
))))
1338 /* If operand is known to be only -1 or 0, convert ABS to NEG. */
1339 if (is_a
<scalar_int_mode
> (mode
, &int_mode
)
1340 && (num_sign_bit_copies (op
, int_mode
)
1341 == GET_MODE_PRECISION (int_mode
)))
1342 return gen_rtx_NEG (int_mode
, op
);
1347 /* (ffs (*_extend <X>)) = (ffs <X>) */
1348 if (GET_CODE (op
) == SIGN_EXTEND
1349 || GET_CODE (op
) == ZERO_EXTEND
)
1350 return simplify_gen_unary (FFS
, mode
, XEXP (op
, 0),
1351 GET_MODE (XEXP (op
, 0)));
1355 switch (GET_CODE (op
))
1359 /* (popcount (zero_extend <X>)) = (popcount <X>) */
1360 return simplify_gen_unary (POPCOUNT
, mode
, XEXP (op
, 0),
1361 GET_MODE (XEXP (op
, 0)));
1365 /* Rotations don't affect popcount. */
1366 if (!side_effects_p (XEXP (op
, 1)))
1367 return simplify_gen_unary (POPCOUNT
, mode
, XEXP (op
, 0),
1368 GET_MODE (XEXP (op
, 0)));
1377 switch (GET_CODE (op
))
1383 return simplify_gen_unary (PARITY
, mode
, XEXP (op
, 0),
1384 GET_MODE (XEXP (op
, 0)));
1388 /* Rotations don't affect parity. */
1389 if (!side_effects_p (XEXP (op
, 1)))
1390 return simplify_gen_unary (PARITY
, mode
, XEXP (op
, 0),
1391 GET_MODE (XEXP (op
, 0)));
1400 /* (bswap (bswap x)) -> x. */
1401 if (GET_CODE (op
) == BSWAP
)
1402 return XEXP (op
, 0);
1406 /* (float (sign_extend <X>)) = (float <X>). */
1407 if (GET_CODE (op
) == SIGN_EXTEND
)
1408 return simplify_gen_unary (FLOAT
, mode
, XEXP (op
, 0),
1409 GET_MODE (XEXP (op
, 0)));
1413 /* (sign_extend (truncate (minus (label_ref L1) (label_ref L2))))
1414 becomes just the MINUS if its mode is MODE. This allows
1415 folding switch statements on machines using casesi (such as
1417 if (GET_CODE (op
) == TRUNCATE
1418 && GET_MODE (XEXP (op
, 0)) == mode
1419 && GET_CODE (XEXP (op
, 0)) == MINUS
1420 && GET_CODE (XEXP (XEXP (op
, 0), 0)) == LABEL_REF
1421 && GET_CODE (XEXP (XEXP (op
, 0), 1)) == LABEL_REF
)
1422 return XEXP (op
, 0);
1424 /* Extending a widening multiplication should be canonicalized to
1425 a wider widening multiplication. */
1426 if (GET_CODE (op
) == MULT
)
1428 rtx lhs
= XEXP (op
, 0);
1429 rtx rhs
= XEXP (op
, 1);
1430 enum rtx_code lcode
= GET_CODE (lhs
);
1431 enum rtx_code rcode
= GET_CODE (rhs
);
1433 /* Widening multiplies usually extend both operands, but sometimes
1434 they use a shift to extract a portion of a register. */
1435 if ((lcode
== SIGN_EXTEND
1436 || (lcode
== ASHIFTRT
&& CONST_INT_P (XEXP (lhs
, 1))))
1437 && (rcode
== SIGN_EXTEND
1438 || (rcode
== ASHIFTRT
&& CONST_INT_P (XEXP (rhs
, 1)))))
1440 machine_mode lmode
= GET_MODE (lhs
);
1441 machine_mode rmode
= GET_MODE (rhs
);
1444 if (lcode
== ASHIFTRT
)
1445 /* Number of bits not shifted off the end. */
1446 bits
= (GET_MODE_UNIT_PRECISION (lmode
)
1447 - INTVAL (XEXP (lhs
, 1)));
1448 else /* lcode == SIGN_EXTEND */
1449 /* Size of inner mode. */
1450 bits
= GET_MODE_UNIT_PRECISION (GET_MODE (XEXP (lhs
, 0)));
1452 if (rcode
== ASHIFTRT
)
1453 bits
+= (GET_MODE_UNIT_PRECISION (rmode
)
1454 - INTVAL (XEXP (rhs
, 1)));
1455 else /* rcode == SIGN_EXTEND */
1456 bits
+= GET_MODE_UNIT_PRECISION (GET_MODE (XEXP (rhs
, 0)));
1458 /* We can only widen multiplies if the result is mathematiclly
1459 equivalent. I.e. if overflow was impossible. */
1460 if (bits
<= GET_MODE_UNIT_PRECISION (GET_MODE (op
)))
1461 return simplify_gen_binary
1463 simplify_gen_unary (SIGN_EXTEND
, mode
, lhs
, lmode
),
1464 simplify_gen_unary (SIGN_EXTEND
, mode
, rhs
, rmode
));
1468 /* Check for a sign extension of a subreg of a promoted
1469 variable, where the promotion is sign-extended, and the
1470 target mode is the same as the variable's promotion. */
1471 if (GET_CODE (op
) == SUBREG
1472 && SUBREG_PROMOTED_VAR_P (op
)
1473 && SUBREG_PROMOTED_SIGNED_P (op
)
1474 && !paradoxical_subreg_p (mode
, GET_MODE (SUBREG_REG (op
))))
1476 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, SUBREG_REG (op
));
1481 /* (sign_extend:M (sign_extend:N <X>)) is (sign_extend:M <X>).
1482 (sign_extend:M (zero_extend:N <X>)) is (zero_extend:M <X>). */
1483 if (GET_CODE (op
) == SIGN_EXTEND
|| GET_CODE (op
) == ZERO_EXTEND
)
1485 gcc_assert (GET_MODE_UNIT_PRECISION (mode
)
1486 > GET_MODE_UNIT_PRECISION (GET_MODE (op
)));
1487 return simplify_gen_unary (GET_CODE (op
), mode
, XEXP (op
, 0),
1488 GET_MODE (XEXP (op
, 0)));
1491 /* (sign_extend:M (ashiftrt:N (ashift <X> (const_int I)) (const_int I)))
1492 is (sign_extend:M (subreg:O <X>)) if there is mode with
1493 GET_MODE_BITSIZE (N) - I bits.
1494 (sign_extend:M (lshiftrt:N (ashift <X> (const_int I)) (const_int I)))
1495 is similarly (zero_extend:M (subreg:O <X>)). */
1496 if ((GET_CODE (op
) == ASHIFTRT
|| GET_CODE (op
) == LSHIFTRT
)
1497 && GET_CODE (XEXP (op
, 0)) == ASHIFT
1498 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
1499 && CONST_INT_P (XEXP (op
, 1))
1500 && XEXP (XEXP (op
, 0), 1) == XEXP (op
, 1)
1501 && (op_mode
= as_a
<scalar_int_mode
> (GET_MODE (op
)),
1502 GET_MODE_PRECISION (op_mode
) > INTVAL (XEXP (op
, 1))))
1504 scalar_int_mode tmode
;
1505 gcc_assert (GET_MODE_PRECISION (int_mode
)
1506 > GET_MODE_PRECISION (op_mode
));
1507 if (int_mode_for_size (GET_MODE_PRECISION (op_mode
)
1508 - INTVAL (XEXP (op
, 1)), 1).exists (&tmode
))
1511 rtl_hooks
.gen_lowpart_no_emit (tmode
, XEXP (XEXP (op
, 0), 0));
1513 return simplify_gen_unary (GET_CODE (op
) == ASHIFTRT
1514 ? SIGN_EXTEND
: ZERO_EXTEND
,
1515 int_mode
, inner
, tmode
);
1519 /* (sign_extend:M (lshiftrt:N <X> (const_int I))) is better as
1520 (zero_extend:M (lshiftrt:N <X> (const_int I))) if I is not 0. */
1521 if (GET_CODE (op
) == LSHIFTRT
1522 && CONST_INT_P (XEXP (op
, 1))
1523 && XEXP (op
, 1) != const0_rtx
)
1524 return simplify_gen_unary (ZERO_EXTEND
, mode
, op
, GET_MODE (op
));
1526 #if defined(POINTERS_EXTEND_UNSIGNED)
1527 /* As we do not know which address space the pointer is referring to,
1528 we can do this only if the target does not support different pointer
1529 or address modes depending on the address space. */
1530 if (target_default_pointer_address_modes_p ()
1531 && ! POINTERS_EXTEND_UNSIGNED
1532 && mode
== Pmode
&& GET_MODE (op
) == ptr_mode
1534 || (GET_CODE (op
) == SUBREG
1535 && REG_P (SUBREG_REG (op
))
1536 && REG_POINTER (SUBREG_REG (op
))
1537 && GET_MODE (SUBREG_REG (op
)) == Pmode
))
1538 && !targetm
.have_ptr_extend ())
1541 = convert_memory_address_addr_space_1 (Pmode
, op
,
1542 ADDR_SPACE_GENERIC
, false,
1551 /* Check for a zero extension of a subreg of a promoted
1552 variable, where the promotion is zero-extended, and the
1553 target mode is the same as the variable's promotion. */
1554 if (GET_CODE (op
) == SUBREG
1555 && SUBREG_PROMOTED_VAR_P (op
)
1556 && SUBREG_PROMOTED_UNSIGNED_P (op
)
1557 && !paradoxical_subreg_p (mode
, GET_MODE (SUBREG_REG (op
))))
1559 temp
= rtl_hooks
.gen_lowpart_no_emit (mode
, SUBREG_REG (op
));
1564 /* Extending a widening multiplication should be canonicalized to
1565 a wider widening multiplication. */
1566 if (GET_CODE (op
) == MULT
)
1568 rtx lhs
= XEXP (op
, 0);
1569 rtx rhs
= XEXP (op
, 1);
1570 enum rtx_code lcode
= GET_CODE (lhs
);
1571 enum rtx_code rcode
= GET_CODE (rhs
);
1573 /* Widening multiplies usually extend both operands, but sometimes
1574 they use a shift to extract a portion of a register. */
1575 if ((lcode
== ZERO_EXTEND
1576 || (lcode
== LSHIFTRT
&& CONST_INT_P (XEXP (lhs
, 1))))
1577 && (rcode
== ZERO_EXTEND
1578 || (rcode
== LSHIFTRT
&& CONST_INT_P (XEXP (rhs
, 1)))))
1580 machine_mode lmode
= GET_MODE (lhs
);
1581 machine_mode rmode
= GET_MODE (rhs
);
1584 if (lcode
== LSHIFTRT
)
1585 /* Number of bits not shifted off the end. */
1586 bits
= (GET_MODE_UNIT_PRECISION (lmode
)
1587 - INTVAL (XEXP (lhs
, 1)));
1588 else /* lcode == ZERO_EXTEND */
1589 /* Size of inner mode. */
1590 bits
= GET_MODE_UNIT_PRECISION (GET_MODE (XEXP (lhs
, 0)));
1592 if (rcode
== LSHIFTRT
)
1593 bits
+= (GET_MODE_UNIT_PRECISION (rmode
)
1594 - INTVAL (XEXP (rhs
, 1)));
1595 else /* rcode == ZERO_EXTEND */
1596 bits
+= GET_MODE_UNIT_PRECISION (GET_MODE (XEXP (rhs
, 0)));
1598 /* We can only widen multiplies if the result is mathematiclly
1599 equivalent. I.e. if overflow was impossible. */
1600 if (bits
<= GET_MODE_UNIT_PRECISION (GET_MODE (op
)))
1601 return simplify_gen_binary
1603 simplify_gen_unary (ZERO_EXTEND
, mode
, lhs
, lmode
),
1604 simplify_gen_unary (ZERO_EXTEND
, mode
, rhs
, rmode
));
1608 /* (zero_extend:M (zero_extend:N <X>)) is (zero_extend:M <X>). */
1609 if (GET_CODE (op
) == ZERO_EXTEND
)
1610 return simplify_gen_unary (ZERO_EXTEND
, mode
, XEXP (op
, 0),
1611 GET_MODE (XEXP (op
, 0)));
1613 /* (zero_extend:M (lshiftrt:N (ashift <X> (const_int I)) (const_int I)))
1614 is (zero_extend:M (subreg:O <X>)) if there is mode with
1615 GET_MODE_PRECISION (N) - I bits. */
1616 if (GET_CODE (op
) == LSHIFTRT
1617 && GET_CODE (XEXP (op
, 0)) == ASHIFT
1618 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
1619 && CONST_INT_P (XEXP (op
, 1))
1620 && XEXP (XEXP (op
, 0), 1) == XEXP (op
, 1)
1621 && (op_mode
= as_a
<scalar_int_mode
> (GET_MODE (op
)),
1622 GET_MODE_PRECISION (op_mode
) > INTVAL (XEXP (op
, 1))))
1624 scalar_int_mode tmode
;
1625 if (int_mode_for_size (GET_MODE_PRECISION (op_mode
)
1626 - INTVAL (XEXP (op
, 1)), 1).exists (&tmode
))
1629 rtl_hooks
.gen_lowpart_no_emit (tmode
, XEXP (XEXP (op
, 0), 0));
1631 return simplify_gen_unary (ZERO_EXTEND
, int_mode
,
1636 /* (zero_extend:M (subreg:N <X:O>)) is <X:O> (for M == O) or
1637 (zero_extend:M <X:O>), if X doesn't have any non-zero bits outside
1639 (zero_extend:SI (subreg:QI (and:SI (reg:SI) (const_int 63)) 0)) is
1640 (and:SI (reg:SI) (const_int 63)). */
1641 if (partial_subreg_p (op
)
1642 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
1643 && is_a
<scalar_int_mode
> (GET_MODE (SUBREG_REG (op
)), &op0_mode
)
1644 && GET_MODE_PRECISION (op0_mode
) <= HOST_BITS_PER_WIDE_INT
1645 && GET_MODE_PRECISION (int_mode
) >= GET_MODE_PRECISION (op0_mode
)
1646 && subreg_lowpart_p (op
)
1647 && (nonzero_bits (SUBREG_REG (op
), op0_mode
)
1648 & ~GET_MODE_MASK (GET_MODE (op
))) == 0)
1650 if (GET_MODE_PRECISION (int_mode
) == GET_MODE_PRECISION (op0_mode
))
1651 return SUBREG_REG (op
);
1652 return simplify_gen_unary (ZERO_EXTEND
, int_mode
, SUBREG_REG (op
),
1656 #if defined(POINTERS_EXTEND_UNSIGNED)
1657 /* As we do not know which address space the pointer is referring to,
1658 we can do this only if the target does not support different pointer
1659 or address modes depending on the address space. */
1660 if (target_default_pointer_address_modes_p ()
1661 && POINTERS_EXTEND_UNSIGNED
> 0
1662 && mode
== Pmode
&& GET_MODE (op
) == ptr_mode
1664 || (GET_CODE (op
) == SUBREG
1665 && REG_P (SUBREG_REG (op
))
1666 && REG_POINTER (SUBREG_REG (op
))
1667 && GET_MODE (SUBREG_REG (op
)) == Pmode
))
1668 && !targetm
.have_ptr_extend ())
1671 = convert_memory_address_addr_space_1 (Pmode
, op
,
1672 ADDR_SPACE_GENERIC
, false,
1684 if (VECTOR_MODE_P (mode
)
1685 && vec_duplicate_p (op
, &elt
)
1686 && code
!= VEC_DUPLICATE
)
1688 /* Try applying the operator to ELT and see if that simplifies.
1689 We can duplicate the result if so.
1691 The reason we don't use simplify_gen_unary is that it isn't
1692 necessarily a win to convert things like:
1694 (neg:V (vec_duplicate:V (reg:S R)))
1698 (vec_duplicate:V (neg:S (reg:S R)))
1700 The first might be done entirely in vector registers while the
1701 second might need a move between register files. */
1702 temp
= simplify_unary_operation (code
, GET_MODE_INNER (mode
),
1703 elt
, GET_MODE_INNER (GET_MODE (op
)));
1705 return gen_vec_duplicate (mode
, temp
);
1711 /* Try to compute the value of a unary operation CODE whose output mode is to
1712 be MODE with input operand OP whose mode was originally OP_MODE.
1713 Return zero if the value cannot be computed. */
1715 simplify_const_unary_operation (enum rtx_code code
, machine_mode mode
,
1716 rtx op
, machine_mode op_mode
)
1718 scalar_int_mode result_mode
;
1720 if (code
== VEC_DUPLICATE
)
1722 gcc_assert (VECTOR_MODE_P (mode
));
1723 if (GET_MODE (op
) != VOIDmode
)
1725 if (!VECTOR_MODE_P (GET_MODE (op
)))
1726 gcc_assert (GET_MODE_INNER (mode
) == GET_MODE (op
));
1728 gcc_assert (GET_MODE_INNER (mode
) == GET_MODE_INNER
1731 if (CONST_SCALAR_INT_P (op
) || CONST_DOUBLE_AS_FLOAT_P (op
))
1732 return gen_const_vec_duplicate (mode
, op
);
1733 if (GET_CODE (op
) == CONST_VECTOR
1734 && (CONST_VECTOR_DUPLICATE_P (op
)
1735 || CONST_VECTOR_NUNITS (op
).is_constant ()))
1737 unsigned int npatterns
= (CONST_VECTOR_DUPLICATE_P (op
)
1738 ? CONST_VECTOR_NPATTERNS (op
)
1739 : CONST_VECTOR_NUNITS (op
).to_constant ());
1740 gcc_assert (multiple_p (GET_MODE_NUNITS (mode
), npatterns
));
1741 rtx_vector_builder
builder (mode
, npatterns
, 1);
1742 for (unsigned i
= 0; i
< npatterns
; i
++)
1743 builder
.quick_push (CONST_VECTOR_ELT (op
, i
));
1744 return builder
.build ();
1748 if (VECTOR_MODE_P (mode
)
1749 && GET_CODE (op
) == CONST_VECTOR
1750 && known_eq (GET_MODE_NUNITS (mode
), CONST_VECTOR_NUNITS (op
)))
1752 gcc_assert (GET_MODE (op
) == op_mode
);
1754 rtx_vector_builder builder
;
1755 if (!builder
.new_unary_operation (mode
, op
, false))
1758 unsigned int count
= builder
.encoded_nelts ();
1759 for (unsigned int i
= 0; i
< count
; i
++)
1761 rtx x
= simplify_unary_operation (code
, GET_MODE_INNER (mode
),
1762 CONST_VECTOR_ELT (op
, i
),
1763 GET_MODE_INNER (op_mode
));
1764 if (!x
|| !valid_for_const_vector_p (mode
, x
))
1766 builder
.quick_push (x
);
1768 return builder
.build ();
1771 /* The order of these tests is critical so that, for example, we don't
1772 check the wrong mode (input vs. output) for a conversion operation,
1773 such as FIX. At some point, this should be simplified. */
1775 if (code
== FLOAT
&& CONST_SCALAR_INT_P (op
))
1779 if (op_mode
== VOIDmode
)
1781 /* CONST_INT have VOIDmode as the mode. We assume that all
1782 the bits of the constant are significant, though, this is
1783 a dangerous assumption as many times CONST_INTs are
1784 created and used with garbage in the bits outside of the
1785 precision of the implied mode of the const_int. */
1786 op_mode
= MAX_MODE_INT
;
1789 real_from_integer (&d
, mode
, rtx_mode_t (op
, op_mode
), SIGNED
);
1791 /* Avoid the folding if flag_signaling_nans is on and
1792 operand is a signaling NaN. */
1793 if (HONOR_SNANS (mode
) && REAL_VALUE_ISSIGNALING_NAN (d
))
1796 d
= real_value_truncate (mode
, d
);
1797 return const_double_from_real_value (d
, mode
);
1799 else if (code
== UNSIGNED_FLOAT
&& CONST_SCALAR_INT_P (op
))
1803 if (op_mode
== VOIDmode
)
1805 /* CONST_INT have VOIDmode as the mode. We assume that all
1806 the bits of the constant are significant, though, this is
1807 a dangerous assumption as many times CONST_INTs are
1808 created and used with garbage in the bits outside of the
1809 precision of the implied mode of the const_int. */
1810 op_mode
= MAX_MODE_INT
;
1813 real_from_integer (&d
, mode
, rtx_mode_t (op
, op_mode
), UNSIGNED
);
1815 /* Avoid the folding if flag_signaling_nans is on and
1816 operand is a signaling NaN. */
1817 if (HONOR_SNANS (mode
) && REAL_VALUE_ISSIGNALING_NAN (d
))
1820 d
= real_value_truncate (mode
, d
);
1821 return const_double_from_real_value (d
, mode
);
1824 if (CONST_SCALAR_INT_P (op
) && is_a
<scalar_int_mode
> (mode
, &result_mode
))
1826 unsigned int width
= GET_MODE_PRECISION (result_mode
);
1828 scalar_int_mode imode
= (op_mode
== VOIDmode
1830 : as_a
<scalar_int_mode
> (op_mode
));
1831 rtx_mode_t op0
= rtx_mode_t (op
, imode
);
1834 #if TARGET_SUPPORTS_WIDE_INT == 0
1835 /* This assert keeps the simplification from producing a result
1836 that cannot be represented in a CONST_DOUBLE but a lot of
1837 upstream callers expect that this function never fails to
1838 simplify something and so you if you added this to the test
1839 above the code would die later anyway. If this assert
1840 happens, you just need to make the port support wide int. */
1841 gcc_assert (width
<= HOST_BITS_PER_DOUBLE_INT
);
1847 result
= wi::bit_not (op0
);
1851 result
= wi::neg (op0
);
1855 result
= wi::abs (op0
);
1859 result
= wi::shwi (wi::ffs (op0
), result_mode
);
1863 if (wi::ne_p (op0
, 0))
1864 int_value
= wi::clz (op0
);
1865 else if (! CLZ_DEFINED_VALUE_AT_ZERO (imode
, int_value
))
1867 result
= wi::shwi (int_value
, result_mode
);
1871 result
= wi::shwi (wi::clrsb (op0
), result_mode
);
1875 if (wi::ne_p (op0
, 0))
1876 int_value
= wi::ctz (op0
);
1877 else if (! CTZ_DEFINED_VALUE_AT_ZERO (imode
, int_value
))
1879 result
= wi::shwi (int_value
, result_mode
);
1883 result
= wi::shwi (wi::popcount (op0
), result_mode
);
1887 result
= wi::shwi (wi::parity (op0
), result_mode
);
1891 result
= wide_int (op0
).bswap ();
1896 result
= wide_int::from (op0
, width
, UNSIGNED
);
1900 result
= wide_int::from (op0
, width
, SIGNED
);
1908 return immed_wide_int_const (result
, result_mode
);
1911 else if (CONST_DOUBLE_AS_FLOAT_P (op
)
1912 && SCALAR_FLOAT_MODE_P (mode
)
1913 && SCALAR_FLOAT_MODE_P (GET_MODE (op
)))
1915 REAL_VALUE_TYPE d
= *CONST_DOUBLE_REAL_VALUE (op
);
1921 d
= real_value_abs (&d
);
1924 d
= real_value_negate (&d
);
1926 case FLOAT_TRUNCATE
:
1927 /* Don't perform the operation if flag_signaling_nans is on
1928 and the operand is a signaling NaN. */
1929 if (HONOR_SNANS (mode
) && REAL_VALUE_ISSIGNALING_NAN (d
))
1931 d
= real_value_truncate (mode
, d
);
1934 /* Don't perform the operation if flag_signaling_nans is on
1935 and the operand is a signaling NaN. */
1936 if (HONOR_SNANS (mode
) && REAL_VALUE_ISSIGNALING_NAN (d
))
1938 /* All this does is change the mode, unless changing
1940 if (GET_MODE_CLASS (mode
) != GET_MODE_CLASS (GET_MODE (op
)))
1941 real_convert (&d
, mode
, &d
);
1944 /* Don't perform the operation if flag_signaling_nans is on
1945 and the operand is a signaling NaN. */
1946 if (HONOR_SNANS (mode
) && REAL_VALUE_ISSIGNALING_NAN (d
))
1948 real_arithmetic (&d
, FIX_TRUNC_EXPR
, &d
, NULL
);
1955 real_to_target (tmp
, &d
, GET_MODE (op
));
1956 for (i
= 0; i
< 4; i
++)
1958 real_from_target (&d
, tmp
, mode
);
1964 return const_double_from_real_value (d
, mode
);
1966 else if (CONST_DOUBLE_AS_FLOAT_P (op
)
1967 && SCALAR_FLOAT_MODE_P (GET_MODE (op
))
1968 && is_int_mode (mode
, &result_mode
))
1970 unsigned int width
= GET_MODE_PRECISION (result_mode
);
1971 /* Although the overflow semantics of RTL's FIX and UNSIGNED_FIX
1972 operators are intentionally left unspecified (to ease implementation
1973 by target backends), for consistency, this routine implements the
1974 same semantics for constant folding as used by the middle-end. */
1976 /* This was formerly used only for non-IEEE float.
1977 eggert@twinsun.com says it is safe for IEEE also. */
1979 const REAL_VALUE_TYPE
*x
= CONST_DOUBLE_REAL_VALUE (op
);
1980 wide_int wmax
, wmin
;
1981 /* This is part of the abi to real_to_integer, but we check
1982 things before making this call. */
1988 if (REAL_VALUE_ISNAN (*x
))
1991 /* Test against the signed upper bound. */
1992 wmax
= wi::max_value (width
, SIGNED
);
1993 real_from_integer (&t
, VOIDmode
, wmax
, SIGNED
);
1994 if (real_less (&t
, x
))
1995 return immed_wide_int_const (wmax
, mode
);
1997 /* Test against the signed lower bound. */
1998 wmin
= wi::min_value (width
, SIGNED
);
1999 real_from_integer (&t
, VOIDmode
, wmin
, SIGNED
);
2000 if (real_less (x
, &t
))
2001 return immed_wide_int_const (wmin
, mode
);
2003 return immed_wide_int_const (real_to_integer (x
, &fail
, width
),
2007 if (REAL_VALUE_ISNAN (*x
) || REAL_VALUE_NEGATIVE (*x
))
2010 /* Test against the unsigned upper bound. */
2011 wmax
= wi::max_value (width
, UNSIGNED
);
2012 real_from_integer (&t
, VOIDmode
, wmax
, UNSIGNED
);
2013 if (real_less (&t
, x
))
2014 return immed_wide_int_const (wmax
, mode
);
2016 return immed_wide_int_const (real_to_integer (x
, &fail
, width
),
2024 /* Handle polynomial integers. */
2025 else if (CONST_POLY_INT_P (op
))
2027 poly_wide_int result
;
2031 result
= -const_poly_int_value (op
);
2035 result
= ~const_poly_int_value (op
);
2041 return immed_wide_int_const (result
, mode
);
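  /* Illustrative example (added for exposition): negating the
     variable-length constant (const_poly_int [16, 16]) yields
     (const_poly_int [-16, -16]); only NEG and NOT are handled here.  */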
/* Subroutine of simplify_binary_operation to simplify a binary operation
   CODE that can commute with byte swapping, with result mode MODE and
   operating on OP0 and OP1.  CODE is currently one of AND, IOR or XOR.
   Return zero if no simplification or canonicalization is possible.  */

static rtx
simplify_byte_swapping_operation (enum rtx_code code, machine_mode mode,
				  rtx op0, rtx op1)
{
  rtx tem;

2058 /* (op (bswap x) C1)) -> (bswap (op x C2)) with C2 swapped. */
2059 if (GET_CODE (op0
) == BSWAP
&& CONST_SCALAR_INT_P (op1
))
2061 tem
= simplify_gen_binary (code
, mode
, XEXP (op0
, 0),
2062 simplify_gen_unary (BSWAP
, mode
, op1
, mode
));
2063 return simplify_gen_unary (BSWAP
, mode
, tem
, mode
);
2066 /* (op (bswap x) (bswap y)) -> (bswap (op x y)). */
2067 if (GET_CODE (op0
) == BSWAP
&& GET_CODE (op1
) == BSWAP
)
2069 tem
= simplify_gen_binary (code
, mode
, XEXP (op0
, 0), XEXP (op1
, 0));
2070 return simplify_gen_unary (BSWAP
, mode
, tem
, mode
);
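  /* Illustrative example (added for exposition, assuming SImode):
     (and (bswap x) (const_int 0xff)) becomes
     (bswap (and x (const_int 0xff000000))), since byte-swapping the
     constant instead of X preserves the result.  */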
/* Subroutine of simplify_binary_operation to simplify a commutative,
   associative binary operation CODE with result mode MODE, operating
   on OP0 and OP1.  CODE is currently one of PLUS, MULT, AND, IOR, XOR,
   SMIN, SMAX, UMIN or UMAX.  Return zero if no simplification or
   canonicalization is possible.  */

static rtx
simplify_associative_operation (enum rtx_code code, machine_mode mode,
				rtx op0, rtx op1)
{
  rtx tem;

2088 /* Linearize the operator to the left. */
2089 if (GET_CODE (op1
) == code
)
2091 /* "(a op b) op (c op d)" becomes "((a op b) op c) op d)". */
2092 if (GET_CODE (op0
) == code
)
2094 tem
= simplify_gen_binary (code
, mode
, op0
, XEXP (op1
, 0));
2095 return simplify_gen_binary (code
, mode
, tem
, XEXP (op1
, 1));
2098 /* "a op (b op c)" becomes "(b op c) op a". */
2099 if (! swap_commutative_operands_p (op1
, op0
))
2100 return simplify_gen_binary (code
, mode
, op1
, op0
);
2102 std::swap (op0
, op1
);
2105 if (GET_CODE (op0
) == code
)
2107 /* Canonicalize "(x op c) op y" as "(x op y) op c". */
2108 if (swap_commutative_operands_p (XEXP (op0
, 1), op1
))
2110 tem
= simplify_gen_binary (code
, mode
, XEXP (op0
, 0), op1
);
2111 return simplify_gen_binary (code
, mode
, tem
, XEXP (op0
, 1));
2114 /* Attempt to simplify "(a op b) op c" as "a op (b op c)". */
2115 tem
= simplify_binary_operation (code
, mode
, XEXP (op0
, 1), op1
);
2117 return simplify_gen_binary (code
, mode
, XEXP (op0
, 0), tem
);
2119 /* Attempt to simplify "(a op b) op c" as "(a op c) op b". */
2120 tem
= simplify_binary_operation (code
, mode
, XEXP (op0
, 0), op1
);
2122 return simplify_gen_binary (code
, mode
, tem
, XEXP (op0
, 1));
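  /* Illustrative example (added for exposition): for
     (plus (plus x (const_int 4)) (const_int 8)) the constant
     subexpression simplifies, so the result is
     (plus x (const_int 12)).  */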
/* Simplify a binary operation CODE with result mode MODE, operating on OP0
   and OP1.  Return 0 if no simplification is possible.

   Don't use this for relational operations such as EQ or LT.
   Use simplify_relational_operation instead.  */

rtx
simplify_binary_operation (enum rtx_code code, machine_mode mode,
			   rtx op0, rtx op1)
{
  rtx trueop0, trueop1;
  rtx tem;

2141 /* Relational operations don't work here. We must know the mode
2142 of the operands in order to do the comparison correctly.
2143 Assuming a full word can give incorrect results.
2144 Consider comparing 128 with -128 in QImode. */
2145 gcc_assert (GET_RTX_CLASS (code
) != RTX_COMPARE
);
2146 gcc_assert (GET_RTX_CLASS (code
) != RTX_COMM_COMPARE
);
2148 /* Make sure the constant is second. */
2149 if (GET_RTX_CLASS (code
) == RTX_COMM_ARITH
2150 && swap_commutative_operands_p (op0
, op1
))
2151 std::swap (op0
, op1
);
2153 trueop0
= avoid_constant_pool_reference (op0
);
2154 trueop1
= avoid_constant_pool_reference (op1
);
2156 tem
= simplify_const_binary_operation (code
, mode
, trueop0
, trueop1
);
2159 tem
= simplify_binary_operation_1 (code
, mode
, op0
, op1
, trueop0
, trueop1
);
2164 /* If the above steps did not result in a simplification and op0 or op1
2165 were constant pool references, use the referenced constants directly. */
2166 if (trueop0
!= op0
|| trueop1
!= op1
)
2167 return simplify_gen_binary (code
, mode
, trueop0
, trueop1
);
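  /* Illustrative use (added for exposition; a hypothetical caller):
       rtx x = simplify_binary_operation (PLUS, SImode,
					  GEN_INT (4), GEN_INT (8));
     yields (const_int 12), whereas a NULL_RTX return means no
     simplification was found and the caller keeps its original RTL.  */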
/* Subroutine of simplify_binary_operation_1 that looks for cases in
   which OP0 and OP1 are both vector series or vector duplicates
   (which are really just series with a step of 0).  If so, try to
   form a new series by applying CODE to the bases and to the steps.
   Return null if no simplification is possible.

   MODE is the mode of the operation and is known to be a vector
   integer mode.  */

static rtx
simplify_binary_operation_series (rtx_code code, machine_mode mode,
				  rtx op0, rtx op1)
{
  rtx base0, step0;
2186 if (vec_duplicate_p (op0
, &base0
))
2188 else if (!vec_series_p (op0
, &base0
, &step0
))
2192 if (vec_duplicate_p (op1
, &base1
))
2194 else if (!vec_series_p (op1
, &base1
, &step1
))
2197 /* Only create a new series if we can simplify both parts. In other
2198 cases this isn't really a simplification, and it's not necessarily
2199 a win to replace a vector operation with a scalar operation. */
2200 scalar_mode inner_mode
= GET_MODE_INNER (mode
);
2201 rtx new_base
= simplify_binary_operation (code
, inner_mode
, base0
, base1
);
2205 rtx new_step
= simplify_binary_operation (code
, inner_mode
, step0
, step1
);
2209 return gen_vec_series (mode
, new_base
, new_step
);
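  /* Illustrative example (added for exposition): adding
     (vec_duplicate x) to the series 0, 1, 2, ... gives
     (vec_series x (const_int 1)), i.e. the series x, x+1, x+2, ...,
     provided both the base and the step additions simplify.  */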
/* Subroutine of simplify_binary_operation.  Simplify a binary operation
   CODE with result mode MODE, operating on OP0 and OP1.  If OP0 and/or
   OP1 are constant pool references, TRUEOP0 and TRUEOP1 represent the
   actual constants.  */

static rtx
simplify_binary_operation_1 (enum rtx_code code, machine_mode mode,
			     rtx op0, rtx op1, rtx trueop0, rtx trueop1)
{
2221 rtx tem
, reversed
, opleft
, opright
, elt0
, elt1
;
2223 scalar_int_mode int_mode
, inner_mode
;
2226 /* Even if we can't compute a constant result,
2227 there are some cases worth simplifying. */
2232 /* Maybe simplify x + 0 to x. The two expressions are equivalent
2233 when x is NaN, infinite, or finite and nonzero. They aren't
2234 when x is -0 and the rounding mode is not towards -infinity,
2235 since (-0) + 0 is then 0. */
2236 if (!HONOR_SIGNED_ZEROS (mode
) && trueop1
== CONST0_RTX (mode
))
2239 /* ((-a) + b) -> (b - a) and similarly for (a + (-b)). These
2240 transformations are safe even for IEEE. */
2241 if (GET_CODE (op0
) == NEG
)
2242 return simplify_gen_binary (MINUS
, mode
, op1
, XEXP (op0
, 0));
2243 else if (GET_CODE (op1
) == NEG
)
2244 return simplify_gen_binary (MINUS
, mode
, op0
, XEXP (op1
, 0));
2246 /* (~a) + 1 -> -a */
2247 if (INTEGRAL_MODE_P (mode
)
2248 && GET_CODE (op0
) == NOT
2249 && trueop1
== const1_rtx
)
2250 return simplify_gen_unary (NEG
, mode
, XEXP (op0
, 0), mode
);
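      /* Illustrative example (added for exposition): in SImode,
	 (plus (not x) (const_int 1)) becomes (neg x), which is just
	 two's-complement negation spelled out.  */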
2252 /* Handle both-operands-constant cases. We can only add
2253 CONST_INTs to constants since the sum of relocatable symbols
2254 can't be handled by most assemblers. Don't add CONST_INT
2255 to CONST_INT since overflow won't be computed properly if wider
2256 than HOST_BITS_PER_WIDE_INT. */
2258 if ((GET_CODE (op0
) == CONST
2259 || GET_CODE (op0
) == SYMBOL_REF
2260 || GET_CODE (op0
) == LABEL_REF
)
2261 && poly_int_rtx_p (op1
, &offset
))
2262 return plus_constant (mode
, op0
, offset
);
2263 else if ((GET_CODE (op1
) == CONST
2264 || GET_CODE (op1
) == SYMBOL_REF
2265 || GET_CODE (op1
) == LABEL_REF
)
2266 && poly_int_rtx_p (op0
, &offset
))
2267 return plus_constant (mode
, op1
, offset
);
2269 /* See if this is something like X * C - X or vice versa or
2270 if the multiplication is written as a shift. If so, we can
2271 distribute and make a new multiply, shift, or maybe just
2272 have X (if C is 2 in the example above). But don't make
2273 something more expensive than we had before. */
2275 if (is_a
<scalar_int_mode
> (mode
, &int_mode
))
2277 rtx lhs
= op0
, rhs
= op1
;
2279 wide_int coeff0
= wi::one (GET_MODE_PRECISION (int_mode
));
2280 wide_int coeff1
= wi::one (GET_MODE_PRECISION (int_mode
));
2282 if (GET_CODE (lhs
) == NEG
)
2284 coeff0
= wi::minus_one (GET_MODE_PRECISION (int_mode
));
2285 lhs
= XEXP (lhs
, 0);
2287 else if (GET_CODE (lhs
) == MULT
2288 && CONST_SCALAR_INT_P (XEXP (lhs
, 1)))
2290 coeff0
= rtx_mode_t (XEXP (lhs
, 1), int_mode
);
2291 lhs
= XEXP (lhs
, 0);
2293 else if (GET_CODE (lhs
) == ASHIFT
2294 && CONST_INT_P (XEXP (lhs
, 1))
2295 && INTVAL (XEXP (lhs
, 1)) >= 0
2296 && INTVAL (XEXP (lhs
, 1)) < GET_MODE_PRECISION (int_mode
))
2298 coeff0
= wi::set_bit_in_zero (INTVAL (XEXP (lhs
, 1)),
2299 GET_MODE_PRECISION (int_mode
));
2300 lhs
= XEXP (lhs
, 0);
2303 if (GET_CODE (rhs
) == NEG
)
2305 coeff1
= wi::minus_one (GET_MODE_PRECISION (int_mode
));
2306 rhs
= XEXP (rhs
, 0);
2308 else if (GET_CODE (rhs
) == MULT
2309 && CONST_INT_P (XEXP (rhs
, 1)))
2311 coeff1
= rtx_mode_t (XEXP (rhs
, 1), int_mode
);
2312 rhs
= XEXP (rhs
, 0);
2314 else if (GET_CODE (rhs
) == ASHIFT
2315 && CONST_INT_P (XEXP (rhs
, 1))
2316 && INTVAL (XEXP (rhs
, 1)) >= 0
2317 && INTVAL (XEXP (rhs
, 1)) < GET_MODE_PRECISION (int_mode
))
2319 coeff1
= wi::set_bit_in_zero (INTVAL (XEXP (rhs
, 1)),
2320 GET_MODE_PRECISION (int_mode
));
2321 rhs
= XEXP (rhs
, 0);
2324 if (rtx_equal_p (lhs
, rhs
))
2326 rtx orig
= gen_rtx_PLUS (int_mode
, op0
, op1
);
2328 bool speed
= optimize_function_for_speed_p (cfun
);
2330 coeff
= immed_wide_int_const (coeff0
+ coeff1
, int_mode
);
2332 tem
= simplify_gen_binary (MULT
, int_mode
, lhs
, coeff
);
2333 return (set_src_cost (tem
, int_mode
, speed
)
2334 <= set_src_cost (orig
, int_mode
, speed
) ? tem
: 0);
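	  /* Illustrative example (added for exposition): for
	     (plus (ashift x (const_int 2)) x) the coefficients are 4
	     and 1, so the candidate replacement is
	     (mult x (const_int 5)); it is kept only if set_src_cost
	     says it is no more expensive than the original PLUS.  */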
2338 /* (plus (xor X C1) C2) is (xor X (C1^C2)) if C2 is signbit. */
2339 if (CONST_SCALAR_INT_P (op1
)
2340 && GET_CODE (op0
) == XOR
2341 && CONST_SCALAR_INT_P (XEXP (op0
, 1))
2342 && mode_signbit_p (mode
, op1
))
2343 return simplify_gen_binary (XOR
, mode
, XEXP (op0
, 0),
2344 simplify_gen_binary (XOR
, mode
, op1
,
2347 /* Canonicalize (plus (mult (neg B) C) A) to (minus A (mult B C)). */
2348 if (!HONOR_SIGN_DEPENDENT_ROUNDING (mode
)
2349 && GET_CODE (op0
) == MULT
2350 && GET_CODE (XEXP (op0
, 0)) == NEG
)
2354 in1
= XEXP (XEXP (op0
, 0), 0);
2355 in2
= XEXP (op0
, 1);
2356 return simplify_gen_binary (MINUS
, mode
, op1
,
2357 simplify_gen_binary (MULT
, mode
,
2361 /* (plus (comparison A B) C) can become (neg (rev-comp A B)) if
2362 C is 1 and STORE_FLAG_VALUE is -1 or if C is -1 and STORE_FLAG_VALUE
2364 if (COMPARISON_P (op0
)
2365 && ((STORE_FLAG_VALUE
== -1 && trueop1
== const1_rtx
)
2366 || (STORE_FLAG_VALUE
== 1 && trueop1
== constm1_rtx
))
2367 && (reversed
= reversed_comparison (op0
, mode
)))
2369 simplify_gen_unary (NEG
, mode
, reversed
, mode
);
2371 /* If one of the operands is a PLUS or a MINUS, see if we can
2372 simplify this by the associative law.
2373 Don't use the associative law for floating point.
2374 The inaccuracy makes it nonassociative,
2375 and subtle programs can break if operations are associated. */
2377 if (INTEGRAL_MODE_P (mode
)
2378 && (plus_minus_operand_p (op0
)
2379 || plus_minus_operand_p (op1
))
2380 && (tem
= simplify_plus_minus (code
, mode
, op0
, op1
)) != 0)
2383 /* Reassociate floating point addition only when the user
2384 specifies associative math operations. */
2385 if (FLOAT_MODE_P (mode
)
2386 && flag_associative_math
)
2388 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
2393 /* Handle vector series. */
2394 if (GET_MODE_CLASS (mode
) == MODE_VECTOR_INT
)
2396 tem
= simplify_binary_operation_series (code
, mode
, op0
, op1
);
2403 /* Convert (compare (gt (flags) 0) (lt (flags) 0)) to (flags). */
2404 if (((GET_CODE (op0
) == GT
&& GET_CODE (op1
) == LT
)
2405 || (GET_CODE (op0
) == GTU
&& GET_CODE (op1
) == LTU
))
2406 && XEXP (op0
, 1) == const0_rtx
&& XEXP (op1
, 1) == const0_rtx
)
2408 rtx xop00
= XEXP (op0
, 0);
2409 rtx xop10
= XEXP (op1
, 0);
2411 if (GET_CODE (xop00
) == CC0
&& GET_CODE (xop10
) == CC0
)
2414 if (REG_P (xop00
) && REG_P (xop10
)
2415 && REGNO (xop00
) == REGNO (xop10
)
2416 && GET_MODE (xop00
) == mode
2417 && GET_MODE (xop10
) == mode
2418 && GET_MODE_CLASS (mode
) == MODE_CC
)
2424 /* We can't assume x-x is 0 even with non-IEEE floating point,
2425 but since it is zero except in very strange circumstances, we
2426 will treat it as zero with -ffinite-math-only. */
2427 if (rtx_equal_p (trueop0
, trueop1
)
2428 && ! side_effects_p (op0
)
2429 && (!FLOAT_MODE_P (mode
) || !HONOR_NANS (mode
)))
2430 return CONST0_RTX (mode
);
2432 /* Change subtraction from zero into negation. (0 - x) is the
2433 same as -x when x is NaN, infinite, or finite and nonzero.
2434 But if the mode has signed zeros, and does not round towards
2435 -infinity, then 0 - 0 is 0, not -0. */
2436 if (!HONOR_SIGNED_ZEROS (mode
) && trueop0
== CONST0_RTX (mode
))
2437 return simplify_gen_unary (NEG
, mode
, op1
, mode
);
2439 /* (-1 - a) is ~a, unless the expression contains symbolic
2440 constants, in which case not retaining additions and
2441 subtractions could cause invalid assembly to be produced. */
2442 if (trueop0
== constm1_rtx
2443 && !contains_symbolic_reference_p (op1
))
2444 return simplify_gen_unary (NOT
, mode
, op1
, mode
);
      /* Subtracting 0 has no effect unless the mode has signed zeros
	 and supports rounding towards -infinity.  In such a case,
	 0 - 0 is -0.  */
2449 if (!(HONOR_SIGNED_ZEROS (mode
)
2450 && HONOR_SIGN_DEPENDENT_ROUNDING (mode
))
2451 && trueop1
== CONST0_RTX (mode
))
2454 /* See if this is something like X * C - X or vice versa or
2455 if the multiplication is written as a shift. If so, we can
2456 distribute and make a new multiply, shift, or maybe just
2457 have X (if C is 2 in the example above). But don't make
2458 something more expensive than we had before. */
2460 if (is_a
<scalar_int_mode
> (mode
, &int_mode
))
2462 rtx lhs
= op0
, rhs
= op1
;
2464 wide_int coeff0
= wi::one (GET_MODE_PRECISION (int_mode
));
2465 wide_int negcoeff1
= wi::minus_one (GET_MODE_PRECISION (int_mode
));
2467 if (GET_CODE (lhs
) == NEG
)
2469 coeff0
= wi::minus_one (GET_MODE_PRECISION (int_mode
));
2470 lhs
= XEXP (lhs
, 0);
2472 else if (GET_CODE (lhs
) == MULT
2473 && CONST_SCALAR_INT_P (XEXP (lhs
, 1)))
2475 coeff0
= rtx_mode_t (XEXP (lhs
, 1), int_mode
);
2476 lhs
= XEXP (lhs
, 0);
2478 else if (GET_CODE (lhs
) == ASHIFT
2479 && CONST_INT_P (XEXP (lhs
, 1))
2480 && INTVAL (XEXP (lhs
, 1)) >= 0
2481 && INTVAL (XEXP (lhs
, 1)) < GET_MODE_PRECISION (int_mode
))
2483 coeff0
= wi::set_bit_in_zero (INTVAL (XEXP (lhs
, 1)),
2484 GET_MODE_PRECISION (int_mode
));
2485 lhs
= XEXP (lhs
, 0);
2488 if (GET_CODE (rhs
) == NEG
)
2490 negcoeff1
= wi::one (GET_MODE_PRECISION (int_mode
));
2491 rhs
= XEXP (rhs
, 0);
2493 else if (GET_CODE (rhs
) == MULT
2494 && CONST_INT_P (XEXP (rhs
, 1)))
2496 negcoeff1
= wi::neg (rtx_mode_t (XEXP (rhs
, 1), int_mode
));
2497 rhs
= XEXP (rhs
, 0);
2499 else if (GET_CODE (rhs
) == ASHIFT
2500 && CONST_INT_P (XEXP (rhs
, 1))
2501 && INTVAL (XEXP (rhs
, 1)) >= 0
2502 && INTVAL (XEXP (rhs
, 1)) < GET_MODE_PRECISION (int_mode
))
2504 negcoeff1
= wi::set_bit_in_zero (INTVAL (XEXP (rhs
, 1)),
2505 GET_MODE_PRECISION (int_mode
));
2506 negcoeff1
= -negcoeff1
;
2507 rhs
= XEXP (rhs
, 0);
2510 if (rtx_equal_p (lhs
, rhs
))
2512 rtx orig
= gen_rtx_MINUS (int_mode
, op0
, op1
);
2514 bool speed
= optimize_function_for_speed_p (cfun
);
2516 coeff
= immed_wide_int_const (coeff0
+ negcoeff1
, int_mode
);
2518 tem
= simplify_gen_binary (MULT
, int_mode
, lhs
, coeff
);
2519 return (set_src_cost (tem
, int_mode
, speed
)
2520 <= set_src_cost (orig
, int_mode
, speed
) ? tem
: 0);
2524 /* (a - (-b)) -> (a + b). True even for IEEE. */
2525 if (GET_CODE (op1
) == NEG
)
2526 return simplify_gen_binary (PLUS
, mode
, op0
, XEXP (op1
, 0));
2528 /* (-x - c) may be simplified as (-c - x). */
2529 if (GET_CODE (op0
) == NEG
2530 && (CONST_SCALAR_INT_P (op1
) || CONST_DOUBLE_AS_FLOAT_P (op1
)))
2532 tem
= simplify_unary_operation (NEG
, mode
, op1
, mode
);
2534 return simplify_gen_binary (MINUS
, mode
, tem
, XEXP (op0
, 0));
2537 if ((GET_CODE (op0
) == CONST
2538 || GET_CODE (op0
) == SYMBOL_REF
2539 || GET_CODE (op0
) == LABEL_REF
)
2540 && poly_int_rtx_p (op1
, &offset
))
2541 return plus_constant (mode
, op0
, trunc_int_for_mode (-offset
, mode
));
2543 /* Don't let a relocatable value get a negative coeff. */
2544 if (poly_int_rtx_p (op1
) && GET_MODE (op0
) != VOIDmode
)
2545 return simplify_gen_binary (PLUS
, mode
,
2547 neg_poly_int_rtx (mode
, op1
));
2549 /* (x - (x & y)) -> (x & ~y) */
2550 if (INTEGRAL_MODE_P (mode
) && GET_CODE (op1
) == AND
)
2552 if (rtx_equal_p (op0
, XEXP (op1
, 0)))
2554 tem
= simplify_gen_unary (NOT
, mode
, XEXP (op1
, 1),
2555 GET_MODE (XEXP (op1
, 1)));
2556 return simplify_gen_binary (AND
, mode
, op0
, tem
);
2558 if (rtx_equal_p (op0
, XEXP (op1
, 1)))
2560 tem
= simplify_gen_unary (NOT
, mode
, XEXP (op1
, 0),
2561 GET_MODE (XEXP (op1
, 0)));
2562 return simplify_gen_binary (AND
, mode
, op0
, tem
);
2566 /* If STORE_FLAG_VALUE is 1, (minus 1 (comparison foo bar)) can be done
2567 by reversing the comparison code if valid. */
2568 if (STORE_FLAG_VALUE
== 1
2569 && trueop0
== const1_rtx
2570 && COMPARISON_P (op1
)
2571 && (reversed
= reversed_comparison (op1
, mode
)))
2574 /* Canonicalize (minus A (mult (neg B) C)) to (plus (mult B C) A). */
2575 if (!HONOR_SIGN_DEPENDENT_ROUNDING (mode
)
2576 && GET_CODE (op1
) == MULT
2577 && GET_CODE (XEXP (op1
, 0)) == NEG
)
2581 in1
= XEXP (XEXP (op1
, 0), 0);
2582 in2
= XEXP (op1
, 1);
2583 return simplify_gen_binary (PLUS
, mode
,
2584 simplify_gen_binary (MULT
, mode
,
2589 /* Canonicalize (minus (neg A) (mult B C)) to
2590 (minus (mult (neg B) C) A). */
2591 if (!HONOR_SIGN_DEPENDENT_ROUNDING (mode
)
2592 && GET_CODE (op1
) == MULT
2593 && GET_CODE (op0
) == NEG
)
2597 in1
= simplify_gen_unary (NEG
, mode
, XEXP (op1
, 0), mode
);
2598 in2
= XEXP (op1
, 1);
2599 return simplify_gen_binary (MINUS
, mode
,
2600 simplify_gen_binary (MULT
, mode
,
2605 /* If one of the operands is a PLUS or a MINUS, see if we can
2606 simplify this by the associative law. This will, for example,
2607 canonicalize (minus A (plus B C)) to (minus (minus A B) C).
2608 Don't use the associative law for floating point.
2609 The inaccuracy makes it nonassociative,
2610 and subtle programs can break if operations are associated. */
2612 if (INTEGRAL_MODE_P (mode
)
2613 && (plus_minus_operand_p (op0
)
2614 || plus_minus_operand_p (op1
))
2615 && (tem
= simplify_plus_minus (code
, mode
, op0
, op1
)) != 0)
2618 /* Handle vector series. */
2619 if (GET_MODE_CLASS (mode
) == MODE_VECTOR_INT
)
2621 tem
= simplify_binary_operation_series (code
, mode
, op0
, op1
);
2628 if (trueop1
== constm1_rtx
)
2629 return simplify_gen_unary (NEG
, mode
, op0
, mode
);
2631 if (GET_CODE (op0
) == NEG
)
2633 rtx temp
= simplify_unary_operation (NEG
, mode
, op1
, mode
);
	  /* If op1 is a MULT as well and simplify_unary_operation
	     just moved the NEG to the second operand, simplify_gen_binary
	     below could, through simplify_associative_operation, move
	     the NEG around again and recurse endlessly.  */
	  if (temp
2639 && GET_CODE (op1
) == MULT
2640 && GET_CODE (temp
) == MULT
2641 && XEXP (op1
, 0) == XEXP (temp
, 0)
2642 && GET_CODE (XEXP (temp
, 1)) == NEG
2643 && XEXP (op1
, 1) == XEXP (XEXP (temp
, 1), 0))
2646 return simplify_gen_binary (MULT
, mode
, XEXP (op0
, 0), temp
);
2648 if (GET_CODE (op1
) == NEG
)
2650 rtx temp
= simplify_unary_operation (NEG
, mode
, op0
, mode
);
	  /* If op0 is a MULT as well and simplify_unary_operation
	     just moved the NEG to the second operand, simplify_gen_binary
	     below could, through simplify_associative_operation, move
	     the NEG around again and recurse endlessly.  */
	  if (temp
2656 && GET_CODE (op0
) == MULT
2657 && GET_CODE (temp
) == MULT
2658 && XEXP (op0
, 0) == XEXP (temp
, 0)
2659 && GET_CODE (XEXP (temp
, 1)) == NEG
2660 && XEXP (op0
, 1) == XEXP (XEXP (temp
, 1), 0))
2663 return simplify_gen_binary (MULT
, mode
, temp
, XEXP (op1
, 0));
2666 /* Maybe simplify x * 0 to 0. The reduction is not valid if
2667 x is NaN, since x * 0 is then also NaN. Nor is it valid
2668 when the mode has signed zeros, since multiplying a negative
2669 number by 0 will give -0, not 0. */
2670 if (!HONOR_NANS (mode
)
2671 && !HONOR_SIGNED_ZEROS (mode
)
2672 && trueop1
== CONST0_RTX (mode
)
2673 && ! side_effects_p (op0
))
      /* In IEEE floating point, x*1 is not equivalent to x for
	 signaling NaNs.  */
2678 if (!HONOR_SNANS (mode
)
2679 && trueop1
== CONST1_RTX (mode
))
2682 /* Convert multiply by constant power of two into shift. */
2683 if (CONST_SCALAR_INT_P (trueop1
))
2685 val
= wi::exact_log2 (rtx_mode_t (trueop1
, mode
));
2687 return simplify_gen_binary (ASHIFT
, mode
, op0
,
2688 gen_int_shift_amount (mode
, val
));
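      /* Illustrative example (added for exposition):
	 (mult:SI x (const_int 8)) becomes (ashift:SI x (const_int 3)).  */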
2691 /* x*2 is x+x and x*(-1) is -x */
2692 if (CONST_DOUBLE_AS_FLOAT_P (trueop1
)
2693 && SCALAR_FLOAT_MODE_P (GET_MODE (trueop1
))
2694 && !DECIMAL_FLOAT_MODE_P (GET_MODE (trueop1
))
2695 && GET_MODE (op0
) == mode
)
2697 const REAL_VALUE_TYPE
*d1
= CONST_DOUBLE_REAL_VALUE (trueop1
);
2699 if (real_equal (d1
, &dconst2
))
2700 return simplify_gen_binary (PLUS
, mode
, op0
, copy_rtx (op0
));
2702 if (!HONOR_SNANS (mode
)
2703 && real_equal (d1
, &dconstm1
))
2704 return simplify_gen_unary (NEG
, mode
, op0
, mode
);
2707 /* Optimize -x * -x as x * x. */
2708 if (FLOAT_MODE_P (mode
)
2709 && GET_CODE (op0
) == NEG
2710 && GET_CODE (op1
) == NEG
2711 && rtx_equal_p (XEXP (op0
, 0), XEXP (op1
, 0))
2712 && !side_effects_p (XEXP (op0
, 0)))
2713 return simplify_gen_binary (MULT
, mode
, XEXP (op0
, 0), XEXP (op1
, 0));
2715 /* Likewise, optimize abs(x) * abs(x) as x * x. */
2716 if (SCALAR_FLOAT_MODE_P (mode
)
2717 && GET_CODE (op0
) == ABS
2718 && GET_CODE (op1
) == ABS
2719 && rtx_equal_p (XEXP (op0
, 0), XEXP (op1
, 0))
2720 && !side_effects_p (XEXP (op0
, 0)))
2721 return simplify_gen_binary (MULT
, mode
, XEXP (op0
, 0), XEXP (op1
, 0));
2723 /* Reassociate multiplication, but for floating point MULTs
2724 only when the user specifies unsafe math optimizations. */
2725 if (! FLOAT_MODE_P (mode
)
2726 || flag_unsafe_math_optimizations
)
2728 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
2735 if (trueop1
== CONST0_RTX (mode
))
2737 if (INTEGRAL_MODE_P (mode
)
2738 && trueop1
== CONSTM1_RTX (mode
)
2739 && !side_effects_p (op0
))
2741 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
))
2743 /* A | (~A) -> -1 */
2744 if (((GET_CODE (op0
) == NOT
&& rtx_equal_p (XEXP (op0
, 0), op1
))
2745 || (GET_CODE (op1
) == NOT
&& rtx_equal_p (XEXP (op1
, 0), op0
)))
2746 && ! side_effects_p (op0
)
2747 && SCALAR_INT_MODE_P (mode
))
2750 /* (ior A C) is C if all bits of A that might be nonzero are on in C. */
2751 if (CONST_INT_P (op1
)
2752 && HWI_COMPUTABLE_MODE_P (mode
)
2753 && (nonzero_bits (op0
, mode
) & ~UINTVAL (op1
)) == 0
2754 && !side_effects_p (op0
))
2757 /* Canonicalize (X & C1) | C2. */
2758 if (GET_CODE (op0
) == AND
2759 && CONST_INT_P (trueop1
)
2760 && CONST_INT_P (XEXP (op0
, 1)))
2762 HOST_WIDE_INT mask
= GET_MODE_MASK (mode
);
2763 HOST_WIDE_INT c1
= INTVAL (XEXP (op0
, 1));
2764 HOST_WIDE_INT c2
= INTVAL (trueop1
);
2766 /* If (C1&C2) == C1, then (X&C1)|C2 becomes C2. */
2768 && !side_effects_p (XEXP (op0
, 0)))
2771 /* If (C1|C2) == ~0 then (X&C1)|C2 becomes X|C2. */
2772 if (((c1
|c2
) & mask
) == mask
)
2773 return simplify_gen_binary (IOR
, mode
, XEXP (op0
, 0), op1
);
2776 /* Convert (A & B) | A to A. */
2777 if (GET_CODE (op0
) == AND
2778 && (rtx_equal_p (XEXP (op0
, 0), op1
)
2779 || rtx_equal_p (XEXP (op0
, 1), op1
))
2780 && ! side_effects_p (XEXP (op0
, 0))
2781 && ! side_effects_p (XEXP (op0
, 1)))
2784 /* Convert (ior (ashift A CX) (lshiftrt A CY)) where CX+CY equals the
2785 mode size to (rotate A CX). */
2787 if (GET_CODE (op1
) == ASHIFT
2788 || GET_CODE (op1
) == SUBREG
)
2799 if (GET_CODE (opleft
) == ASHIFT
&& GET_CODE (opright
) == LSHIFTRT
2800 && rtx_equal_p (XEXP (opleft
, 0), XEXP (opright
, 0))
2801 && CONST_INT_P (XEXP (opleft
, 1))
2802 && CONST_INT_P (XEXP (opright
, 1))
2803 && (INTVAL (XEXP (opleft
, 1)) + INTVAL (XEXP (opright
, 1))
2804 == GET_MODE_UNIT_PRECISION (mode
)))
2805 return gen_rtx_ROTATE (mode
, XEXP (opright
, 0), XEXP (opleft
, 1));
2807 /* Same, but for ashift that has been "simplified" to a wider mode
2808 by simplify_shift_const. */
2810 if (GET_CODE (opleft
) == SUBREG
2811 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
2812 && is_a
<scalar_int_mode
> (GET_MODE (SUBREG_REG (opleft
)),
2814 && GET_CODE (SUBREG_REG (opleft
)) == ASHIFT
2815 && GET_CODE (opright
) == LSHIFTRT
2816 && GET_CODE (XEXP (opright
, 0)) == SUBREG
2817 && known_eq (SUBREG_BYTE (opleft
), SUBREG_BYTE (XEXP (opright
, 0)))
2818 && GET_MODE_SIZE (int_mode
) < GET_MODE_SIZE (inner_mode
)
2819 && rtx_equal_p (XEXP (SUBREG_REG (opleft
), 0),
2820 SUBREG_REG (XEXP (opright
, 0)))
2821 && CONST_INT_P (XEXP (SUBREG_REG (opleft
), 1))
2822 && CONST_INT_P (XEXP (opright
, 1))
2823 && (INTVAL (XEXP (SUBREG_REG (opleft
), 1))
2824 + INTVAL (XEXP (opright
, 1))
2825 == GET_MODE_PRECISION (int_mode
)))
2826 return gen_rtx_ROTATE (int_mode
, XEXP (opright
, 0),
2827 XEXP (SUBREG_REG (opleft
), 1));
2829 /* If OP0 is (ashiftrt (plus ...) C), it might actually be
2830 a (sign_extend (plus ...)). Then check if OP1 is a CONST_INT and
2831 the PLUS does not affect any of the bits in OP1: then we can do
2832 the IOR as a PLUS and we can associate. This is valid if OP1
2833 can be safely shifted left C bits. */
2834 if (CONST_INT_P (trueop1
) && GET_CODE (op0
) == ASHIFTRT
2835 && GET_CODE (XEXP (op0
, 0)) == PLUS
2836 && CONST_INT_P (XEXP (XEXP (op0
, 0), 1))
2837 && CONST_INT_P (XEXP (op0
, 1))
2838 && INTVAL (XEXP (op0
, 1)) < HOST_BITS_PER_WIDE_INT
)
2840 int count
= INTVAL (XEXP (op0
, 1));
2841 HOST_WIDE_INT mask
= UINTVAL (trueop1
) << count
;
2843 if (mask
>> count
== INTVAL (trueop1
)
2844 && trunc_int_for_mode (mask
, mode
) == mask
2845 && (mask
& nonzero_bits (XEXP (op0
, 0), mode
)) == 0)
2846 return simplify_gen_binary (ASHIFTRT
, mode
,
2847 plus_constant (mode
, XEXP (op0
, 0),
2852 /* The following happens with bitfield merging.
2853 (X & C) | ((X | Y) & ~C) -> X | (Y & ~C) */
2854 if (GET_CODE (op0
) == AND
2855 && GET_CODE (op1
) == AND
2856 && CONST_INT_P (XEXP (op0
, 1))
2857 && CONST_INT_P (XEXP (op1
, 1))
2858 && (INTVAL (XEXP (op0
, 1))
2859 == ~INTVAL (XEXP (op1
, 1))))
2861 /* The IOR may be on both sides. */
2862 rtx top0
= NULL_RTX
, top1
= NULL_RTX
;
2863 if (GET_CODE (XEXP (op1
, 0)) == IOR
)
2864 top0
= op0
, top1
= op1
;
2865 else if (GET_CODE (XEXP (op0
, 0)) == IOR
)
2866 top0
= op1
, top1
= op0
;
2869 /* X may be on either side of the inner IOR. */
2871 if (rtx_equal_p (XEXP (top0
, 0),
2872 XEXP (XEXP (top1
, 0), 0)))
2873 tem
= XEXP (XEXP (top1
, 0), 1);
2874 else if (rtx_equal_p (XEXP (top0
, 0),
2875 XEXP (XEXP (top1
, 0), 1)))
2876 tem
= XEXP (XEXP (top1
, 0), 0);
2878 return simplify_gen_binary (IOR
, mode
, XEXP (top0
, 0),
2880 (AND
, mode
, tem
, XEXP (top1
, 1)));
2884 tem
= simplify_byte_swapping_operation (code
, mode
, op0
, op1
);
2888 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
2894 if (trueop1
== CONST0_RTX (mode
))
2896 if (INTEGRAL_MODE_P (mode
) && trueop1
== CONSTM1_RTX (mode
))
2897 return simplify_gen_unary (NOT
, mode
, op0
, mode
);
2898 if (rtx_equal_p (trueop0
, trueop1
)
2899 && ! side_effects_p (op0
)
2900 && GET_MODE_CLASS (mode
) != MODE_CC
)
2901 return CONST0_RTX (mode
);
2903 /* Canonicalize XOR of the most significant bit to PLUS. */
2904 if (CONST_SCALAR_INT_P (op1
)
2905 && mode_signbit_p (mode
, op1
))
2906 return simplify_gen_binary (PLUS
, mode
, op0
, op1
);
2907 /* (xor (plus X C1) C2) is (xor X (C1^C2)) if C1 is signbit. */
2908 if (CONST_SCALAR_INT_P (op1
)
2909 && GET_CODE (op0
) == PLUS
2910 && CONST_SCALAR_INT_P (XEXP (op0
, 1))
2911 && mode_signbit_p (mode
, XEXP (op0
, 1)))
2912 return simplify_gen_binary (XOR
, mode
, XEXP (op0
, 0),
2913 simplify_gen_binary (XOR
, mode
, op1
,
2916 /* If we are XORing two things that have no bits in common,
2917 convert them into an IOR. This helps to detect rotation encoded
2918 using those methods and possibly other simplifications. */
2920 if (HWI_COMPUTABLE_MODE_P (mode
)
2921 && (nonzero_bits (op0
, mode
)
2922 & nonzero_bits (op1
, mode
)) == 0)
2923 return (simplify_gen_binary (IOR
, mode
, op0
, op1
));
      /* Convert (XOR (NOT x) (NOT y)) to (XOR x y).
	 Also convert (XOR (NOT x) y) to (NOT (XOR x y)), similarly for
	 (NOT y).  */
2929 int num_negated
= 0;
2931 if (GET_CODE (op0
) == NOT
)
2932 num_negated
++, op0
= XEXP (op0
, 0);
2933 if (GET_CODE (op1
) == NOT
)
2934 num_negated
++, op1
= XEXP (op1
, 0);
2936 if (num_negated
== 2)
2937 return simplify_gen_binary (XOR
, mode
, op0
, op1
);
2938 else if (num_negated
== 1)
2939 return simplify_gen_unary (NOT
, mode
,
2940 simplify_gen_binary (XOR
, mode
, op0
, op1
),
2944 /* Convert (xor (and A B) B) to (and (not A) B). The latter may
2945 correspond to a machine insn or result in further simplifications
2946 if B is a constant. */
2948 if (GET_CODE (op0
) == AND
2949 && rtx_equal_p (XEXP (op0
, 1), op1
)
2950 && ! side_effects_p (op1
))
2951 return simplify_gen_binary (AND
, mode
,
2952 simplify_gen_unary (NOT
, mode
,
2953 XEXP (op0
, 0), mode
),
2956 else if (GET_CODE (op0
) == AND
2957 && rtx_equal_p (XEXP (op0
, 0), op1
)
2958 && ! side_effects_p (op1
))
2959 return simplify_gen_binary (AND
, mode
,
2960 simplify_gen_unary (NOT
, mode
,
2961 XEXP (op0
, 1), mode
),
2964 /* Given (xor (ior (xor A B) C) D), where B, C and D are
2965 constants, simplify to (xor (ior A C) (B&~C)^D), canceling
2966 out bits inverted twice and not set by C. Similarly, given
2967 (xor (and (xor A B) C) D), simplify without inverting C in
2968 the xor operand: (xor (and A C) (B&C)^D).
2970 else if ((GET_CODE (op0
) == IOR
|| GET_CODE (op0
) == AND
)
2971 && GET_CODE (XEXP (op0
, 0)) == XOR
2972 && CONST_INT_P (op1
)
2973 && CONST_INT_P (XEXP (op0
, 1))
2974 && CONST_INT_P (XEXP (XEXP (op0
, 0), 1)))
2976 enum rtx_code op
= GET_CODE (op0
);
2977 rtx a
= XEXP (XEXP (op0
, 0), 0);
2978 rtx b
= XEXP (XEXP (op0
, 0), 1);
2979 rtx c
= XEXP (op0
, 1);
2981 HOST_WIDE_INT bval
= INTVAL (b
);
2982 HOST_WIDE_INT cval
= INTVAL (c
);
2983 HOST_WIDE_INT dval
= INTVAL (d
);
2984 HOST_WIDE_INT xcval
;
2991 return simplify_gen_binary (XOR
, mode
,
2992 simplify_gen_binary (op
, mode
, a
, c
),
2993 gen_int_mode ((bval
& xcval
) ^ dval
,
2997 /* Given (xor (and A B) C), using P^Q == (~P&Q) | (~Q&P),
2998 we can transform like this:
2999 (A&B)^C == ~(A&B)&C | ~C&(A&B)
3000 == (~A|~B)&C | ~C&(A&B) * DeMorgan's Law
3001 == ~A&C | ~B&C | A&(~C&B) * Distribute and re-order
3002 Attempt a few simplifications when B and C are both constants. */
3003 if (GET_CODE (op0
) == AND
3004 && CONST_INT_P (op1
)
3005 && CONST_INT_P (XEXP (op0
, 1)))
3007 rtx a
= XEXP (op0
, 0);
3008 rtx b
= XEXP (op0
, 1);
3010 HOST_WIDE_INT bval
= INTVAL (b
);
3011 HOST_WIDE_INT cval
= INTVAL (c
);
3013 /* Instead of computing ~A&C, we compute its negated value,
3014 ~(A|~C). If it yields -1, ~A&C is zero, so we can
3015 optimize for sure. If it does not simplify, we still try
3016 to compute ~A&C below, but since that always allocates
3017 RTL, we don't try that before committing to returning a
3018 simplified expression. */
3019 rtx n_na_c
= simplify_binary_operation (IOR
, mode
, a
,
3022 if ((~cval
& bval
) == 0)
3024 rtx na_c
= NULL_RTX
;
3026 na_c
= simplify_gen_unary (NOT
, mode
, n_na_c
, mode
);
3029 /* If ~A does not simplify, don't bother: we don't
3030 want to simplify 2 operations into 3, and if na_c
3031 were to simplify with na, n_na_c would have
3032 simplified as well. */
3033 rtx na
= simplify_unary_operation (NOT
, mode
, a
, mode
);
3035 na_c
= simplify_gen_binary (AND
, mode
, na
, c
);
3038 /* Try to simplify ~A&C | ~B&C. */
3039 if (na_c
!= NULL_RTX
)
3040 return simplify_gen_binary (IOR
, mode
, na_c
,
3041 gen_int_mode (~bval
& cval
, mode
));
3045 /* If ~A&C is zero, simplify A&(~C&B) | ~B&C. */
3046 if (n_na_c
== CONSTM1_RTX (mode
))
3048 rtx a_nc_b
= simplify_gen_binary (AND
, mode
, a
,
3049 gen_int_mode (~cval
& bval
,
3051 return simplify_gen_binary (IOR
, mode
, a_nc_b
,
3052 gen_int_mode (~bval
& cval
,
3058 /* If we have (xor (and (xor A B) C) A) with C a constant we can instead
3059 do (ior (and A ~C) (and B C)) which is a machine instruction on some
3060 machines, and also has shorter instruction path length. */
3061 if (GET_CODE (op0
) == AND
3062 && GET_CODE (XEXP (op0
, 0)) == XOR
3063 && CONST_INT_P (XEXP (op0
, 1))
3064 && rtx_equal_p (XEXP (XEXP (op0
, 0), 0), trueop1
))
3067 rtx b
= XEXP (XEXP (op0
, 0), 1);
3068 rtx c
= XEXP (op0
, 1);
3069 rtx nc
= simplify_gen_unary (NOT
, mode
, c
, mode
);
3070 rtx a_nc
= simplify_gen_binary (AND
, mode
, a
, nc
);
3071 rtx bc
= simplify_gen_binary (AND
, mode
, b
, c
);
3072 return simplify_gen_binary (IOR
, mode
, a_nc
, bc
);
3074 /* Similarly, (xor (and (xor A B) C) B) as (ior (and A C) (and B ~C)) */
3075 else if (GET_CODE (op0
) == AND
3076 && GET_CODE (XEXP (op0
, 0)) == XOR
3077 && CONST_INT_P (XEXP (op0
, 1))
3078 && rtx_equal_p (XEXP (XEXP (op0
, 0), 1), trueop1
))
3080 rtx a
= XEXP (XEXP (op0
, 0), 0);
3082 rtx c
= XEXP (op0
, 1);
3083 rtx nc
= simplify_gen_unary (NOT
, mode
, c
, mode
);
3084 rtx b_nc
= simplify_gen_binary (AND
, mode
, b
, nc
);
3085 rtx ac
= simplify_gen_binary (AND
, mode
, a
, c
);
3086 return simplify_gen_binary (IOR
, mode
, ac
, b_nc
);
3089 /* (xor (comparison foo bar) (const_int 1)) can become the reversed
3090 comparison if STORE_FLAG_VALUE is 1. */
3091 if (STORE_FLAG_VALUE
== 1
3092 && trueop1
== const1_rtx
3093 && COMPARISON_P (op0
)
3094 && (reversed
= reversed_comparison (op0
, mode
)))
3097 /* (lshiftrt foo C) where C is the number of bits in FOO minus 1
3098 is (lt foo (const_int 0)), so we can perform the above
3099 simplification if STORE_FLAG_VALUE is 1. */
3101 if (is_a
<scalar_int_mode
> (mode
, &int_mode
)
3102 && STORE_FLAG_VALUE
== 1
3103 && trueop1
== const1_rtx
3104 && GET_CODE (op0
) == LSHIFTRT
3105 && CONST_INT_P (XEXP (op0
, 1))
3106 && INTVAL (XEXP (op0
, 1)) == GET_MODE_PRECISION (int_mode
) - 1)
3107 return gen_rtx_GE (int_mode
, XEXP (op0
, 0), const0_rtx
);
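      /* Illustrative example (added for exposition): on a target where
	 STORE_FLAG_VALUE is 1,
	 (xor:SI (lshiftrt:SI x (const_int 31)) (const_int 1))
	 becomes (ge:SI x (const_int 0)).  */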
3109 /* (xor (comparison foo bar) (const_int sign-bit))
3110 when STORE_FLAG_VALUE is the sign bit. */
3111 if (is_a
<scalar_int_mode
> (mode
, &int_mode
)
3112 && val_signbit_p (int_mode
, STORE_FLAG_VALUE
)
3113 && trueop1
== const_true_rtx
3114 && COMPARISON_P (op0
)
3115 && (reversed
= reversed_comparison (op0
, int_mode
)))
3118 tem
= simplify_byte_swapping_operation (code
, mode
, op0
, op1
);
3122 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3128 if (trueop1
== CONST0_RTX (mode
) && ! side_effects_p (op0
))
3130 if (INTEGRAL_MODE_P (mode
) && trueop1
== CONSTM1_RTX (mode
))
3132 if (HWI_COMPUTABLE_MODE_P (mode
))
3134 HOST_WIDE_INT nzop0
= nonzero_bits (trueop0
, mode
);
3135 HOST_WIDE_INT nzop1
;
3136 if (CONST_INT_P (trueop1
))
3138 HOST_WIDE_INT val1
= INTVAL (trueop1
);
	      /* If we are turning off bits already known off in OP0, we need
		 not do an AND.  */
3141 if ((nzop0
& ~val1
) == 0)
3144 nzop1
= nonzero_bits (trueop1
, mode
);
3145 /* If we are clearing all the nonzero bits, the result is zero. */
3146 if ((nzop1
& nzop0
) == 0
3147 && !side_effects_p (op0
) && !side_effects_p (op1
))
3148 return CONST0_RTX (mode
);
3150 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
)
3151 && GET_MODE_CLASS (mode
) != MODE_CC
)
3154 if (((GET_CODE (op0
) == NOT
&& rtx_equal_p (XEXP (op0
, 0), op1
))
3155 || (GET_CODE (op1
) == NOT
&& rtx_equal_p (XEXP (op1
, 0), op0
)))
3156 && ! side_effects_p (op0
)
3157 && GET_MODE_CLASS (mode
) != MODE_CC
)
3158 return CONST0_RTX (mode
);
3160 /* Transform (and (extend X) C) into (zero_extend (and X C)) if
3161 there are no nonzero bits of C outside of X's mode. */
3162 if ((GET_CODE (op0
) == SIGN_EXTEND
3163 || GET_CODE (op0
) == ZERO_EXTEND
)
3164 && CONST_INT_P (trueop1
)
3165 && HWI_COMPUTABLE_MODE_P (mode
)
3166 && (~GET_MODE_MASK (GET_MODE (XEXP (op0
, 0)))
3167 & UINTVAL (trueop1
)) == 0)
3169 machine_mode imode
= GET_MODE (XEXP (op0
, 0));
3170 tem
= simplify_gen_binary (AND
, imode
, XEXP (op0
, 0),
3171 gen_int_mode (INTVAL (trueop1
),
3173 return simplify_gen_unary (ZERO_EXTEND
, mode
, tem
, imode
);
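      /* Illustrative example (added for exposition, assuming DImode is
	 HWI-computable on the host):
	 (and:DI (sign_extend:DI x:SI) (const_int 0xff)) becomes
	 (zero_extend:DI (and:SI x (const_int 0xff))), since the constant
	 has no bits set outside SImode.  */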
3176 /* Transform (and (truncate X) C) into (truncate (and X C)). This way
3177 we might be able to further simplify the AND with X and potentially
3178 remove the truncation altogether. */
3179 if (GET_CODE (op0
) == TRUNCATE
&& CONST_INT_P (trueop1
))
3181 rtx x
= XEXP (op0
, 0);
3182 machine_mode xmode
= GET_MODE (x
);
3183 tem
= simplify_gen_binary (AND
, xmode
, x
,
3184 gen_int_mode (INTVAL (trueop1
), xmode
));
3185 return simplify_gen_unary (TRUNCATE
, mode
, tem
, xmode
);
3188 /* Canonicalize (A | C1) & C2 as (A & C2) | (C1 & C2). */
3189 if (GET_CODE (op0
) == IOR
3190 && CONST_INT_P (trueop1
)
3191 && CONST_INT_P (XEXP (op0
, 1)))
3193 HOST_WIDE_INT tmp
= INTVAL (trueop1
) & INTVAL (XEXP (op0
, 1));
3194 return simplify_gen_binary (IOR
, mode
,
3195 simplify_gen_binary (AND
, mode
,
3196 XEXP (op0
, 0), op1
),
3197 gen_int_mode (tmp
, mode
));
3200 /* Convert (A ^ B) & A to A & (~B) since the latter is often a single
3201 insn (and may simplify more). */
3202 if (GET_CODE (op0
) == XOR
3203 && rtx_equal_p (XEXP (op0
, 0), op1
)
3204 && ! side_effects_p (op1
))
3205 return simplify_gen_binary (AND
, mode
,
3206 simplify_gen_unary (NOT
, mode
,
3207 XEXP (op0
, 1), mode
),
3210 if (GET_CODE (op0
) == XOR
3211 && rtx_equal_p (XEXP (op0
, 1), op1
)
3212 && ! side_effects_p (op1
))
3213 return simplify_gen_binary (AND
, mode
,
3214 simplify_gen_unary (NOT
, mode
,
3215 XEXP (op0
, 0), mode
),
3218 /* Similarly for (~(A ^ B)) & A. */
3219 if (GET_CODE (op0
) == NOT
3220 && GET_CODE (XEXP (op0
, 0)) == XOR
3221 && rtx_equal_p (XEXP (XEXP (op0
, 0), 0), op1
)
3222 && ! side_effects_p (op1
))
3223 return simplify_gen_binary (AND
, mode
, XEXP (XEXP (op0
, 0), 1), op1
);
3225 if (GET_CODE (op0
) == NOT
3226 && GET_CODE (XEXP (op0
, 0)) == XOR
3227 && rtx_equal_p (XEXP (XEXP (op0
, 0), 1), op1
)
3228 && ! side_effects_p (op1
))
3229 return simplify_gen_binary (AND
, mode
, XEXP (XEXP (op0
, 0), 0), op1
);
3231 /* Convert (A | B) & A to A. */
3232 if (GET_CODE (op0
) == IOR
3233 && (rtx_equal_p (XEXP (op0
, 0), op1
)
3234 || rtx_equal_p (XEXP (op0
, 1), op1
))
3235 && ! side_effects_p (XEXP (op0
, 0))
3236 && ! side_effects_p (XEXP (op0
, 1)))
3239 /* For constants M and N, if M == (1LL << cst) - 1 && (N & M) == M,
3240 ((A & N) + B) & M -> (A + B) & M
3241 Similarly if (N & M) == 0,
3242 ((A | N) + B) & M -> (A + B) & M
3243 and for - instead of + and/or ^ instead of |.
3244 Also, if (N & M) == 0, then
3245 (A +- N) & M -> A & M. */
3246 if (CONST_INT_P (trueop1
)
3247 && HWI_COMPUTABLE_MODE_P (mode
)
3248 && ~UINTVAL (trueop1
)
3249 && (UINTVAL (trueop1
) & (UINTVAL (trueop1
) + 1)) == 0
3250 && (GET_CODE (op0
) == PLUS
|| GET_CODE (op0
) == MINUS
))
3255 pmop
[0] = XEXP (op0
, 0);
3256 pmop
[1] = XEXP (op0
, 1);
3258 if (CONST_INT_P (pmop
[1])
3259 && (UINTVAL (pmop
[1]) & UINTVAL (trueop1
)) == 0)
3260 return simplify_gen_binary (AND
, mode
, pmop
[0], op1
);
3262 for (which
= 0; which
< 2; which
++)
3265 switch (GET_CODE (tem
))
3268 if (CONST_INT_P (XEXP (tem
, 1))
3269 && (UINTVAL (XEXP (tem
, 1)) & UINTVAL (trueop1
))
3270 == UINTVAL (trueop1
))
3271 pmop
[which
] = XEXP (tem
, 0);
3275 if (CONST_INT_P (XEXP (tem
, 1))
3276 && (UINTVAL (XEXP (tem
, 1)) & UINTVAL (trueop1
)) == 0)
3277 pmop
[which
] = XEXP (tem
, 0);
3284 if (pmop
[0] != XEXP (op0
, 0) || pmop
[1] != XEXP (op0
, 1))
3286 tem
= simplify_gen_binary (GET_CODE (op0
), mode
,
3288 return simplify_gen_binary (code
, mode
, tem
, op1
);
      /* (and X (ior (not X) Y)) -> (and X Y) */
3293 if (GET_CODE (op1
) == IOR
3294 && GET_CODE (XEXP (op1
, 0)) == NOT
3295 && rtx_equal_p (op0
, XEXP (XEXP (op1
, 0), 0)))
3296 return simplify_gen_binary (AND
, mode
, op0
, XEXP (op1
, 1));
3298 /* (and (ior (not X) Y) X) -> (and X Y) */
3299 if (GET_CODE (op0
) == IOR
3300 && GET_CODE (XEXP (op0
, 0)) == NOT
3301 && rtx_equal_p (op1
, XEXP (XEXP (op0
, 0), 0)))
3302 return simplify_gen_binary (AND
, mode
, op1
, XEXP (op0
, 1));
      /* (and X (ior Y (not X))) -> (and X Y) */
3305 if (GET_CODE (op1
) == IOR
3306 && GET_CODE (XEXP (op1
, 1)) == NOT
3307 && rtx_equal_p (op0
, XEXP (XEXP (op1
, 1), 0)))
3308 return simplify_gen_binary (AND
, mode
, op0
, XEXP (op1
, 0));
3310 /* (and (ior Y (not X)) X) -> (and X Y) */
3311 if (GET_CODE (op0
) == IOR
3312 && GET_CODE (XEXP (op0
, 1)) == NOT
3313 && rtx_equal_p (op1
, XEXP (XEXP (op0
, 1), 0)))
3314 return simplify_gen_binary (AND
, mode
, op1
, XEXP (op0
, 0));
3316 tem
= simplify_byte_swapping_operation (code
, mode
, op0
, op1
);
3320 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3326 /* 0/x is 0 (or x&0 if x has side-effects). */
3327 if (trueop0
== CONST0_RTX (mode
)
3328 && !cfun
->can_throw_non_call_exceptions
)
3330 if (side_effects_p (op1
))
3331 return simplify_gen_binary (AND
, mode
, op1
, trueop0
);
3335 if (trueop1
== CONST1_RTX (mode
))
3337 tem
= rtl_hooks
.gen_lowpart_no_emit (mode
, op0
);
3341 /* Convert divide by power of two into shift. */
3342 if (CONST_INT_P (trueop1
)
3343 && (val
= exact_log2 (UINTVAL (trueop1
))) > 0)
3344 return simplify_gen_binary (LSHIFTRT
, mode
, op0
,
3345 gen_int_shift_amount (mode
, val
));
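      /* Illustrative example (added for exposition):
	 (udiv:SI x (const_int 8)) becomes (lshiftrt:SI x (const_int 3)).  */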
3349 /* Handle floating point and integers separately. */
3350 if (SCALAR_FLOAT_MODE_P (mode
))
3352 /* Maybe change 0.0 / x to 0.0. This transformation isn't
3353 safe for modes with NaNs, since 0.0 / 0.0 will then be
3354 NaN rather than 0.0. Nor is it safe for modes with signed
3355 zeros, since dividing 0 by a negative number gives -0.0 */
3356 if (trueop0
== CONST0_RTX (mode
)
3357 && !HONOR_NANS (mode
)
3358 && !HONOR_SIGNED_ZEROS (mode
)
3359 && ! side_effects_p (op1
))
3362 if (trueop1
== CONST1_RTX (mode
)
3363 && !HONOR_SNANS (mode
))
3366 if (CONST_DOUBLE_AS_FLOAT_P (trueop1
)
3367 && trueop1
!= CONST0_RTX (mode
))
3369 const REAL_VALUE_TYPE
*d1
= CONST_DOUBLE_REAL_VALUE (trueop1
);
3372 if (real_equal (d1
, &dconstm1
)
3373 && !HONOR_SNANS (mode
))
3374 return simplify_gen_unary (NEG
, mode
, op0
, mode
);
3376 /* Change FP division by a constant into multiplication.
3377 Only do this with -freciprocal-math. */
3378 if (flag_reciprocal_math
3379 && !real_equal (d1
, &dconst0
))
3382 real_arithmetic (&d
, RDIV_EXPR
, &dconst1
, d1
);
3383 tem
= const_double_from_real_value (d
, mode
);
3384 return simplify_gen_binary (MULT
, mode
, op0
, tem
);
3388 else if (SCALAR_INT_MODE_P (mode
))
3390 /* 0/x is 0 (or x&0 if x has side-effects). */
3391 if (trueop0
== CONST0_RTX (mode
)
3392 && !cfun
->can_throw_non_call_exceptions
)
3394 if (side_effects_p (op1
))
3395 return simplify_gen_binary (AND
, mode
, op1
, trueop0
);
3399 if (trueop1
== CONST1_RTX (mode
))
3401 tem
= rtl_hooks
.gen_lowpart_no_emit (mode
, op0
);
3406 if (trueop1
== constm1_rtx
)
3408 rtx x
= rtl_hooks
.gen_lowpart_no_emit (mode
, op0
);
3410 return simplify_gen_unary (NEG
, mode
, x
, mode
);
3416 /* 0%x is 0 (or x&0 if x has side-effects). */
3417 if (trueop0
== CONST0_RTX (mode
))
3419 if (side_effects_p (op1
))
3420 return simplify_gen_binary (AND
, mode
, op1
, trueop0
);
      /* x%1 is 0 (or x&0 if x has side-effects).  */
3424 if (trueop1
== CONST1_RTX (mode
))
3426 if (side_effects_p (op0
))
3427 return simplify_gen_binary (AND
, mode
, op0
, CONST0_RTX (mode
));
3428 return CONST0_RTX (mode
);
3430 /* Implement modulus by power of two as AND. */
3431 if (CONST_INT_P (trueop1
)
3432 && exact_log2 (UINTVAL (trueop1
)) > 0)
	return simplify_gen_binary (AND, mode, op0,
				    gen_int_mode (UINTVAL (trueop1) - 1,
						  mode));
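      /* Illustrative example (added for exposition):
	 (umod:SI x (const_int 16)) becomes (and:SI x (const_int 15)).  */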
3439 /* 0%x is 0 (or x&0 if x has side-effects). */
3440 if (trueop0
== CONST0_RTX (mode
))
3442 if (side_effects_p (op1
))
3443 return simplify_gen_binary (AND
, mode
, op1
, trueop0
);
      /* x%1 and x%-1 are 0 (or x&0 if x has side-effects).  */
3447 if (trueop1
== CONST1_RTX (mode
) || trueop1
== constm1_rtx
)
3449 if (side_effects_p (op0
))
3450 return simplify_gen_binary (AND
, mode
, op0
, CONST0_RTX (mode
));
3451 return CONST0_RTX (mode
);
      /* Canonicalize rotates by constant amount.  If op1 is bitsize / 2,
	 prefer left rotation, if op1 is from bitsize / 2 + 1 to
	 bitsize - 1, use other direction of rotate with 1 .. bitsize / 2 - 1
	 amount instead.  */
3461 #if defined(HAVE_rotate) && defined(HAVE_rotatert)
3462 if (CONST_INT_P (trueop1
)
3463 && IN_RANGE (INTVAL (trueop1
),
3464 GET_MODE_UNIT_PRECISION (mode
) / 2 + (code
== ROTATE
),
3465 GET_MODE_UNIT_PRECISION (mode
) - 1))
3467 int new_amount
= GET_MODE_UNIT_PRECISION (mode
) - INTVAL (trueop1
);
3468 rtx new_amount_rtx
= gen_int_shift_amount (mode
, new_amount
);
3469 return simplify_gen_binary (code
== ROTATE
? ROTATERT
: ROTATE
,
3470 mode
, op0
, new_amount_rtx
);
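      /* Illustrative example (added for exposition): in SImode,
	 (rotate x (const_int 25)) is canonicalized to
	 (rotatert x (const_int 7)), keeping the constant amount in the
	 low half of the range.  */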
3475 if (trueop1
== CONST0_RTX (mode
))
3477 if (trueop0
== CONST0_RTX (mode
) && ! side_effects_p (op1
))
3479 /* Rotating ~0 always results in ~0. */
3480 if (CONST_INT_P (trueop0
)
3481 && HWI_COMPUTABLE_MODE_P (mode
)
3482 && UINTVAL (trueop0
) == GET_MODE_MASK (mode
)
3483 && ! side_effects_p (op1
))
	return op0;

      /* Given:
	 scalar modes M1, M2
	 scalar constants c1, c2
	 size (M2) > size (M1)
	 c1 == size (M2) - size (M1)
	 optimize:
	 ([a|l]shiftrt:M1 (subreg:M1 (lshiftrt:M2 (reg:M2) (const_int <c1>))
			  <low_part>)
		      (const_int <c2>))
	 to:
	 (subreg:M1 ([a|l]shiftrt:M2 (reg:M2) (const_int <c1 + c2>))
		    <low_part>).  */
3499 if ((code
== ASHIFTRT
|| code
== LSHIFTRT
)
3500 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
3502 && CONST_INT_P (op1
)
3503 && GET_CODE (SUBREG_REG (op0
)) == LSHIFTRT
3504 && is_a
<scalar_int_mode
> (GET_MODE (SUBREG_REG (op0
)),
3506 && CONST_INT_P (XEXP (SUBREG_REG (op0
), 1))
3507 && GET_MODE_BITSIZE (inner_mode
) > GET_MODE_BITSIZE (int_mode
)
3508 && (INTVAL (XEXP (SUBREG_REG (op0
), 1))
3509 == GET_MODE_BITSIZE (inner_mode
) - GET_MODE_BITSIZE (int_mode
))
3510 && subreg_lowpart_p (op0
))
3512 rtx tmp
= gen_int_shift_amount
3513 (inner_mode
, INTVAL (XEXP (SUBREG_REG (op0
), 1)) + INTVAL (op1
));
3514 tmp
= simplify_gen_binary (code
, inner_mode
,
3515 XEXP (SUBREG_REG (op0
), 0),
3517 return lowpart_subreg (int_mode
, tmp
, inner_mode
);
3520 if (SHIFT_COUNT_TRUNCATED
&& CONST_INT_P (op1
))
3522 val
= INTVAL (op1
) & (GET_MODE_UNIT_PRECISION (mode
) - 1);
3523 if (val
!= INTVAL (op1
))
3524 return simplify_gen_binary (code
, mode
, op0
,
3525 gen_int_shift_amount (mode
, val
));
3532 if (trueop1
== CONST0_RTX (mode
))
3534 if (trueop0
== CONST0_RTX (mode
) && ! side_effects_p (op1
))
3536 goto canonicalize_shift
;
3539 if (trueop1
== CONST0_RTX (mode
))
3541 if (trueop0
== CONST0_RTX (mode
) && ! side_effects_p (op1
))
3543 /* Optimize (lshiftrt (clz X) C) as (eq X 0). */
3544 if (GET_CODE (op0
) == CLZ
3545 && is_a
<scalar_int_mode
> (GET_MODE (XEXP (op0
, 0)), &inner_mode
)
3546 && CONST_INT_P (trueop1
)
3547 && STORE_FLAG_VALUE
== 1
3548 && INTVAL (trueop1
) < GET_MODE_UNIT_PRECISION (mode
))
3550 unsigned HOST_WIDE_INT zero_val
= 0;
3552 if (CLZ_DEFINED_VALUE_AT_ZERO (inner_mode
, zero_val
)
3553 && zero_val
== GET_MODE_PRECISION (inner_mode
)
3554 && INTVAL (trueop1
) == exact_log2 (zero_val
))
3555 return simplify_gen_relational (EQ
, mode
, inner_mode
,
3556 XEXP (op0
, 0), const0_rtx
);
3558 goto canonicalize_shift
;
3561 if (HWI_COMPUTABLE_MODE_P (mode
)
3562 && mode_signbit_p (mode
, trueop1
)
3563 && ! side_effects_p (op0
))
3565 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
))
3567 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3573 if (HWI_COMPUTABLE_MODE_P (mode
)
3574 && CONST_INT_P (trueop1
)
3575 && (UINTVAL (trueop1
) == GET_MODE_MASK (mode
) >> 1)
3576 && ! side_effects_p (op0
))
3578 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
))
3580 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3586 if (trueop1
== CONST0_RTX (mode
) && ! side_effects_p (op0
))
3588 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
))
3590 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3596 if (trueop1
== constm1_rtx
&& ! side_effects_p (op0
))
3598 if (rtx_equal_p (trueop0
, trueop1
) && ! side_effects_p (op0
))
3600 tem
= simplify_associative_operation (code
, mode
, op0
, op1
);
3613 /* ??? There are simplifications that can be done. */
3617 if (op1
== CONST0_RTX (GET_MODE_INNER (mode
)))
3618 return gen_vec_duplicate (mode
, op0
);
3619 if (valid_for_const_vector_p (mode
, op0
)
3620 && valid_for_const_vector_p (mode
, op1
))
3621 return gen_const_vec_series (mode
, op0
, op1
);
3625 if (!VECTOR_MODE_P (mode
))
3627 gcc_assert (VECTOR_MODE_P (GET_MODE (trueop0
)));
3628 gcc_assert (mode
== GET_MODE_INNER (GET_MODE (trueop0
)));
3629 gcc_assert (GET_CODE (trueop1
) == PARALLEL
);
3630 gcc_assert (XVECLEN (trueop1
, 0) == 1);
3632 /* We can't reason about selections made at runtime. */
3633 if (!CONST_INT_P (XVECEXP (trueop1
, 0, 0)))
3636 if (vec_duplicate_p (trueop0
, &elt0
))
3639 if (GET_CODE (trueop0
) == CONST_VECTOR
)
3640 return CONST_VECTOR_ELT (trueop0
, INTVAL (XVECEXP
3643 /* Extract a scalar element from a nested VEC_SELECT expression
3644 (with optional nested VEC_CONCAT expression). Some targets
3645 (i386) extract scalar element from a vector using chain of
3646 nested VEC_SELECT expressions. When input operand is a memory
3647 operand, this operation can be simplified to a simple scalar
3648 load from an offseted memory address. */
3650 if (GET_CODE (trueop0
) == VEC_SELECT
3651 && (GET_MODE_NUNITS (GET_MODE (XEXP (trueop0
, 0)))
3652 .is_constant (&n_elts
)))
3654 rtx op0
= XEXP (trueop0
, 0);
3655 rtx op1
= XEXP (trueop0
, 1);
3657 int i
= INTVAL (XVECEXP (trueop1
, 0, 0));
3663 gcc_assert (GET_CODE (op1
) == PARALLEL
);
3664 gcc_assert (i
< n_elts
);
3666 /* Select element, pointed by nested selector. */
3667 elem
= INTVAL (XVECEXP (op1
, 0, i
));
3669 /* Handle the case when nested VEC_SELECT wraps VEC_CONCAT. */
3670 if (GET_CODE (op0
) == VEC_CONCAT
)
3672 rtx op00
= XEXP (op0
, 0);
3673 rtx op01
= XEXP (op0
, 1);
3675 machine_mode mode00
, mode01
;
3676 int n_elts00
, n_elts01
;
3678 mode00
= GET_MODE (op00
);
3679 mode01
= GET_MODE (op01
);
3681 /* Find out the number of elements of each operand.
3682 Since the concatenated result has a constant number
3683 of elements, the operands must too. */
3684 n_elts00
= GET_MODE_NUNITS (mode00
).to_constant ();
3685 n_elts01
= GET_MODE_NUNITS (mode01
).to_constant ();
3687 gcc_assert (n_elts
== n_elts00
+ n_elts01
);
3689 /* Select correct operand of VEC_CONCAT
3690 and adjust selector. */
3691 if (elem
< n_elts01
)
3702 vec
= rtvec_alloc (1);
3703 RTVEC_ELT (vec
, 0) = GEN_INT (elem
);
3705 tmp
= gen_rtx_fmt_ee (code
, mode
,
3706 tmp_op
, gen_rtx_PARALLEL (VOIDmode
, vec
));
3712 gcc_assert (VECTOR_MODE_P (GET_MODE (trueop0
)));
3713 gcc_assert (GET_MODE_INNER (mode
)
3714 == GET_MODE_INNER (GET_MODE (trueop0
)));
3715 gcc_assert (GET_CODE (trueop1
) == PARALLEL
);
3717 if (vec_duplicate_p (trueop0
, &elt0
))
3718 /* It doesn't matter which elements are selected by trueop1,
3719 because they are all the same. */
3720 return gen_vec_duplicate (mode
, elt0
);
3722 if (GET_CODE (trueop0
) == CONST_VECTOR
)
3724 unsigned n_elts
= XVECLEN (trueop1
, 0);
3725 rtvec v
= rtvec_alloc (n_elts
);
3728 gcc_assert (known_eq (n_elts
, GET_MODE_NUNITS (mode
)));
3729 for (i
= 0; i
< n_elts
; i
++)
3731 rtx x
= XVECEXP (trueop1
, 0, i
);
3733 if (!CONST_INT_P (x
))
3736 RTVEC_ELT (v
, i
) = CONST_VECTOR_ELT (trueop0
,
3740 return gen_rtx_CONST_VECTOR (mode
, v
);
3743 /* Recognize the identity. */
3744 if (GET_MODE (trueop0
) == mode
)
3746 bool maybe_ident
= true;
3747 for (int i
= 0; i
< XVECLEN (trueop1
, 0); i
++)
3749 rtx j
= XVECEXP (trueop1
, 0, i
);
3750 if (!CONST_INT_P (j
) || INTVAL (j
) != i
)
3752 maybe_ident
= false;
3760 /* If we build {a,b} then permute it, build the result directly. */
3761 if (XVECLEN (trueop1
, 0) == 2
3762 && CONST_INT_P (XVECEXP (trueop1
, 0, 0))
3763 && CONST_INT_P (XVECEXP (trueop1
, 0, 1))
3764 && GET_CODE (trueop0
) == VEC_CONCAT
3765 && GET_CODE (XEXP (trueop0
, 0)) == VEC_CONCAT
3766 && GET_MODE (XEXP (trueop0
, 0)) == mode
3767 && GET_CODE (XEXP (trueop0
, 1)) == VEC_CONCAT
3768 && GET_MODE (XEXP (trueop0
, 1)) == mode
)
3770 unsigned int i0
= INTVAL (XVECEXP (trueop1
, 0, 0));
3771 unsigned int i1
= INTVAL (XVECEXP (trueop1
, 0, 1));
3774 gcc_assert (i0
< 4 && i1
< 4);
3775 subop0
= XEXP (XEXP (trueop0
, i0
/ 2), i0
% 2);
3776 subop1
= XEXP (XEXP (trueop0
, i1
/ 2), i1
% 2);
3778 return simplify_gen_binary (VEC_CONCAT
, mode
, subop0
, subop1
);
3781 if (XVECLEN (trueop1
, 0) == 2
3782 && CONST_INT_P (XVECEXP (trueop1
, 0, 0))
3783 && CONST_INT_P (XVECEXP (trueop1
, 0, 1))
3784 && GET_CODE (trueop0
) == VEC_CONCAT
3785 && GET_MODE (trueop0
) == mode
)
3787 unsigned int i0
= INTVAL (XVECEXP (trueop1
, 0, 0));
3788 unsigned int i1
= INTVAL (XVECEXP (trueop1
, 0, 1));
3791 gcc_assert (i0
< 2 && i1
< 2);
3792 subop0
= XEXP (trueop0
, i0
);
3793 subop1
= XEXP (trueop0
, i1
);
3795 return simplify_gen_binary (VEC_CONCAT
, mode
, subop0
, subop1
);
3798 /* If we select one half of a vec_concat, return that. */
3800 if (GET_CODE (trueop0
) == VEC_CONCAT
3801 && (GET_MODE_NUNITS (GET_MODE (XEXP (trueop0
, 0)))
3803 && (GET_MODE_NUNITS (GET_MODE (XEXP (trueop0
, 1)))
3805 && CONST_INT_P (XVECEXP (trueop1
, 0, 0)))
3807 rtx subop0
= XEXP (trueop0
, 0);
3808 rtx subop1
= XEXP (trueop0
, 1);
3809 machine_mode mode0
= GET_MODE (subop0
);
3810 machine_mode mode1
= GET_MODE (subop1
);
3811 int i0
= INTVAL (XVECEXP (trueop1
, 0, 0));
3812 if (i0
== 0 && !side_effects_p (op1
) && mode
== mode0
)
3814 bool success
= true;
3815 for (int i
= 1; i
< l0
; ++i
)
3817 rtx j
= XVECEXP (trueop1
, 0, i
);
3818 if (!CONST_INT_P (j
) || INTVAL (j
) != i
)
3827 if (i0
== l0
&& !side_effects_p (op0
) && mode
== mode1
)
3829 bool success
= true;
3830 for (int i
= 1; i
< l1
; ++i
)
3832 rtx j
= XVECEXP (trueop1
, 0, i
);
3833 if (!CONST_INT_P (j
) || INTVAL (j
) != i0
+ i
)
3845 if (XVECLEN (trueop1
, 0) == 1
3846 && CONST_INT_P (XVECEXP (trueop1
, 0, 0))
3847 && GET_CODE (trueop0
) == VEC_CONCAT
)
3850 offset
= INTVAL (XVECEXP (trueop1
, 0, 0)) * GET_MODE_SIZE (mode
);
3852 /* Try to find the element in the VEC_CONCAT. */
3853 while (GET_MODE (vec
) != mode
3854 && GET_CODE (vec
) == VEC_CONCAT
)
3856 poly_int64 vec_size
;
3858 if (CONST_INT_P (XEXP (vec
, 0)))
3860 /* vec_concat of two const_ints doesn't make sense with
3861 respect to modes. */
3862 if (CONST_INT_P (XEXP (vec
, 1)))
3865 vec_size
= GET_MODE_SIZE (GET_MODE (trueop0
))
3866 - GET_MODE_SIZE (GET_MODE (XEXP (vec
, 1)));
3869 vec_size
= GET_MODE_SIZE (GET_MODE (XEXP (vec
, 0)));
3871 if (known_lt (offset
, vec_size
))
3872 vec
= XEXP (vec
, 0);
3873 else if (known_ge (offset
, vec_size
))
3876 vec
= XEXP (vec
, 1);
3880 vec
= avoid_constant_pool_reference (vec
);
3883 if (GET_MODE (vec
) == mode
)
3887 /* If we select elements in a vec_merge that all come from the same
3888 operand, select from that operand directly. */
3889 if (GET_CODE (op0
) == VEC_MERGE
)
3891 rtx trueop02
= avoid_constant_pool_reference (XEXP (op0
, 2));
3892 if (CONST_INT_P (trueop02
))
3894 unsigned HOST_WIDE_INT sel
= UINTVAL (trueop02
);
3895 bool all_operand0
= true;
3896 bool all_operand1
= true;
3897 for (int i
= 0; i
< XVECLEN (trueop1
, 0); i
++)
3899 rtx j
= XVECEXP (trueop1
, 0, i
);
3900 if (sel
& (HOST_WIDE_INT_1U
<< UINTVAL (j
)))
3901 all_operand1
= false;
3903 all_operand0
= false;
3905 if (all_operand0
&& !side_effects_p (XEXP (op0
, 1)))
3906 return simplify_gen_binary (VEC_SELECT
, mode
, XEXP (op0
, 0), op1
);
3907 if (all_operand1
&& !side_effects_p (XEXP (op0
, 0)))
3908 return simplify_gen_binary (VEC_SELECT
, mode
, XEXP (op0
, 1), op1
);
3912 /* If we have two nested selects that are inverses of each
3913 other, replace them with the source operand. */
3914 if (GET_CODE (trueop0
) == VEC_SELECT
3915 && GET_MODE (XEXP (trueop0
, 0)) == mode
)
3917 rtx op0_subop1
= XEXP (trueop0
, 1);
3918 gcc_assert (GET_CODE (op0_subop1
) == PARALLEL
);
3919 gcc_assert (known_eq (XVECLEN (trueop1
, 0), GET_MODE_NUNITS (mode
)));
3921 /* Apply the outer ordering vector to the inner one. (The inner
3922 ordering vector is expressly permitted to be of a different
3923 length than the outer one.) If the result is { 0, 1, ..., n-1 }
3924 then the two VEC_SELECTs cancel. */
3925 for (int i
= 0; i
< XVECLEN (trueop1
, 0); ++i
)
3927 rtx x
= XVECEXP (trueop1
, 0, i
);
3928 if (!CONST_INT_P (x
))
3930 rtx y
= XVECEXP (op0_subop1
, 0, INTVAL (x
));
3931 if (!CONST_INT_P (y
) || i
!= INTVAL (y
))
3934 return XEXP (trueop0
, 0);
3940 machine_mode op0_mode
= (GET_MODE (trueop0
) != VOIDmode
3941 ? GET_MODE (trueop0
)
3942 : GET_MODE_INNER (mode
));
3943 machine_mode op1_mode
= (GET_MODE (trueop1
) != VOIDmode
3944 ? GET_MODE (trueop1
)
3945 : GET_MODE_INNER (mode
));
3947 gcc_assert (VECTOR_MODE_P (mode
));
3948 gcc_assert (known_eq (GET_MODE_SIZE (op0_mode
)
3949 + GET_MODE_SIZE (op1_mode
),
3950 GET_MODE_SIZE (mode
)));
3952 if (VECTOR_MODE_P (op0_mode
))
3953 gcc_assert (GET_MODE_INNER (mode
)
3954 == GET_MODE_INNER (op0_mode
));
3956 gcc_assert (GET_MODE_INNER (mode
) == op0_mode
);
3958 if (VECTOR_MODE_P (op1_mode
))
3959 gcc_assert (GET_MODE_INNER (mode
)
3960 == GET_MODE_INNER (op1_mode
));
3962 gcc_assert (GET_MODE_INNER (mode
) == op1_mode
);
3964 unsigned int n_elts
, in_n_elts
;
3965 if ((GET_CODE (trueop0
) == CONST_VECTOR
3966 || CONST_SCALAR_INT_P (trueop0
)
3967 || CONST_DOUBLE_AS_FLOAT_P (trueop0
))
3968 && (GET_CODE (trueop1
) == CONST_VECTOR
3969 || CONST_SCALAR_INT_P (trueop1
)
3970 || CONST_DOUBLE_AS_FLOAT_P (trueop1
))
3971 && GET_MODE_NUNITS (mode
).is_constant (&n_elts
)
3972 && GET_MODE_NUNITS (op0_mode
).is_constant (&in_n_elts
))
3974 rtvec v
= rtvec_alloc (n_elts
);
3976 for (i
= 0; i
< n_elts
; i
++)
3980 if (!VECTOR_MODE_P (op0_mode
))
3981 RTVEC_ELT (v
, i
) = trueop0
;
3983 RTVEC_ELT (v
, i
) = CONST_VECTOR_ELT (trueop0
, i
);
3987 if (!VECTOR_MODE_P (op1_mode
))
3988 RTVEC_ELT (v
, i
) = trueop1
;
3990 RTVEC_ELT (v
, i
) = CONST_VECTOR_ELT (trueop1
,
3995 return gen_rtx_CONST_VECTOR (mode
, v
);
3998 /* Try to merge two VEC_SELECTs from the same vector into a single one.
3999 Restrict the transformation to avoid generating a VEC_SELECT with a
4000 mode unrelated to its operand. */
4001 if (GET_CODE (trueop0
) == VEC_SELECT
4002 && GET_CODE (trueop1
) == VEC_SELECT
4003 && rtx_equal_p (XEXP (trueop0
, 0), XEXP (trueop1
, 0))
4004 && GET_MODE (XEXP (trueop0
, 0)) == mode
)
4006 rtx par0
= XEXP (trueop0
, 1);
4007 rtx par1
= XEXP (trueop1
, 1);
4008 int len0
= XVECLEN (par0
, 0);
4009 int len1
= XVECLEN (par1
, 0);
4010 rtvec vec
= rtvec_alloc (len0
+ len1
);
4011 for (int i
= 0; i
< len0
; i
++)
4012 RTVEC_ELT (vec
, i
) = XVECEXP (par0
, 0, i
);
4013 for (int i
= 0; i
< len1
; i
++)
4014 RTVEC_ELT (vec
, len0
+ i
) = XVECEXP (par1
, 0, i
);
4015 return simplify_gen_binary (VEC_SELECT
, mode
, XEXP (trueop0
, 0),
4016 gen_rtx_PARALLEL (VOIDmode
, vec
));
4025 if (mode
== GET_MODE (op0
)
4026 && mode
== GET_MODE (op1
)
4027 && vec_duplicate_p (op0
, &elt0
)
4028 && vec_duplicate_p (op1
, &elt1
))
      /* Try applying the operator to ELT and see if that simplifies.
	 We can duplicate the result if so.

	 The reason we don't use simplify_gen_binary is that it isn't
	 necessarily a win to convert things like:

	   (plus:V (vec_duplicate:V (reg:S R1))
		   (vec_duplicate:V (reg:S R2)))

	 to:

	   (vec_duplicate:V (plus:S (reg:S R1) (reg:S R2)))

	 The first might be done entirely in vector registers while the
	 second might need a move between register files.  */
      tem = simplify_binary_operation (code, GET_MODE_INNER (mode),
				       elt0, elt1);
      if (tem)
	return gen_vec_duplicate (mode, tem);
/* Return true if binary operation OP distributes over addition in operand
   OPNO, with the other operand being held constant.  OPNO counts from 1.  */

static bool
distributes_over_addition_p (rtx_code op, int opno)
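/* For example, MULT distributes over addition in both operands, since
   (a + b) * c == a * c + b * c in modular arithmetic, while ASHIFT
   distributes only in operand 1: (a + b) << c == (a << c) + (b << c),
   but c << (a + b) has no such expansion.  Bitwise AND, by contrast,
   does not distribute over addition in either operand.  */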
rtx
simplify_const_binary_operation (enum rtx_code code, machine_mode mode,
				 rtx op0, rtx op1)
{
  if (VECTOR_MODE_P (mode)
      && code != VEC_CONCAT
      && GET_CODE (op0) == CONST_VECTOR
      && GET_CODE (op1) == CONST_VECTOR)
    {
      bool step_ok_p = true;
      if (CONST_VECTOR_STEPPED_P (op0)
	  && CONST_VECTOR_STEPPED_P (op1))
	/* We can operate directly on the encoding if:

	     a3 - a2 == a2 - a1 && b3 - b2 == b2 - b1

	   implies

	     (a3 op b3) - (a2 op b2) == (a2 op b2) - (a1 op b1)

	   Addition and subtraction are the supported operators
	   for which this is true.  */
	step_ok_p = (code == PLUS || code == MINUS);
      else if (CONST_VECTOR_STEPPED_P (op0))
	/* We can operate directly on stepped encodings if:

	     a3 - a2 == a2 - a1

	   implies:

	     (a3 op c) - (a2 op c) == (a2 op c) - (a1 op c)

	   which is true if (x -> x op c) distributes over addition.  */
	step_ok_p = distributes_over_addition_p (code, 1);
      else if (CONST_VECTOR_STEPPED_P (op1))
	/* Similarly in reverse.  */
	step_ok_p = distributes_over_addition_p (code, 2);
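      /* For example, under this scheme a stepped V4SI constant such as
	 { 1, 2, 3, 4 } added to the duplicated constant { 10, 10, 10, 10 }
	 folds elementwise into { 11, 12, 13, 14 }, which is again a valid
	 stepped encoding, so only the encoded elements need computing.  */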
      rtx_vector_builder builder;
      if (!builder.new_binary_operation (mode, op0, op1, step_ok_p))
	return NULL_RTX;

      unsigned int count = builder.encoded_nelts ();
      for (unsigned int i = 0; i < count; i++)
	{
	  rtx x = simplify_binary_operation (code, GET_MODE_INNER (mode),
					     CONST_VECTOR_ELT (op0, i),
					     CONST_VECTOR_ELT (op1, i));
	  if (!x || !valid_for_const_vector_p (mode, x))
	    return 0;
	  builder.quick_push (x);
	}
      return builder.build ();
    }
  if (VECTOR_MODE_P (mode)
      && code == VEC_CONCAT
      && (CONST_SCALAR_INT_P (op0)
	  || CONST_FIXED_P (op0)
	  || CONST_DOUBLE_AS_FLOAT_P (op0))
      && (CONST_SCALAR_INT_P (op1)
	  || CONST_DOUBLE_AS_FLOAT_P (op1)
	  || CONST_FIXED_P (op1)))
    {
      /* Both inputs have a constant number of elements, so the result
	 must too.  */
      unsigned n_elts = GET_MODE_NUNITS (mode).to_constant ();
      rtvec v = rtvec_alloc (n_elts);

      gcc_assert (n_elts >= 2);
      if (n_elts == 2)
	{
	  gcc_assert (GET_CODE (op0) != CONST_VECTOR);
	  gcc_assert (GET_CODE (op1) != CONST_VECTOR);

	  RTVEC_ELT (v, 0) = op0;
	  RTVEC_ELT (v, 1) = op1;
	}
      else
	{
	  unsigned op0_n_elts = GET_MODE_NUNITS (GET_MODE (op0)).to_constant ();
	  unsigned op1_n_elts = GET_MODE_NUNITS (GET_MODE (op1)).to_constant ();
	  unsigned i;

	  gcc_assert (GET_CODE (op0) == CONST_VECTOR);
	  gcc_assert (GET_CODE (op1) == CONST_VECTOR);
	  gcc_assert (op0_n_elts + op1_n_elts == n_elts);

	  for (i = 0; i < op0_n_elts; ++i)
	    RTVEC_ELT (v, i) = CONST_VECTOR_ELT (op0, i);
	  for (i = 0; i < op1_n_elts; ++i)
	    RTVEC_ELT (v, op0_n_elts + i) = CONST_VECTOR_ELT (op1, i);
	}

      return gen_rtx_CONST_VECTOR (mode, v);
    }
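  /* For instance, (vec_concat:V2SI (const_int 1) (const_int 2)) folds to
     the constant vector [1, 2], and concatenating two two-element constant
     vectors yields the corresponding four-element constant vector.  */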
4167 if (SCALAR_FLOAT_MODE_P (mode
)
4168 && CONST_DOUBLE_AS_FLOAT_P (op0
)
4169 && CONST_DOUBLE_AS_FLOAT_P (op1
)
4170 && mode
== GET_MODE (op0
) && mode
== GET_MODE (op1
))
4181 real_to_target (tmp0
, CONST_DOUBLE_REAL_VALUE (op0
),
4183 real_to_target (tmp1
, CONST_DOUBLE_REAL_VALUE (op1
),
4185 for (i
= 0; i
< 4; i
++)
4202 real_from_target (&r
, tmp0
, mode
);
4203 return const_double_from_real_value (r
, mode
);
4207 REAL_VALUE_TYPE f0
, f1
, value
, result
;
4208 const REAL_VALUE_TYPE
*opr0
, *opr1
;
4211 opr0
= CONST_DOUBLE_REAL_VALUE (op0
);
4212 opr1
= CONST_DOUBLE_REAL_VALUE (op1
);
4214 if (HONOR_SNANS (mode
)
4215 && (REAL_VALUE_ISSIGNALING_NAN (*opr0
)
4216 || REAL_VALUE_ISSIGNALING_NAN (*opr1
)))
4219 real_convert (&f0
, mode
, opr0
);
4220 real_convert (&f1
, mode
, opr1
);
4223 && real_equal (&f1
, &dconst0
)
4224 && (flag_trapping_math
|| ! MODE_HAS_INFINITIES (mode
)))
4227 if (MODE_HAS_INFINITIES (mode
) && HONOR_NANS (mode
)
4228 && flag_trapping_math
4229 && REAL_VALUE_ISINF (f0
) && REAL_VALUE_ISINF (f1
))
4231 int s0
= REAL_VALUE_NEGATIVE (f0
);
4232 int s1
= REAL_VALUE_NEGATIVE (f1
);
4237 /* Inf + -Inf = NaN plus exception. */
4242 /* Inf - Inf = NaN plus exception. */
4247 /* Inf / Inf = NaN plus exception. */
4254 if (code
== MULT
&& MODE_HAS_INFINITIES (mode
) && HONOR_NANS (mode
)
4255 && flag_trapping_math
4256 && ((REAL_VALUE_ISINF (f0
) && real_equal (&f1
, &dconst0
))
4257 || (REAL_VALUE_ISINF (f1
)
4258 && real_equal (&f0
, &dconst0
))))
4259 /* Inf * 0 = NaN plus exception. */
4262 inexact
= real_arithmetic (&value
, rtx_to_tree_code (code
),
4264 real_convert (&result
, mode
, &value
);
4266 /* Don't constant fold this floating point operation if
4267 the result has overflowed and flag_trapping_math. */
4269 if (flag_trapping_math
4270 && MODE_HAS_INFINITIES (mode
)
4271 && REAL_VALUE_ISINF (result
)
4272 && !REAL_VALUE_ISINF (f0
)
4273 && !REAL_VALUE_ISINF (f1
))
4274 /* Overflow plus exception. */
4277 /* Don't constant fold this floating point operation if the
4278 result may dependent upon the run-time rounding mode and
4279 flag_rounding_math is set, or if GCC's software emulation
4280 is unable to accurately represent the result. */
4282 if ((flag_rounding_math
4283 || (MODE_COMPOSITE_P (mode
) && !flag_unsafe_math_optimizations
))
4284 && (inexact
|| !real_identical (&result
, &value
)))
4287 return const_double_from_real_value (result
, mode
);
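      /* A concrete case of the flag_rounding_math guard above: folding
	 (div:DF 1.0 3.0) at compile time bakes in round-to-nearest, so
	 when -frounding-math says the run-time rounding mode may differ,
	 the inexact result is left unfolded rather than risk changing
	 the program's value.  */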
4291 /* We can fold some multi-word operations. */
4292 scalar_int_mode int_mode
;
4293 if (is_a
<scalar_int_mode
> (mode
, &int_mode
)
4294 && CONST_SCALAR_INT_P (op0
)
4295 && CONST_SCALAR_INT_P (op1
))
4298 wi::overflow_type overflow
;
4299 rtx_mode_t pop0
= rtx_mode_t (op0
, int_mode
);
4300 rtx_mode_t pop1
= rtx_mode_t (op1
, int_mode
);
#if TARGET_SUPPORTS_WIDE_INT == 0
      /* This assert keeps the simplification from producing a result
	 that cannot be represented in a CONST_DOUBLE, but a lot of
	 upstream callers expect that this function never fails to
	 simplify something, so if this check were added to the test
	 above the code would die later anyway.  If this assert
	 triggers, you just need to make the port support wide int.  */
      gcc_assert (GET_MODE_PRECISION (int_mode) <= HOST_BITS_PER_DOUBLE_INT);
#endif
4314 result
= wi::sub (pop0
, pop1
);
4318 result
= wi::add (pop0
, pop1
);
4322 result
= wi::mul (pop0
, pop1
);
4326 result
= wi::div_trunc (pop0
, pop1
, SIGNED
, &overflow
);
4332 result
= wi::mod_trunc (pop0
, pop1
, SIGNED
, &overflow
);
4338 result
= wi::div_trunc (pop0
, pop1
, UNSIGNED
, &overflow
);
4344 result
= wi::mod_trunc (pop0
, pop1
, UNSIGNED
, &overflow
);
4350 result
= wi::bit_and (pop0
, pop1
);
4354 result
= wi::bit_or (pop0
, pop1
);
4358 result
= wi::bit_xor (pop0
, pop1
);
4362 result
= wi::smin (pop0
, pop1
);
4366 result
= wi::smax (pop0
, pop1
);
4370 result
= wi::umin (pop0
, pop1
);
4374 result
= wi::umax (pop0
, pop1
);
4381 wide_int wop1
= pop1
;
4382 if (SHIFT_COUNT_TRUNCATED
)
4383 wop1
= wi::umod_trunc (wop1
, GET_MODE_PRECISION (int_mode
));
4384 else if (wi::geu_p (wop1
, GET_MODE_PRECISION (int_mode
)))
4390 result
= wi::lrshift (pop0
, wop1
);
4394 result
= wi::arshift (pop0
, wop1
);
4398 result
= wi::lshift (pop0
, wop1
);
4409 if (wi::neg_p (pop1
))
4415 result
= wi::lrotate (pop0
, pop1
);
4419 result
= wi::rrotate (pop0
, pop1
);
4430 return immed_wide_int_const (result
, int_mode
);
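      /* A worked example of the wi:: arithmetic above: in QImode (8-bit
	 precision), (mult (const_int 100) (const_int 3)) folds to
	 (const_int 44), because the 8-bit product wraps: 300 mod 256 = 44.
	 immed_wide_int_const then rebuilds the canonical constant.  */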
4433 /* Handle polynomial integers. */
4434 if (NUM_POLY_INT_COEFFS
> 1
4435 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
4436 && poly_int_rtx_p (op0
)
4437 && poly_int_rtx_p (op1
))
4439 poly_wide_int result
;
4443 result
= wi::to_poly_wide (op0
, mode
) + wi::to_poly_wide (op1
, mode
);
4447 result
= wi::to_poly_wide (op0
, mode
) - wi::to_poly_wide (op1
, mode
);
4451 if (CONST_SCALAR_INT_P (op1
))
4452 result
= wi::to_poly_wide (op0
, mode
) * rtx_mode_t (op1
, mode
);
4458 if (CONST_SCALAR_INT_P (op1
))
4460 wide_int shift
= rtx_mode_t (op1
, mode
);
4461 if (SHIFT_COUNT_TRUNCATED
)
4462 shift
= wi::umod_trunc (shift
, GET_MODE_PRECISION (int_mode
));
4463 else if (wi::geu_p (shift
, GET_MODE_PRECISION (int_mode
)))
4465 result
= wi::to_poly_wide (op0
, mode
) << shift
;
4472 if (!CONST_SCALAR_INT_P (op1
)
4473 || !can_ior_p (wi::to_poly_wide (op0
, mode
),
4474 rtx_mode_t (op1
, mode
), &result
))
4481 return immed_wide_int_const (result
, int_mode
);
/* Return a positive integer if X should sort after Y.  The value
   returned is 1 if and only if X and Y are both regs.  */

static int
simplify_plus_minus_op_data_cmp (rtx x, rtx y)
{
  int result;

  result = (commutative_operand_precedence (y)
	    - commutative_operand_precedence (x));
  if (result)
    return result + result;

  /* Group together equal REGs to do more simplification.  */
  if (REG_P (x) && REG_P (y))
    return REGNO (x) > REGNO (y);

  return 0;
}
/* Simplify and canonicalize a PLUS or MINUS, at least one of whose
   operands may be another PLUS or MINUS.

   Rather than testing for specific cases, we do this by a brute-force
   method and do all possible simplifications until no more changes occur.
   Then we rebuild the operation.

   May return NULL_RTX when no changes were made.  */
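/* As an illustration of the approach: the two operands of
   (minus (plus (reg A) (const_int 8)) (plus (reg A) (const_int 3)))
   are expanded into the flat list { +A, +8, -A, -3 }; the pairwise
   simplification pass then cancels +A against -A and folds the
   constants, so the whole expression collapses to (const_int 5).  */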
4519 simplify_plus_minus (enum rtx_code code
, machine_mode mode
, rtx op0
,
4522 struct simplify_plus_minus_op_data
4529 int changed
, n_constants
, canonicalized
= 0;
4532 memset (ops
, 0, sizeof ops
);
4534 /* Set up the two operands and then expand them until nothing has been
4535 changed. If we run out of room in our array, give up; this should
4536 almost never happen. */
4541 ops
[1].neg
= (code
== MINUS
);
4548 for (i
= 0; i
< n_ops
; i
++)
4550 rtx this_op
= ops
[i
].op
;
4551 int this_neg
= ops
[i
].neg
;
4552 enum rtx_code this_code
= GET_CODE (this_op
);
4558 if (n_ops
== ARRAY_SIZE (ops
))
4561 ops
[n_ops
].op
= XEXP (this_op
, 1);
4562 ops
[n_ops
].neg
= (this_code
== MINUS
) ^ this_neg
;
4565 ops
[i
].op
= XEXP (this_op
, 0);
4567 /* If this operand was negated then we will potentially
4568 canonicalize the expression. Similarly if we don't
4569 place the operands adjacent we're re-ordering the
4570 expression and thus might be performing a
4571 canonicalization. Ignore register re-ordering.
4572 ??? It might be better to shuffle the ops array here,
4573 but then (plus (plus (A, B), plus (C, D))) wouldn't
4574 be seen as non-canonical. */
4577 && !(REG_P (ops
[i
].op
) && REG_P (ops
[n_ops
- 1].op
))))
4582 ops
[i
].op
= XEXP (this_op
, 0);
4583 ops
[i
].neg
= ! this_neg
;
4589 if (n_ops
!= ARRAY_SIZE (ops
)
4590 && GET_CODE (XEXP (this_op
, 0)) == PLUS
4591 && CONSTANT_P (XEXP (XEXP (this_op
, 0), 0))
4592 && CONSTANT_P (XEXP (XEXP (this_op
, 0), 1)))
4594 ops
[i
].op
= XEXP (XEXP (this_op
, 0), 0);
4595 ops
[n_ops
].op
= XEXP (XEXP (this_op
, 0), 1);
4596 ops
[n_ops
].neg
= this_neg
;
4604 /* ~a -> (-a - 1) */
4605 if (n_ops
!= ARRAY_SIZE (ops
))
4607 ops
[n_ops
].op
= CONSTM1_RTX (mode
);
4608 ops
[n_ops
++].neg
= this_neg
;
4609 ops
[i
].op
= XEXP (this_op
, 0);
4610 ops
[i
].neg
= !this_neg
;
4616 CASE_CONST_SCALAR_INT
:
4617 case CONST_POLY_INT
:
4621 ops
[i
].op
= neg_poly_int_rtx (mode
, this_op
);
4635 if (n_constants
> 1)
4638 gcc_assert (n_ops
>= 2);
4640 /* If we only have two operands, we can avoid the loops. */
4643 enum rtx_code code
= ops
[0].neg
|| ops
[1].neg
? MINUS
: PLUS
;
4646 /* Get the two operands. Be careful with the order, especially for
4647 the cases where code == MINUS. */
4648 if (ops
[0].neg
&& ops
[1].neg
)
4650 lhs
= gen_rtx_NEG (mode
, ops
[0].op
);
4653 else if (ops
[0].neg
)
4664 return simplify_const_binary_operation (code
, mode
, lhs
, rhs
);
4667 /* Now simplify each pair of operands until nothing changes. */
4670 /* Insertion sort is good enough for a small array. */
4671 for (i
= 1; i
< n_ops
; i
++)
4673 struct simplify_plus_minus_op_data save
;
4677 cmp
= simplify_plus_minus_op_data_cmp (ops
[j
].op
, ops
[i
].op
);
4680 /* Just swapping registers doesn't count as canonicalization. */
4686 ops
[j
+ 1] = ops
[j
];
4688 && simplify_plus_minus_op_data_cmp (ops
[j
].op
, save
.op
) > 0);
4693 for (i
= n_ops
- 1; i
> 0; i
--)
4694 for (j
= i
- 1; j
>= 0; j
--)
4696 rtx lhs
= ops
[j
].op
, rhs
= ops
[i
].op
;
4697 int lneg
= ops
[j
].neg
, rneg
= ops
[i
].neg
;
4699 if (lhs
!= 0 && rhs
!= 0)
4701 enum rtx_code ncode
= PLUS
;
4707 std::swap (lhs
, rhs
);
4709 else if (swap_commutative_operands_p (lhs
, rhs
))
4710 std::swap (lhs
, rhs
);
4712 if ((GET_CODE (lhs
) == CONST
|| CONST_INT_P (lhs
))
4713 && (GET_CODE (rhs
) == CONST
|| CONST_INT_P (rhs
)))
4715 rtx tem_lhs
, tem_rhs
;
4717 tem_lhs
= GET_CODE (lhs
) == CONST
? XEXP (lhs
, 0) : lhs
;
4718 tem_rhs
= GET_CODE (rhs
) == CONST
? XEXP (rhs
, 0) : rhs
;
4719 tem
= simplify_binary_operation (ncode
, mode
, tem_lhs
,
4722 if (tem
&& !CONSTANT_P (tem
))
4723 tem
= gen_rtx_CONST (GET_MODE (tem
), tem
);
4726 tem
= simplify_binary_operation (ncode
, mode
, lhs
, rhs
);
		  /* Reject "simplifications" that just wrap the two
		     arguments in a CONST.  Failure to do so can result
		     in infinite recursion with simplify_binary_operation
		     when it calls us to simplify CONST operations.
		     Also, if we find such a simplification, don't try
		     any more combinations with this rhs: we must have
		     something like symbol+offset, i.e. one of the
		     trivial CONST expressions we handle later.  */
4738 if (GET_CODE (tem
) == CONST
4739 && GET_CODE (XEXP (tem
, 0)) == ncode
4740 && XEXP (XEXP (tem
, 0), 0) == lhs
4741 && XEXP (XEXP (tem
, 0), 1) == rhs
)
4744 if (GET_CODE (tem
) == NEG
)
4745 tem
= XEXP (tem
, 0), lneg
= !lneg
;
4746 if (poly_int_rtx_p (tem
) && lneg
)
4747 tem
= neg_poly_int_rtx (mode
, tem
), lneg
= 0;
4751 ops
[j
].op
= NULL_RTX
;
4761 /* Pack all the operands to the lower-numbered entries. */
4762 for (i
= 0, j
= 0; j
< n_ops
; j
++)
  /* If nothing changed, check whether rematerialization of rtl
     instructions is still required.  */
  /* Perform rematerialization only if all operands are registers and
     all operations are PLUS.  */
  /* ??? Also disallow (non-global, non-frame) fixed registers to work
     around rs6000 and how it uses the CA register.  See PR67145.  */
4779 for (i
= 0; i
< n_ops
; i
++)
4781 || !REG_P (ops
[i
].op
)
4782 || (REGNO (ops
[i
].op
) < FIRST_PSEUDO_REGISTER
4783 && fixed_regs
[REGNO (ops
[i
].op
)]
4784 && !global_regs
[REGNO (ops
[i
].op
)]
4785 && ops
[i
].op
!= frame_pointer_rtx
4786 && ops
[i
].op
!= arg_pointer_rtx
4787 && ops
[i
].op
!= stack_pointer_rtx
))
4792 /* Create (minus -C X) instead of (neg (const (plus X C))). */
4794 && CONST_INT_P (ops
[1].op
)
4795 && CONSTANT_P (ops
[0].op
)
4797 return gen_rtx_fmt_ee (MINUS
, mode
, ops
[1].op
, ops
[0].op
);
4799 /* We suppressed creation of trivial CONST expressions in the
4800 combination loop to avoid recursion. Create one manually now.
4801 The combination loop should have ensured that there is exactly
4802 one CONST_INT, and the sort will have ensured that it is last
4803 in the array and that any other constant will be next-to-last. */
4806 && poly_int_rtx_p (ops
[n_ops
- 1].op
)
4807 && CONSTANT_P (ops
[n_ops
- 2].op
))
4809 rtx value
= ops
[n_ops
- 1].op
;
4810 if (ops
[n_ops
- 1].neg
^ ops
[n_ops
- 2].neg
)
4811 value
= neg_poly_int_rtx (mode
, value
);
4812 if (CONST_INT_P (value
))
4814 ops
[n_ops
- 2].op
= plus_constant (mode
, ops
[n_ops
- 2].op
,
4820 /* Put a non-negated operand first, if possible. */
4822 for (i
= 0; i
< n_ops
&& ops
[i
].neg
; i
++)
4825 ops
[0].op
= gen_rtx_NEG (mode
, ops
[0].op
);
4834 /* Now make the result by performing the requested operations. */
4837 for (i
= 1; i
< n_ops
; i
++)
4838 result
= gen_rtx_fmt_ee (ops
[i
].neg
? MINUS
: PLUS
,
4839 mode
, result
, ops
[i
].op
);
4844 /* Check whether an operand is suitable for calling simplify_plus_minus. */
4846 plus_minus_operand_p (const_rtx x
)
4848 return GET_CODE (x
) == PLUS
4849 || GET_CODE (x
) == MINUS
4850 || (GET_CODE (x
) == CONST
4851 && GET_CODE (XEXP (x
, 0)) == PLUS
4852 && CONSTANT_P (XEXP (XEXP (x
, 0), 0))
4853 && CONSTANT_P (XEXP (XEXP (x
, 0), 1)));
/* Like simplify_binary_operation, but used for relational operators.
   MODE is the mode of the result.  If MODE is VOIDmode, the operands
   must not both be VOIDmode as well.

   CMP_MODE specifies the mode in which the comparison is done, so it is
   the mode of the operands.  If CMP_MODE is VOIDmode, it is taken from
   the operands or, if both are VOIDmode, the operands are compared in
   "infinite precision".  */
4865 simplify_relational_operation (enum rtx_code code
, machine_mode mode
,
4866 machine_mode cmp_mode
, rtx op0
, rtx op1
)
4868 rtx tem
, trueop0
, trueop1
;
4870 if (cmp_mode
== VOIDmode
)
4871 cmp_mode
= GET_MODE (op0
);
4872 if (cmp_mode
== VOIDmode
)
4873 cmp_mode
= GET_MODE (op1
);
4875 tem
= simplify_const_relational_operation (code
, cmp_mode
, op0
, op1
);
4878 if (SCALAR_FLOAT_MODE_P (mode
))
4880 if (tem
== const0_rtx
)
4881 return CONST0_RTX (mode
);
4882 #ifdef FLOAT_STORE_FLAG_VALUE
4884 REAL_VALUE_TYPE val
;
4885 val
= FLOAT_STORE_FLAG_VALUE (mode
);
4886 return const_double_from_real_value (val
, mode
);
4892 if (VECTOR_MODE_P (mode
))
4894 if (tem
== const0_rtx
)
4895 return CONST0_RTX (mode
);
4896 #ifdef VECTOR_STORE_FLAG_VALUE
4898 rtx val
= VECTOR_STORE_FLAG_VALUE (mode
);
4899 if (val
== NULL_RTX
)
4901 if (val
== const1_rtx
)
4902 return CONST1_RTX (mode
);
4904 return gen_const_vec_duplicate (mode
, val
);
4914 /* For the following tests, ensure const0_rtx is op1. */
4915 if (swap_commutative_operands_p (op0
, op1
)
4916 || (op0
== const0_rtx
&& op1
!= const0_rtx
))
4917 std::swap (op0
, op1
), code
= swap_condition (code
);
4919 /* If op0 is a compare, extract the comparison arguments from it. */
4920 if (GET_CODE (op0
) == COMPARE
&& op1
== const0_rtx
)
4921 return simplify_gen_relational (code
, mode
, VOIDmode
,
4922 XEXP (op0
, 0), XEXP (op0
, 1));
4924 if (GET_MODE_CLASS (cmp_mode
) == MODE_CC
4928 trueop0
= avoid_constant_pool_reference (op0
);
4929 trueop1
= avoid_constant_pool_reference (op1
);
4930 return simplify_relational_operation_1 (code
, mode
, cmp_mode
,
/* This part of simplify_relational_operation is only used when CMP_MODE
   is not in class MODE_CC (i.e. it is a real comparison).

   MODE is the mode of the result, while CMP_MODE specifies the mode in
   which the comparison is done, so it is the mode of the operands.  */
4941 simplify_relational_operation_1 (enum rtx_code code
, machine_mode mode
,
4942 machine_mode cmp_mode
, rtx op0
, rtx op1
)
4944 enum rtx_code op0code
= GET_CODE (op0
);
4946 if (op1
== const0_rtx
&& COMPARISON_P (op0
))
4948 /* If op0 is a comparison, extract the comparison arguments
4952 if (GET_MODE (op0
) == mode
)
4953 return simplify_rtx (op0
);
4955 return simplify_gen_relational (GET_CODE (op0
), mode
, VOIDmode
,
4956 XEXP (op0
, 0), XEXP (op0
, 1));
4958 else if (code
== EQ
)
4960 enum rtx_code new_code
= reversed_comparison_code (op0
, NULL
);
4961 if (new_code
!= UNKNOWN
)
4962 return simplify_gen_relational (new_code
, mode
, VOIDmode
,
4963 XEXP (op0
, 0), XEXP (op0
, 1));
4967 /* (LTU/GEU (PLUS a C) C), where C is constant, can be simplified to
4968 (GEU/LTU a -C). Likewise for (LTU/GEU (PLUS a C) a). */
4969 if ((code
== LTU
|| code
== GEU
)
4970 && GET_CODE (op0
) == PLUS
4971 && CONST_INT_P (XEXP (op0
, 1))
4972 && (rtx_equal_p (op1
, XEXP (op0
, 0))
4973 || rtx_equal_p (op1
, XEXP (op0
, 1)))
4974 /* (LTU/GEU (PLUS a 0) 0) is not the same as (GEU/LTU a 0). */
4975 && XEXP (op0
, 1) != const0_rtx
)
4978 = simplify_gen_unary (NEG
, cmp_mode
, XEXP (op0
, 1), cmp_mode
);
4979 return simplify_gen_relational ((code
== LTU
? GEU
: LTU
), mode
,
4980 cmp_mode
, XEXP (op0
, 0), new_cmp
);
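  /* For example, (ltu:SI (plus:SI (reg a) (const_int 4)) (const_int 4))
     becomes (geu:SI (reg a) (const_int -4)): the unsigned sum a + 4 is
     below 4 exactly when the addition wrapped, i.e. when a is one of the
     four largest unsigned values.  */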
4983 /* (GTU (PLUS a C) (C - 1)) where C is a non-zero constant can be
4984 transformed into (LTU a -C). */
4985 if (code
== GTU
&& GET_CODE (op0
) == PLUS
&& CONST_INT_P (op1
)
4986 && CONST_INT_P (XEXP (op0
, 1))
4987 && (UINTVAL (op1
) == UINTVAL (XEXP (op0
, 1)) - 1)
4988 && XEXP (op0
, 1) != const0_rtx
)
4991 = simplify_gen_unary (NEG
, cmp_mode
, XEXP (op0
, 1), cmp_mode
);
4992 return simplify_gen_relational (LTU
, mode
, cmp_mode
,
4993 XEXP (op0
, 0), new_cmp
);
4996 /* Canonicalize (LTU/GEU (PLUS a b) b) as (LTU/GEU (PLUS a b) a). */
4997 if ((code
== LTU
|| code
== GEU
)
4998 && GET_CODE (op0
) == PLUS
4999 && rtx_equal_p (op1
, XEXP (op0
, 1))
5000 /* Don't recurse "infinitely" for (LTU/GEU (PLUS b b) b). */
5001 && !rtx_equal_p (op1
, XEXP (op0
, 0)))
5002 return simplify_gen_relational (code
, mode
, cmp_mode
, op0
,
5003 copy_rtx (XEXP (op0
, 0)));
5005 if (op1
== const0_rtx
)
5007 /* Canonicalize (GTU x 0) as (NE x 0). */
5009 return simplify_gen_relational (NE
, mode
, cmp_mode
, op0
, op1
);
5010 /* Canonicalize (LEU x 0) as (EQ x 0). */
5012 return simplify_gen_relational (EQ
, mode
, cmp_mode
, op0
, op1
);
5014 else if (op1
== const1_rtx
)
5019 /* Canonicalize (GE x 1) as (GT x 0). */
5020 return simplify_gen_relational (GT
, mode
, cmp_mode
,
5023 /* Canonicalize (GEU x 1) as (NE x 0). */
5024 return simplify_gen_relational (NE
, mode
, cmp_mode
,
5027 /* Canonicalize (LT x 1) as (LE x 0). */
5028 return simplify_gen_relational (LE
, mode
, cmp_mode
,
5031 /* Canonicalize (LTU x 1) as (EQ x 0). */
5032 return simplify_gen_relational (EQ
, mode
, cmp_mode
,
5038 else if (op1
== constm1_rtx
)
5040 /* Canonicalize (LE x -1) as (LT x 0). */
5042 return simplify_gen_relational (LT
, mode
, cmp_mode
, op0
, const0_rtx
);
5043 /* Canonicalize (GT x -1) as (GE x 0). */
5045 return simplify_gen_relational (GE
, mode
, cmp_mode
, op0
, const0_rtx
);
5048 /* (eq/ne (plus x cst1) cst2) simplifies to (eq/ne x (cst2 - cst1)) */
5049 if ((code
== EQ
|| code
== NE
)
5050 && (op0code
== PLUS
|| op0code
== MINUS
)
5052 && CONSTANT_P (XEXP (op0
, 1))
5053 && (INTEGRAL_MODE_P (cmp_mode
) || flag_unsafe_math_optimizations
))
5055 rtx x
= XEXP (op0
, 0);
5056 rtx c
= XEXP (op0
, 1);
5057 enum rtx_code invcode
= op0code
== PLUS
? MINUS
: PLUS
;
5058 rtx tem
= simplify_gen_binary (invcode
, cmp_mode
, op1
, c
);
5060 /* Detect an infinite recursive condition, where we oscillate at this
5061 simplification case between:
5062 A + B == C <---> C - B == A,
5063 where A, B, and C are all constants with non-simplifiable expressions,
5064 usually SYMBOL_REFs. */
5065 if (GET_CODE (tem
) == invcode
5067 && rtx_equal_p (c
, XEXP (tem
, 1)))
5070 return simplify_gen_relational (code
, mode
, cmp_mode
, x
, tem
);
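  /* A concrete instance: (eq (plus (reg x) (const_int 3)) (const_int 10))
     becomes (eq (reg x) (const_int 7)), since the inverse operation MINUS
     applied to the two constants folds to 10 - 3 = 7.  */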
5073 /* (ne:SI (zero_extract:SI FOO (const_int 1) BAR) (const_int 0))) is
5074 the same as (zero_extract:SI FOO (const_int 1) BAR). */
5075 scalar_int_mode int_mode
, int_cmp_mode
;
5077 && op1
== const0_rtx
5078 && is_int_mode (mode
, &int_mode
)
5079 && is_a
<scalar_int_mode
> (cmp_mode
, &int_cmp_mode
)
5080 /* ??? Work-around BImode bugs in the ia64 backend. */
5081 && int_mode
!= BImode
5082 && int_cmp_mode
!= BImode
5083 && nonzero_bits (op0
, int_cmp_mode
) == 1
5084 && STORE_FLAG_VALUE
== 1)
5085 return GET_MODE_SIZE (int_mode
) > GET_MODE_SIZE (int_cmp_mode
)
5086 ? simplify_gen_unary (ZERO_EXTEND
, int_mode
, op0
, int_cmp_mode
)
5087 : lowpart_subreg (int_mode
, op0
, int_cmp_mode
);
5089 /* (eq/ne (xor x y) 0) simplifies to (eq/ne x y). */
5090 if ((code
== EQ
|| code
== NE
)
5091 && op1
== const0_rtx
5093 return simplify_gen_relational (code
, mode
, cmp_mode
,
5094 XEXP (op0
, 0), XEXP (op0
, 1));
5096 /* (eq/ne (xor x y) x) simplifies to (eq/ne y 0). */
5097 if ((code
== EQ
|| code
== NE
)
5099 && rtx_equal_p (XEXP (op0
, 0), op1
)
5100 && !side_effects_p (XEXP (op0
, 0)))
5101 return simplify_gen_relational (code
, mode
, cmp_mode
, XEXP (op0
, 1),
5104 /* Likewise (eq/ne (xor x y) y) simplifies to (eq/ne x 0). */
5105 if ((code
== EQ
|| code
== NE
)
5107 && rtx_equal_p (XEXP (op0
, 1), op1
)
5108 && !side_effects_p (XEXP (op0
, 1)))
5109 return simplify_gen_relational (code
, mode
, cmp_mode
, XEXP (op0
, 0),
5112 /* (eq/ne (xor x C1) C2) simplifies to (eq/ne x (C1^C2)). */
5113 if ((code
== EQ
|| code
== NE
)
5115 && CONST_SCALAR_INT_P (op1
)
5116 && CONST_SCALAR_INT_P (XEXP (op0
, 1)))
5117 return simplify_gen_relational (code
, mode
, cmp_mode
, XEXP (op0
, 0),
5118 simplify_gen_binary (XOR
, cmp_mode
,
5119 XEXP (op0
, 1), op1
));
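  /* For instance, (eq (xor (reg x) (const_int 0x0f)) (const_int 0x05))
     becomes (eq (reg x) (const_int 0x0a)), because x ^ 0x0f == 0x05
     holds exactly when x == 0x0f ^ 0x05.  */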
5121 /* Simplify eq/ne (and/ior x y) x/y) for targets with a BICS instruction or
5122 constant folding if x/y is a constant. */
5123 if ((code
== EQ
|| code
== NE
)
5124 && (op0code
== AND
|| op0code
== IOR
)
5125 && !side_effects_p (op1
)
5126 && op1
!= CONST0_RTX (cmp_mode
))
5128 /* Both (eq/ne (and x y) x) and (eq/ne (ior x y) y) simplify to
5129 (eq/ne (and (not y) x) 0). */
5130 if ((op0code
== AND
&& rtx_equal_p (XEXP (op0
, 0), op1
))
5131 || (op0code
== IOR
&& rtx_equal_p (XEXP (op0
, 1), op1
)))
5133 rtx not_y
= simplify_gen_unary (NOT
, cmp_mode
, XEXP (op0
, 1),
5135 rtx lhs
= simplify_gen_binary (AND
, cmp_mode
, not_y
, XEXP (op0
, 0));
5137 return simplify_gen_relational (code
, mode
, cmp_mode
, lhs
,
5138 CONST0_RTX (cmp_mode
));
5141 /* Both (eq/ne (and x y) y) and (eq/ne (ior x y) x) simplify to
5142 (eq/ne (and (not x) y) 0). */
5143 if ((op0code
== AND
&& rtx_equal_p (XEXP (op0
, 1), op1
))
5144 || (op0code
== IOR
&& rtx_equal_p (XEXP (op0
, 0), op1
)))
5146 rtx not_x
= simplify_gen_unary (NOT
, cmp_mode
, XEXP (op0
, 0),
5148 rtx lhs
= simplify_gen_binary (AND
, cmp_mode
, not_x
, XEXP (op0
, 1));
5150 return simplify_gen_relational (code
, mode
, cmp_mode
, lhs
,
5151 CONST0_RTX (cmp_mode
));
5155 /* (eq/ne (bswap x) C1) simplifies to (eq/ne x C2) with C2 swapped. */
5156 if ((code
== EQ
|| code
== NE
)
5157 && GET_CODE (op0
) == BSWAP
5158 && CONST_SCALAR_INT_P (op1
))
5159 return simplify_gen_relational (code
, mode
, cmp_mode
, XEXP (op0
, 0),
5160 simplify_gen_unary (BSWAP
, cmp_mode
,
5163 /* (eq/ne (bswap x) (bswap y)) simplifies to (eq/ne x y). */
5164 if ((code
== EQ
|| code
== NE
)
5165 && GET_CODE (op0
) == BSWAP
5166 && GET_CODE (op1
) == BSWAP
)
5167 return simplify_gen_relational (code
, mode
, cmp_mode
,
5168 XEXP (op0
, 0), XEXP (op1
, 0));
5170 if (op0code
== POPCOUNT
&& op1
== const0_rtx
)
5176 /* (eq (popcount x) (const_int 0)) -> (eq x (const_int 0)). */
5177 return simplify_gen_relational (EQ
, mode
, GET_MODE (XEXP (op0
, 0)),
5178 XEXP (op0
, 0), const0_rtx
);
5183 /* (ne (popcount x) (const_int 0)) -> (ne x (const_int 0)). */
5184 return simplify_gen_relational (NE
, mode
, GET_MODE (XEXP (op0
, 0)),
5185 XEXP (op0
, 0), const0_rtx
);
/* Convert the known results for EQ, LT, GT, LTU, GTU contained in
   KNOWN_RESULTS to a CONST_INT, based on the requested comparison CODE.
   For KNOWN_RESULTS to make sense it should be either CMP_EQ, or the
   logical OR of one of (CMP_LT, CMP_GT) and one of (CMP_LTU, CMP_GTU).
   For floating-point comparisons, assume that the operands were ordered.  */
5211 comparison_result (enum rtx_code code
, int known_results
)
5217 return (known_results
& CMP_EQ
) ? const_true_rtx
: const0_rtx
;
5220 return (known_results
& CMP_EQ
) ? const0_rtx
: const_true_rtx
;
5224 return (known_results
& CMP_LT
) ? const_true_rtx
: const0_rtx
;
5227 return (known_results
& CMP_LT
) ? const0_rtx
: const_true_rtx
;
5231 return (known_results
& CMP_GT
) ? const_true_rtx
: const0_rtx
;
5234 return (known_results
& CMP_GT
) ? const0_rtx
: const_true_rtx
;
5237 return (known_results
& CMP_LTU
) ? const_true_rtx
: const0_rtx
;
5239 return (known_results
& CMP_LTU
) ? const0_rtx
: const_true_rtx
;
5242 return (known_results
& CMP_GTU
) ? const_true_rtx
: const0_rtx
;
5244 return (known_results
& CMP_GTU
) ? const0_rtx
: const_true_rtx
;
5247 return const_true_rtx
;
/* Check if the given comparison (done in the given MODE) is actually
   a tautology or a contradiction.  If the mode is VOIDmode, the
   comparison is done in "infinite precision".  If no simplification
   is possible, this function returns zero.  Otherwise, it returns
   either const_true_rtx or const0_rtx.  */
5262 simplify_const_relational_operation (enum rtx_code code
,
5270 gcc_assert (mode
!= VOIDmode
5271 || (GET_MODE (op0
) == VOIDmode
5272 && GET_MODE (op1
) == VOIDmode
));
5274 /* If op0 is a compare, extract the comparison arguments from it. */
5275 if (GET_CODE (op0
) == COMPARE
&& op1
== const0_rtx
)
5277 op1
= XEXP (op0
, 1);
5278 op0
= XEXP (op0
, 0);
5280 if (GET_MODE (op0
) != VOIDmode
)
5281 mode
= GET_MODE (op0
);
5282 else if (GET_MODE (op1
) != VOIDmode
)
5283 mode
= GET_MODE (op1
);
5288 /* We can't simplify MODE_CC values since we don't know what the
5289 actual comparison is. */
5290 if (GET_MODE_CLASS (GET_MODE (op0
)) == MODE_CC
|| CC0_P (op0
))
5293 /* Make sure the constant is second. */
5294 if (swap_commutative_operands_p (op0
, op1
))
5296 std::swap (op0
, op1
);
5297 code
= swap_condition (code
);
5300 trueop0
= avoid_constant_pool_reference (op0
);
5301 trueop1
= avoid_constant_pool_reference (op1
);
  /* For integer comparisons of A and B maybe we can simplify A - B and can
     then simplify a comparison of that with zero.  If A and B are both either
     a register or a CONST_INT, this can't help; testing for these cases will
     prevent infinite recursion here and speed things up.

     We can only do this for EQ and NE comparisons, as otherwise we may
     lose or introduce overflow that we cannot disregard as undefined,
     since we do not know the signedness of the operation on either the
     left or the right hand side of the comparison.  */
5313 if (INTEGRAL_MODE_P (mode
) && trueop1
!= const0_rtx
5314 && (code
== EQ
|| code
== NE
)
5315 && ! ((REG_P (op0
) || CONST_INT_P (trueop0
))
5316 && (REG_P (op1
) || CONST_INT_P (trueop1
)))
5317 && (tem
= simplify_binary_operation (MINUS
, mode
, op0
, op1
)) != 0
5318 /* We cannot do this if tem is a nonzero address. */
5319 && ! nonzero_address_p (tem
))
5320 return simplify_const_relational_operation (signed_condition (code
),
5321 mode
, tem
, const0_rtx
);
5323 if (! HONOR_NANS (mode
) && code
== ORDERED
)
5324 return const_true_rtx
;
5326 if (! HONOR_NANS (mode
) && code
== UNORDERED
)
5329 /* For modes without NaNs, if the two operands are equal, we know the
5330 result except if they have side-effects. Even with NaNs we know
5331 the result of unordered comparisons and, if signaling NaNs are
5332 irrelevant, also the result of LT/GT/LTGT. */
5333 if ((! HONOR_NANS (trueop0
)
5334 || code
== UNEQ
|| code
== UNLE
|| code
== UNGE
5335 || ((code
== LT
|| code
== GT
|| code
== LTGT
)
5336 && ! HONOR_SNANS (trueop0
)))
5337 && rtx_equal_p (trueop0
, trueop1
)
5338 && ! side_effects_p (trueop0
))
5339 return comparison_result (code
, CMP_EQ
);
5341 /* If the operands are floating-point constants, see if we can fold
5343 if (CONST_DOUBLE_AS_FLOAT_P (trueop0
)
5344 && CONST_DOUBLE_AS_FLOAT_P (trueop1
)
5345 && SCALAR_FLOAT_MODE_P (GET_MODE (trueop0
)))
5347 const REAL_VALUE_TYPE
*d0
= CONST_DOUBLE_REAL_VALUE (trueop0
);
5348 const REAL_VALUE_TYPE
*d1
= CONST_DOUBLE_REAL_VALUE (trueop1
);
5350 /* Comparisons are unordered iff at least one of the values is NaN. */
5351 if (REAL_VALUE_ISNAN (*d0
) || REAL_VALUE_ISNAN (*d1
))
5361 return const_true_rtx
;
5374 return comparison_result (code
,
5375 (real_equal (d0
, d1
) ? CMP_EQ
:
5376 real_less (d0
, d1
) ? CMP_LT
: CMP_GT
));
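  /* For example, (lt (const_double 1.0) (const_double 2.0)) folds to
     const_true_rtx via CMP_LT.  With a NaN operand, the unordered codes
     and NE fold to const_true_rtx while the ordered codes fold to
     const0_rtx, since any ordered comparison involving a NaN is false.  */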
5379 /* Otherwise, see if the operands are both integers. */
5380 if ((GET_MODE_CLASS (mode
) == MODE_INT
|| mode
== VOIDmode
)
5381 && CONST_SCALAR_INT_P (trueop0
) && CONST_SCALAR_INT_P (trueop1
))
5383 /* It would be nice if we really had a mode here. However, the
5384 largest int representable on the target is as good as
5386 machine_mode cmode
= (mode
== VOIDmode
) ? MAX_MODE_INT
: mode
;
5387 rtx_mode_t ptrueop0
= rtx_mode_t (trueop0
, cmode
);
5388 rtx_mode_t ptrueop1
= rtx_mode_t (trueop1
, cmode
);
5390 if (wi::eq_p (ptrueop0
, ptrueop1
))
5391 return comparison_result (code
, CMP_EQ
);
5394 int cr
= wi::lts_p (ptrueop0
, ptrueop1
) ? CMP_LT
: CMP_GT
;
5395 cr
|= wi::ltu_p (ptrueop0
, ptrueop1
) ? CMP_LTU
: CMP_GTU
;
5396 return comparison_result (code
, cr
);
5400 /* Optimize comparisons with upper and lower bounds. */
5401 scalar_int_mode int_mode
;
5402 if (CONST_INT_P (trueop1
)
5403 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
5404 && HWI_COMPUTABLE_MODE_P (int_mode
)
5405 && !side_effects_p (trueop0
))
5408 unsigned HOST_WIDE_INT nonzero
= nonzero_bits (trueop0
, int_mode
);
5409 HOST_WIDE_INT val
= INTVAL (trueop1
);
5410 HOST_WIDE_INT mmin
, mmax
;
5420 /* Get a reduced range if the sign bit is zero. */
5421 if (nonzero
<= (GET_MODE_MASK (int_mode
) >> 1))
5428 rtx mmin_rtx
, mmax_rtx
;
5429 get_mode_bounds (int_mode
, sign
, int_mode
, &mmin_rtx
, &mmax_rtx
);
5431 mmin
= INTVAL (mmin_rtx
);
5432 mmax
= INTVAL (mmax_rtx
);
5435 unsigned int sign_copies
5436 = num_sign_bit_copies (trueop0
, int_mode
);
5438 mmin
>>= (sign_copies
- 1);
5439 mmax
>>= (sign_copies
- 1);
5445 /* x >= y is always true for y <= mmin, always false for y > mmax. */
5447 if ((unsigned HOST_WIDE_INT
) val
<= (unsigned HOST_WIDE_INT
) mmin
)
5448 return const_true_rtx
;
5449 if ((unsigned HOST_WIDE_INT
) val
> (unsigned HOST_WIDE_INT
) mmax
)
5454 return const_true_rtx
;
5459 /* x <= y is always true for y >= mmax, always false for y < mmin. */
5461 if ((unsigned HOST_WIDE_INT
) val
>= (unsigned HOST_WIDE_INT
) mmax
)
5462 return const_true_rtx
;
5463 if ((unsigned HOST_WIDE_INT
) val
< (unsigned HOST_WIDE_INT
) mmin
)
5468 return const_true_rtx
;
5474 /* x == y is always false for y out of range. */
5475 if (val
< mmin
|| val
> mmax
)
5479 /* x > y is always false for y >= mmax, always true for y < mmin. */
5481 if ((unsigned HOST_WIDE_INT
) val
>= (unsigned HOST_WIDE_INT
) mmax
)
5483 if ((unsigned HOST_WIDE_INT
) val
< (unsigned HOST_WIDE_INT
) mmin
)
5484 return const_true_rtx
;
5490 return const_true_rtx
;
5493 /* x < y is always false for y <= mmin, always true for y > mmax. */
5495 if ((unsigned HOST_WIDE_INT
) val
<= (unsigned HOST_WIDE_INT
) mmin
)
5497 if ((unsigned HOST_WIDE_INT
) val
> (unsigned HOST_WIDE_INT
) mmax
)
5498 return const_true_rtx
;
5504 return const_true_rtx
;
5508 /* x != y is always true for y out of range. */
5509 if (val
< mmin
|| val
> mmax
)
5510 return const_true_rtx
;
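  /* As an example of the bound tests above: if nonzero_bits shows that
     TRUEOP0 fits in 8 bits (say it is a zero_extend from QImode), the
     effective MMAX is 255, so (gtu trueop0 (const_int 255)) folds to
     const0_rtx and (leu trueop0 (const_int 255)) folds to const_true_rtx
     without knowing anything else about the value.  */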
5518 /* Optimize integer comparisons with zero. */
5519 if (is_a
<scalar_int_mode
> (mode
, &int_mode
)
5520 && trueop1
== const0_rtx
5521 && !side_effects_p (trueop0
))
5523 /* Some addresses are known to be nonzero. We don't know
5524 their sign, but equality comparisons are known. */
5525 if (nonzero_address_p (trueop0
))
5527 if (code
== EQ
|| code
== LEU
)
5529 if (code
== NE
|| code
== GTU
)
5530 return const_true_rtx
;
5533 /* See if the first operand is an IOR with a constant. If so, we
5534 may be able to determine the result of this comparison. */
5535 if (GET_CODE (op0
) == IOR
)
5537 rtx inner_const
= avoid_constant_pool_reference (XEXP (op0
, 1));
5538 if (CONST_INT_P (inner_const
) && inner_const
!= const0_rtx
)
5540 int sign_bitnum
= GET_MODE_PRECISION (int_mode
) - 1;
5541 int has_sign
= (HOST_BITS_PER_WIDE_INT
>= sign_bitnum
5542 && (UINTVAL (inner_const
)
5553 return const_true_rtx
;
5557 return const_true_rtx
;
5571 /* Optimize comparison of ABS with zero. */
5572 if (trueop1
== CONST0_RTX (mode
) && !side_effects_p (trueop0
)
5573 && (GET_CODE (trueop0
) == ABS
5574 || (GET_CODE (trueop0
) == FLOAT_EXTEND
5575 && GET_CODE (XEXP (trueop0
, 0)) == ABS
)))
5580 /* Optimize abs(x) < 0.0. */
5581 if (!INTEGRAL_MODE_P (mode
) && !HONOR_SNANS (mode
))
5586 /* Optimize abs(x) >= 0.0. */
5587 if (!INTEGRAL_MODE_P (mode
) && !HONOR_NANS (mode
))
5588 return const_true_rtx
;
5592 /* Optimize ! (abs(x) < 0.0). */
5593 return const_true_rtx
;
/* Recognize expressions of the form (X CMP 0) ? VAL : OP (X),
   where OP is CLZ or CTZ and VAL is the value of CLZ_DEFINED_VALUE_AT_ZERO
   or CTZ_DEFINED_VALUE_AT_ZERO respectively.  Return OP (X) if the whole
   expression can be simplified to that, or NULL_RTX if it cannot.
   X is assumed to be compared against zero with CMP_CODE; the true
   arm is TRUE_VAL and the false arm is FALSE_VAL.  */
5611 simplify_cond_clz_ctz (rtx x
, rtx_code cmp_code
, rtx true_val
, rtx false_val
)
5613 if (cmp_code
!= EQ
&& cmp_code
!= NE
)
5616 /* Result on X == 0 and X !=0 respectively. */
5617 rtx on_zero
, on_nonzero
;
5621 on_nonzero
= false_val
;
5625 on_zero
= false_val
;
5626 on_nonzero
= true_val
;
5629 rtx_code op_code
= GET_CODE (on_nonzero
);
5630 if ((op_code
!= CLZ
&& op_code
!= CTZ
)
5631 || !rtx_equal_p (XEXP (on_nonzero
, 0), x
)
5632 || !CONST_INT_P (on_zero
))
5635 HOST_WIDE_INT op_val
;
5636 scalar_int_mode mode ATTRIBUTE_UNUSED
5637 = as_a
<scalar_int_mode
> (GET_MODE (XEXP (on_nonzero
, 0)));
5638 if (((op_code
== CLZ
&& CLZ_DEFINED_VALUE_AT_ZERO (mode
, op_val
))
5639 || (op_code
== CTZ
&& CTZ_DEFINED_VALUE_AT_ZERO (mode
, op_val
)))
5640 && op_val
== INTVAL (on_zero
))
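/* For example, on a target whose CLZ_DEFINED_VALUE_AT_ZERO sets the value
   at zero to the mode precision (say 32 for SImode), the RTL for
   "x == 0 ? 32 : __builtin_clz (x)" collapses to a single (clz:SI x),
   because the constant arm matches what the instruction already produces
   for a zero input.  This is an illustrative scenario; the actual value
   is whatever the target macro defines.  */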
/* Try to simplify X given that it appears within operand OP of a
   VEC_MERGE operation whose mask is MASK.  X need not use the same
   vector mode as the VEC_MERGE, but it must have the same number of
   elements.

   Return the simplified X on success, otherwise return NULL_RTX.  */
5654 simplify_merge_mask (rtx x
, rtx mask
, int op
)
5656 gcc_assert (VECTOR_MODE_P (GET_MODE (x
)));
5657 poly_uint64 nunits
= GET_MODE_NUNITS (GET_MODE (x
));
5658 if (GET_CODE (x
) == VEC_MERGE
&& rtx_equal_p (XEXP (x
, 2), mask
))
5660 if (side_effects_p (XEXP (x
, 1 - op
)))
5663 return XEXP (x
, op
);
5666 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 0)))
5667 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 0))), nunits
))
5669 rtx top0
= simplify_merge_mask (XEXP (x
, 0), mask
, op
);
5671 return simplify_gen_unary (GET_CODE (x
), GET_MODE (x
), top0
,
5672 GET_MODE (XEXP (x
, 0)));
5675 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 0)))
5676 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 0))), nunits
)
5677 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 1)))
5678 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 1))), nunits
))
5680 rtx top0
= simplify_merge_mask (XEXP (x
, 0), mask
, op
);
5681 rtx top1
= simplify_merge_mask (XEXP (x
, 1), mask
, op
);
5684 if (COMPARISON_P (x
))
5685 return simplify_gen_relational (GET_CODE (x
), GET_MODE (x
),
5686 GET_MODE (XEXP (x
, 0)) != VOIDmode
5687 ? GET_MODE (XEXP (x
, 0))
5688 : GET_MODE (XEXP (x
, 1)),
5689 top0
? top0
: XEXP (x
, 0),
5690 top1
? top1
: XEXP (x
, 1));
5692 return simplify_gen_binary (GET_CODE (x
), GET_MODE (x
),
5693 top0
? top0
: XEXP (x
, 0),
5694 top1
? top1
: XEXP (x
, 1));
5697 if (GET_RTX_CLASS (GET_CODE (x
)) == RTX_TERNARY
5698 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 0)))
5699 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 0))), nunits
)
5700 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 1)))
5701 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 1))), nunits
)
5702 && VECTOR_MODE_P (GET_MODE (XEXP (x
, 2)))
5703 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (x
, 2))), nunits
))
5705 rtx top0
= simplify_merge_mask (XEXP (x
, 0), mask
, op
);
5706 rtx top1
= simplify_merge_mask (XEXP (x
, 1), mask
, op
);
5707 rtx top2
= simplify_merge_mask (XEXP (x
, 2), mask
, op
);
5708 if (top0
|| top1
|| top2
)
5709 return simplify_gen_ternary (GET_CODE (x
), GET_MODE (x
),
5710 GET_MODE (XEXP (x
, 0)),
5711 top0
? top0
: XEXP (x
, 0),
5712 top1
? top1
: XEXP (x
, 1),
5713 top2
? top2
: XEXP (x
, 2));
/* Simplify CODE, an operation with result mode MODE and three operands,
   OP0, OP1, and OP2.  OP0_MODE was the mode of OP0 before it became
   a constant.  Return 0 if no simplification is possible.  */
5724 simplify_ternary_operation (enum rtx_code code
, machine_mode mode
,
5725 machine_mode op0_mode
, rtx op0
, rtx op1
,
5728 bool any_change
= false;
5730 scalar_int_mode int_mode
, int_op0_mode
;
5731 unsigned int n_elts
;
5736 /* Simplify negations around the multiplication. */
5737 /* -a * -b + c => a * b + c. */
5738 if (GET_CODE (op0
) == NEG
)
5740 tem
= simplify_unary_operation (NEG
, mode
, op1
, mode
);
5742 op1
= tem
, op0
= XEXP (op0
, 0), any_change
= true;
5744 else if (GET_CODE (op1
) == NEG
)
5746 tem
= simplify_unary_operation (NEG
, mode
, op0
, mode
);
5748 op0
= tem
, op1
= XEXP (op1
, 0), any_change
= true;
5751 /* Canonicalize the two multiplication operands. */
5752 /* a * -b + c => -b * a + c. */
5753 if (swap_commutative_operands_p (op0
, op1
))
5754 std::swap (op0
, op1
), any_change
= true;
5757 return gen_rtx_FMA (mode
, op0
, op1
, op2
);
5762 if (CONST_INT_P (op0
)
5763 && CONST_INT_P (op1
)
5764 && CONST_INT_P (op2
)
5765 && is_a
<scalar_int_mode
> (mode
, &int_mode
)
5766 && INTVAL (op1
) + INTVAL (op2
) <= GET_MODE_PRECISION (int_mode
)
5767 && HWI_COMPUTABLE_MODE_P (int_mode
))
5769 /* Extracting a bit-field from a constant */
5770 unsigned HOST_WIDE_INT val
= UINTVAL (op0
);
5771 HOST_WIDE_INT op1val
= INTVAL (op1
);
5772 HOST_WIDE_INT op2val
= INTVAL (op2
);
5773 if (!BITS_BIG_ENDIAN
)
5775 else if (is_a
<scalar_int_mode
> (op0_mode
, &int_op0_mode
))
5776 val
>>= GET_MODE_PRECISION (int_op0_mode
) - op2val
- op1val
;
5778 /* Not enough information to calculate the bit position. */
5781 if (HOST_BITS_PER_WIDE_INT
!= op1val
)
5783 /* First zero-extend. */
5784 val
&= (HOST_WIDE_INT_1U
<< op1val
) - 1;
5785 /* If desired, propagate sign bit. */
5786 if (code
== SIGN_EXTRACT
5787 && (val
& (HOST_WIDE_INT_1U
<< (op1val
- 1)))
5789 val
|= ~ ((HOST_WIDE_INT_1U
<< op1val
) - 1);
5792 return gen_int_mode (val
, int_mode
);
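	/* A worked instance, assuming BITS_BIG_ENDIAN == 0: extracting a
	   4-bit field at bit position 4 from (const_int 0xa5) gives 0xa,
	   so ZERO_EXTRACT folds to (const_int 10) while SIGN_EXTRACT,
	   seeing the field's top bit set, folds to (const_int -6).  */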
5797 if (CONST_INT_P (op0
))
5798 return op0
!= const0_rtx
? op1
: op2
;
5800 /* Convert c ? a : a into "a". */
5801 if (rtx_equal_p (op1
, op2
) && ! side_effects_p (op0
))
5804 /* Convert a != b ? a : b into "a". */
5805 if (GET_CODE (op0
) == NE
5806 && ! side_effects_p (op0
)
5807 && ! HONOR_NANS (mode
)
5808 && ! HONOR_SIGNED_ZEROS (mode
)
5809 && ((rtx_equal_p (XEXP (op0
, 0), op1
)
5810 && rtx_equal_p (XEXP (op0
, 1), op2
))
5811 || (rtx_equal_p (XEXP (op0
, 0), op2
)
5812 && rtx_equal_p (XEXP (op0
, 1), op1
))))
5815 /* Convert a == b ? a : b into "b". */
5816 if (GET_CODE (op0
) == EQ
5817 && ! side_effects_p (op0
)
5818 && ! HONOR_NANS (mode
)
5819 && ! HONOR_SIGNED_ZEROS (mode
)
5820 && ((rtx_equal_p (XEXP (op0
, 0), op1
)
5821 && rtx_equal_p (XEXP (op0
, 1), op2
))
5822 || (rtx_equal_p (XEXP (op0
, 0), op2
)
5823 && rtx_equal_p (XEXP (op0
, 1), op1
))))
5826 /* Convert (!c) != {0,...,0} ? a : b into
5827 c != {0,...,0} ? b : a for vector modes. */
5828 if (VECTOR_MODE_P (GET_MODE (op1
))
5829 && GET_CODE (op0
) == NE
5830 && GET_CODE (XEXP (op0
, 0)) == NOT
5831 && GET_CODE (XEXP (op0
, 1)) == CONST_VECTOR
)
5833 rtx cv
= XEXP (op0
, 1);
5836 if (!CONST_VECTOR_NUNITS (cv
).is_constant (&nunits
))
5839 for (int i
= 0; i
< nunits
; ++i
)
5840 if (CONST_VECTOR_ELT (cv
, i
) != const0_rtx
)
5847 rtx new_op0
= gen_rtx_NE (GET_MODE (op0
),
5848 XEXP (XEXP (op0
, 0), 0),
5850 rtx retval
= gen_rtx_IF_THEN_ELSE (mode
, new_op0
, op2
, op1
);
5855 /* Convert x == 0 ? N : clz (x) into clz (x) when
5856 CLZ_DEFINED_VALUE_AT_ZERO is defined to N for the mode of x.
5857 Similarly for ctz (x). */
5858 if (COMPARISON_P (op0
) && !side_effects_p (op0
)
5859 && XEXP (op0
, 1) == const0_rtx
)
5862 = simplify_cond_clz_ctz (XEXP (op0
, 0), GET_CODE (op0
),
5868 if (COMPARISON_P (op0
) && ! side_effects_p (op0
))
5870 machine_mode cmp_mode
= (GET_MODE (XEXP (op0
, 0)) == VOIDmode
5871 ? GET_MODE (XEXP (op0
, 1))
5872 : GET_MODE (XEXP (op0
, 0)));
5875 /* Look for happy constants in op1 and op2. */
5876 if (CONST_INT_P (op1
) && CONST_INT_P (op2
))
5878 HOST_WIDE_INT t
= INTVAL (op1
);
5879 HOST_WIDE_INT f
= INTVAL (op2
);
5881 if (t
== STORE_FLAG_VALUE
&& f
== 0)
5882 code
= GET_CODE (op0
);
5883 else if (t
== 0 && f
== STORE_FLAG_VALUE
)
5886 tmp
= reversed_comparison_code (op0
, NULL
);
5894 return simplify_gen_relational (code
, mode
, cmp_mode
,
5895 XEXP (op0
, 0), XEXP (op0
, 1));
5898 temp
= simplify_relational_operation (GET_CODE (op0
), op0_mode
,
5899 cmp_mode
, XEXP (op0
, 0),
5902 /* See if any simplifications were possible. */
5905 if (CONST_INT_P (temp
))
5906 return temp
== const0_rtx
? op2
: op1
;
5908 return gen_rtx_IF_THEN_ELSE (mode
, temp
, op1
, op2
);
5914 gcc_assert (GET_MODE (op0
) == mode
);
5915 gcc_assert (GET_MODE (op1
) == mode
);
5916 gcc_assert (VECTOR_MODE_P (mode
));
5917 trueop2
= avoid_constant_pool_reference (op2
);
5918 if (CONST_INT_P (trueop2
)
5919 && GET_MODE_NUNITS (mode
).is_constant (&n_elts
))
5921 unsigned HOST_WIDE_INT sel
= UINTVAL (trueop2
);
5922 unsigned HOST_WIDE_INT mask
;
5923 if (n_elts
== HOST_BITS_PER_WIDE_INT
)
5926 mask
= (HOST_WIDE_INT_1U
<< n_elts
) - 1;
5928 if (!(sel
& mask
) && !side_effects_p (op0
))
5930 if ((sel
& mask
) == mask
&& !side_effects_p (op1
))
5933 rtx trueop0
= avoid_constant_pool_reference (op0
);
5934 rtx trueop1
= avoid_constant_pool_reference (op1
);
5935 if (GET_CODE (trueop0
) == CONST_VECTOR
5936 && GET_CODE (trueop1
) == CONST_VECTOR
)
5938 rtvec v
= rtvec_alloc (n_elts
);
5941 for (i
= 0; i
< n_elts
; i
++)
5942 RTVEC_ELT (v
, i
) = ((sel
& (HOST_WIDE_INT_1U
<< i
))
5943 ? CONST_VECTOR_ELT (trueop0
, i
)
5944 : CONST_VECTOR_ELT (trueop1
, i
));
5945 return gen_rtx_CONST_VECTOR (mode
, v
);
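	  /* For example, with V4SI operands, (vec_merge [1,2,3,4] [5,6,7,8]
	     (const_int 5)) has selector bits 0b0101, so elements 0 and 2
	     come from the first vector and the rest from the second, and
	     the whole expression folds to the constant vector [1, 6, 3, 8].  */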
5948 /* Replace (vec_merge (vec_merge a b m) c n) with (vec_merge b c n)
5949 if no element from a appears in the result. */
5950 if (GET_CODE (op0
) == VEC_MERGE
)
5952 tem
= avoid_constant_pool_reference (XEXP (op0
, 2));
5953 if (CONST_INT_P (tem
))
5955 unsigned HOST_WIDE_INT sel0
= UINTVAL (tem
);
5956 if (!(sel
& sel0
& mask
) && !side_effects_p (XEXP (op0
, 0)))
5957 return simplify_gen_ternary (code
, mode
, mode
,
5958 XEXP (op0
, 1), op1
, op2
);
5959 if (!(sel
& ~sel0
& mask
) && !side_effects_p (XEXP (op0
, 1)))
5960 return simplify_gen_ternary (code
, mode
, mode
,
5961 XEXP (op0
, 0), op1
, op2
);
5964 if (GET_CODE (op1
) == VEC_MERGE
)
5966 tem
= avoid_constant_pool_reference (XEXP (op1
, 2));
5967 if (CONST_INT_P (tem
))
5969 unsigned HOST_WIDE_INT sel1
= UINTVAL (tem
);
5970 if (!(~sel
& sel1
& mask
) && !side_effects_p (XEXP (op1
, 0)))
5971 return simplify_gen_ternary (code
, mode
, mode
,
5972 op0
, XEXP (op1
, 1), op2
);
5973 if (!(~sel
& ~sel1
& mask
) && !side_effects_p (XEXP (op1
, 1)))
5974 return simplify_gen_ternary (code
, mode
, mode
,
5975 op0
, XEXP (op1
, 0), op2
);
5979 /* Replace (vec_merge (vec_duplicate (vec_select a parallel (i))) a 1 << i)
5981 if (GET_CODE (op0
) == VEC_DUPLICATE
5982 && GET_CODE (XEXP (op0
, 0)) == VEC_SELECT
5983 && GET_CODE (XEXP (XEXP (op0
, 0), 1)) == PARALLEL
5984 && known_eq (GET_MODE_NUNITS (GET_MODE (XEXP (op0
, 0))), 1))
5986 tem
= XVECEXP ((XEXP (XEXP (op0
, 0), 1)), 0, 0);
5987 if (CONST_INT_P (tem
) && CONST_INT_P (op2
))
5989 if (XEXP (XEXP (op0
, 0), 0) == op1
5990 && UINTVAL (op2
) == HOST_WIDE_INT_1U
<< UINTVAL (tem
))
5994 /* Replace (vec_merge (vec_duplicate (X)) (const_vector [A, B])
5996 with (vec_concat (X) (B)) if N == 1 or
5997 (vec_concat (A) (X)) if N == 2. */
5998 if (GET_CODE (op0
) == VEC_DUPLICATE
5999 && GET_CODE (op1
) == CONST_VECTOR
6000 && known_eq (CONST_VECTOR_NUNITS (op1
), 2)
6001 && known_eq (GET_MODE_NUNITS (GET_MODE (op0
)), 2)
6002 && IN_RANGE (sel
, 1, 2))
6004 rtx newop0
= XEXP (op0
, 0);
6005 rtx newop1
= CONST_VECTOR_ELT (op1
, 2 - sel
);
6007 std::swap (newop0
, newop1
);
6008 return simplify_gen_binary (VEC_CONCAT
, mode
, newop0
, newop1
);
6010 /* Replace (vec_merge (vec_duplicate x) (vec_concat (y) (z)) (const_int N))
6011 with (vec_concat x z) if N == 1, or (vec_concat y x) if N == 2.
6012 Only applies for vectors of two elements. */
6013 if (GET_CODE (op0
) == VEC_DUPLICATE
6014 && GET_CODE (op1
) == VEC_CONCAT
6015 && known_eq (GET_MODE_NUNITS (GET_MODE (op0
)), 2)
6016 && known_eq (GET_MODE_NUNITS (GET_MODE (op1
)), 2)
6017 && IN_RANGE (sel
, 1, 2))
6019 rtx newop0
= XEXP (op0
, 0);
6020 rtx newop1
= XEXP (op1
, 2 - sel
);
6021 rtx otherop
= XEXP (op1
, sel
- 1);
6023 std::swap (newop0
, newop1
);
6024 /* Don't want to throw away the other part of the vec_concat if
6025 it has side-effects. */
6026 if (!side_effects_p (otherop
))
6027 return simplify_gen_binary (VEC_CONCAT
, mode
, newop0
, newop1
);
6032 (vec_merge:outer (vec_duplicate:outer x:inner)
6033 (subreg:outer y:inner 0)
6036 with (vec_concat:outer x:inner y:inner) if N == 1,
6037 or (vec_concat:outer y:inner x:inner) if N == 2.
6039 Implicitly, this means we have a paradoxical subreg, but such
6040 a check is cheap, so make it anyway.
6042 Only applies for vectors of two elements. */
6043 if (GET_CODE (op0
) == VEC_DUPLICATE
6044 && GET_CODE (op1
) == SUBREG
6045 && GET_MODE (op1
) == GET_MODE (op0
)
6046 && GET_MODE (SUBREG_REG (op1
)) == GET_MODE (XEXP (op0
, 0))
6047 && paradoxical_subreg_p (op1
)
6048 && subreg_lowpart_p (op1
)
6049 && known_eq (GET_MODE_NUNITS (GET_MODE (op0
)), 2)
6050 && known_eq (GET_MODE_NUNITS (GET_MODE (op1
)), 2)
6051 && IN_RANGE (sel
, 1, 2))
6053 rtx newop0
= XEXP (op0
, 0);
6054 rtx newop1
= SUBREG_REG (op1
);
6056 std::swap (newop0
, newop1
);
6057 return simplify_gen_binary (VEC_CONCAT
, mode
, newop0
, newop1
);
6060 /* Same as above but with switched operands:
6061 Replace (vec_merge:outer (subreg:outer x:inner 0)
6062 (vec_duplicate:outer y:inner)
6065 with (vec_concat:outer x:inner y:inner) if N == 1,
6066 or (vec_concat:outer y:inner x:inner) if N == 2. */
6067 if (GET_CODE (op1
) == VEC_DUPLICATE
6068 && GET_CODE (op0
) == SUBREG
6069 && GET_MODE (op0
) == GET_MODE (op1
)
6070 && GET_MODE (SUBREG_REG (op0
)) == GET_MODE (XEXP (op1
, 0))
6071 && paradoxical_subreg_p (op0
)
6072 && subreg_lowpart_p (op0
)
6073 && known_eq (GET_MODE_NUNITS (GET_MODE (op1
)), 2)
6074 && known_eq (GET_MODE_NUNITS (GET_MODE (op0
)), 2)
6075 && IN_RANGE (sel
, 1, 2))
6077 rtx newop0
= SUBREG_REG (op0
);
6078 rtx newop1
= XEXP (op1
, 0);
6080 std::swap (newop0
, newop1
);
6081 return simplify_gen_binary (VEC_CONCAT
, mode
, newop0
, newop1
);
6084 /* Replace (vec_merge (vec_duplicate x) (vec_duplicate y)
6086 with (vec_concat x y) or (vec_concat y x) depending on value
6088 if (GET_CODE (op0
) == VEC_DUPLICATE
6089 && GET_CODE (op1
) == VEC_DUPLICATE
6090 && known_eq (GET_MODE_NUNITS (GET_MODE (op0
)), 2)
6091 && known_eq (GET_MODE_NUNITS (GET_MODE (op1
)), 2)
6092 && IN_RANGE (sel
, 1, 2))
6094 rtx newop0
= XEXP (op0
, 0);
6095 rtx newop1
= XEXP (op1
, 0);
6097 std::swap (newop0
, newop1
);
6099 return simplify_gen_binary (VEC_CONCAT
, mode
, newop0
, newop1
);
6103 if (rtx_equal_p (op0
, op1
)
6104 && !side_effects_p (op2
) && !side_effects_p (op1
))
6107 if (!side_effects_p (op2
))
6110 = may_trap_p (op0
) ? NULL_RTX
: simplify_merge_mask (op0
, op2
, 0);
6112 = may_trap_p (op1
) ? NULL_RTX
: simplify_merge_mask (op1
, op2
, 1);
6114 return simplify_gen_ternary (code
, mode
, mode
,
6116 top1
? top1
: op1
, op2
);
/* Try to calculate NUM_BYTES bytes of the target memory image of X,
   starting at byte FIRST_BYTE.  Return true on success and add the
   bytes to BYTES, such that each byte has BITS_PER_UNIT bits and such
   that the bytes follow target memory order.  Leave BYTES unmodified
   on failure.

   MODE is the mode of X.  The caller must reserve NUM_BYTES bytes in
   BYTES before calling this function.  */
bool
native_encode_rtx (machine_mode mode, rtx x, vec<target_unit> &bytes,
		   unsigned int first_byte, unsigned int num_bytes)
{
  /* Check the mode is sensible.  */
  gcc_assert (GET_MODE (x) == VOIDmode
	      ? is_a <scalar_int_mode> (mode)
	      : mode == GET_MODE (x));

  if (GET_CODE (x) == CONST_VECTOR)
    {
      /* CONST_VECTOR_ELT follows target memory order, so no shuffling
	 is necessary.  The only complication is that MODE_VECTOR_BOOL
	 vectors can have several elements per byte.  */
      unsigned int elt_bits = vector_element_size (GET_MODE_BITSIZE (mode),
						   GET_MODE_NUNITS (mode));
      unsigned int elt = first_byte * BITS_PER_UNIT / elt_bits;
      if (elt_bits < BITS_PER_UNIT)
	{
	  /* This is the only case in which elements can be smaller than
	     a byte.  */
	  gcc_assert (GET_MODE_CLASS (mode) == MODE_VECTOR_BOOL);
	  for (unsigned int i = 0; i < num_bytes; ++i)
	    {
	      target_unit value = 0;
	      for (unsigned int j = 0; j < BITS_PER_UNIT; j += elt_bits)
		{
		  value |= (INTVAL (CONST_VECTOR_ELT (x, elt)) & 1) << j;
		  elt += 1;
		}
	      bytes.quick_push (value);
	    }
	  return true;
	}

      unsigned int start = bytes.length ();
      unsigned int elt_bytes = GET_MODE_UNIT_SIZE (mode);
      /* Make FIRST_BYTE relative to ELT.  */
      first_byte %= elt_bytes;
      while (num_bytes > 0)
	{
	  /* Work out how many bytes we want from element ELT.  */
	  unsigned int chunk_bytes = MIN (num_bytes, elt_bytes - first_byte);
	  if (!native_encode_rtx (GET_MODE_INNER (mode),
				  CONST_VECTOR_ELT (x, elt), bytes,
				  first_byte, chunk_bytes))
	    {
	      bytes.truncate (start);
	      return false;
	    }
	  elt += 1;
	  first_byte = 0;
	  num_bytes -= chunk_bytes;
	}
      return true;
    }

  /* All subsequent cases are limited to scalars.  */
  scalar_mode smode;
  if (!is_a <scalar_mode> (mode, &smode))
    return false;

  /* Make sure that the region is in range.  */
  unsigned int end_byte = first_byte + num_bytes;
  unsigned int mode_bytes = GET_MODE_SIZE (smode);
  gcc_assert (end_byte <= mode_bytes);

  if (CONST_SCALAR_INT_P (x))
    {
      /* The target memory layout is affected by both BYTES_BIG_ENDIAN
	 and WORDS_BIG_ENDIAN.  Use the subreg machinery to get the lsb
	 position of each byte.  */
      rtx_mode_t value (x, smode);
      wide_int_ref value_wi (value);
      for (unsigned int byte = first_byte; byte < end_byte; ++byte)
	{
	  /* Always constant because the inputs are.  */
	  unsigned int lsb
	    = subreg_size_lsb (1, mode_bytes, byte).to_constant ();
	  /* Operate directly on the encoding rather than using
	     wi::extract_uhwi, so that we preserve the sign or zero
	     extension for modes that are not a whole number of bits in
	     size.  (Zero extension is only used for the combination of
	     innermode == BImode && STORE_FLAG_VALUE == 1).  */
	  unsigned int elt = lsb / HOST_BITS_PER_WIDE_INT;
	  unsigned int shift = lsb % HOST_BITS_PER_WIDE_INT;
	  unsigned HOST_WIDE_INT uhwi = value_wi.elt (elt);
	  bytes.quick_push (uhwi >> shift);
	}
      return true;
    }

  if (CONST_DOUBLE_P (x))
    {
      /* real_to_target produces an array of integers in target memory order.
	 All integers before the last one have 32 bits; the last one may
	 have 32 bits or fewer, depending on whether the mode bitsize
	 is divisible by 32.  Each of these integers is then laid out
	 in target memory as any other integer would be.  */
      long el32[MAX_BITSIZE_MODE_ANY_MODE / 32];
      real_to_target (el32, CONST_DOUBLE_REAL_VALUE (x), smode);

      /* The (maximum) number of target bytes per element of el32.  */
      unsigned int bytes_per_el32 = 32 / BITS_PER_UNIT;
      gcc_assert (bytes_per_el32 != 0);

      /* Build up the integers in a similar way to the CONST_SCALAR_INT_P
	 handling above.  */
      for (unsigned int byte = first_byte; byte < end_byte; ++byte)
	{
	  unsigned int index = byte / bytes_per_el32;
	  unsigned int subbyte = byte % bytes_per_el32;
	  unsigned int int_bytes = MIN (bytes_per_el32,
					mode_bytes - index * bytes_per_el32);
	  /* Always constant because the inputs are.  */
	  unsigned int lsb
	    = subreg_size_lsb (1, int_bytes, subbyte).to_constant ();
	  bytes.quick_push ((unsigned long) el32[index] >> lsb);
	}
      return true;
    }

  if (GET_CODE (x) == CONST_FIXED)
    {
      for (unsigned int byte = first_byte; byte < end_byte; ++byte)
	{
	  /* Always constant because the inputs are.  */
	  unsigned int lsb
	    = subreg_size_lsb (1, mode_bytes, byte).to_constant ();
	  unsigned HOST_WIDE_INT piece = CONST_FIXED_VALUE_LOW (x);
	  if (lsb >= HOST_BITS_PER_WIDE_INT)
	    {
	      lsb -= HOST_BITS_PER_WIDE_INT;
	      piece = CONST_FIXED_VALUE_HIGH (x);
	    }
	  bytes.quick_push (piece >> lsb);
	}
      return true;
    }

  return false;
}
/* Read a vector of mode MODE from the target memory image given by BYTES,
   starting at byte FIRST_BYTE.  The vector is known to be encodable using
   NPATTERNS interleaved patterns with NELTS_PER_PATTERN elements each,
   and BYTES is known to have enough bytes to supply NPATTERNS *
   NELTS_PER_PATTERN vector elements.  Each element of BYTES contains
   BITS_PER_UNIT bits and the bytes are in target memory order.

   Return the vector on success, otherwise return NULL_RTX.  */
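/* For example, native_decode_rtx decodes a constant-length vector by
   calling this function with NPATTERNS equal to the number of elements
   and NELTS_PER_PATTERN == 1, so that every element is read directly
   from BYTES.  */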
rtx
native_decode_vector_rtx (machine_mode mode, vec<target_unit> bytes,
			  unsigned int first_byte, unsigned int npatterns,
			  unsigned int nelts_per_pattern)
{
  rtx_vector_builder builder (mode, npatterns, nelts_per_pattern);

  unsigned int elt_bits = vector_element_size (GET_MODE_BITSIZE (mode),
					       GET_MODE_NUNITS (mode));
  if (elt_bits < BITS_PER_UNIT)
    {
      /* This is the only case in which elements can be smaller than a byte.
	 Element 0 is always in the lsb of the containing byte.  */
      gcc_assert (GET_MODE_CLASS (mode) == MODE_VECTOR_BOOL);
      for (unsigned int i = 0; i < builder.encoded_nelts (); ++i)
	{
	  unsigned int bit_index = first_byte * BITS_PER_UNIT + i * elt_bits;
	  unsigned int byte_index = bit_index / BITS_PER_UNIT;
	  unsigned int lsb = bit_index % BITS_PER_UNIT;
	  builder.quick_push (bytes[byte_index] & (1 << lsb)
			      ? CONST1_RTX (BImode)
			      : CONST0_RTX (BImode));
	}
    }
  else
    {
      for (unsigned int i = 0; i < builder.encoded_nelts (); ++i)
	{
	  rtx x = native_decode_rtx (GET_MODE_INNER (mode), bytes, first_byte);
	  if (!x)
	    return NULL_RTX;
	  builder.quick_push (x);
	  first_byte += elt_bits / BITS_PER_UNIT;
	}
    }
  return builder.build ();
}
/* Read an rtx of mode MODE from the target memory image given by BYTES,
   starting at byte FIRST_BYTE.  Each element of BYTES contains BITS_PER_UNIT
   bits and the bytes are in target memory order.  The image has enough
   values to specify all bytes of MODE.

   Return the rtx on success, otherwise return NULL_RTX.  */
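/* For example, with 8-bit target bytes on a little-endian target,
   decoding the bytes { 0x02, 0x01 } as HImode yields (const_int 0x0102),
   inverting the corresponding native_encode_rtx call.  */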
rtx
native_decode_rtx (machine_mode mode, vec<target_unit> bytes,
		   unsigned int first_byte)
{
  if (VECTOR_MODE_P (mode))
    {
      /* If we know at compile time how many elements there are,
	 pull each element directly from BYTES.  */
      unsigned int nelts;
      if (GET_MODE_NUNITS (mode).is_constant (&nelts))
	return native_decode_vector_rtx (mode, bytes, first_byte, nelts, 1);
      return NULL_RTX;
    }

  scalar_int_mode imode;
  if (is_a <scalar_int_mode> (mode, &imode)
      && GET_MODE_PRECISION (imode) <= MAX_BITSIZE_MODE_ANY_INT)
    {
      /* Pull the bytes msb first, so that we can use simple
	 shift-and-insert wide_int operations.  */
      unsigned int size = GET_MODE_SIZE (imode);
      wide_int result (wi::zero (GET_MODE_PRECISION (imode)));
      for (unsigned int i = 0; i < size; ++i)
	{
	  unsigned int lsb = (size - i - 1) * BITS_PER_UNIT;
	  /* Always constant because the inputs are.  */
	  unsigned int subbyte
	    = subreg_size_offset_from_lsb (1, size, lsb).to_constant ();
	  result <<= BITS_PER_UNIT;
	  result |= bytes[first_byte + subbyte];
	}
      return immed_wide_int_const (result, imode);
    }

  scalar_float_mode fmode;
  if (is_a <scalar_float_mode> (mode, &fmode))
    {
      /* We need to build an array of integers in target memory order.
	 All integers before the last one have 32 bits; the last one may
	 have 32 bits or fewer, depending on whether the mode bitsize
	 is divisible by 32.  */
      long el32[MAX_BITSIZE_MODE_ANY_MODE / 32];
      unsigned int num_el32 = CEIL (GET_MODE_BITSIZE (fmode), 32);
      memset (el32, 0, num_el32 * sizeof (long));

      /* The (maximum) number of target bytes per element of el32.  */
      unsigned int bytes_per_el32 = 32 / BITS_PER_UNIT;
      gcc_assert (bytes_per_el32 != 0);

      unsigned int mode_bytes = GET_MODE_SIZE (fmode);
      for (unsigned int byte = 0; byte < mode_bytes; ++byte)
	{
	  unsigned int index = byte / bytes_per_el32;
	  unsigned int subbyte = byte % bytes_per_el32;
	  unsigned int int_bytes = MIN (bytes_per_el32,
					mode_bytes - index * bytes_per_el32);
	  /* Always constant because the inputs are.  */
	  unsigned int lsb
	    = subreg_size_lsb (1, int_bytes, subbyte).to_constant ();
	  el32[index] |= (unsigned long) bytes[first_byte + byte] << lsb;
	}
      REAL_VALUE_TYPE r;
      real_from_target (&r, el32, fmode);
      return const_double_from_real_value (r, fmode);
    }

  if (ALL_SCALAR_FIXED_POINT_MODE_P (mode))
    {
      scalar_mode smode = as_a <scalar_mode> (mode);
      FIXED_VALUE_TYPE f;
      f.data.low = 0;
      f.data.high = 0;
      f.mode = smode;

      unsigned int mode_bytes = GET_MODE_SIZE (smode);
      for (unsigned int byte = 0; byte < mode_bytes; ++byte)
	{
	  /* Always constant because the inputs are.  */
	  unsigned int lsb
	    = subreg_size_lsb (1, mode_bytes, byte).to_constant ();
	  unsigned HOST_WIDE_INT unit = bytes[first_byte + byte];
	  if (lsb >= HOST_BITS_PER_WIDE_INT)
	    f.data.high |= unit << (lsb - HOST_BITS_PER_WIDE_INT);
	  else
	    f.data.low |= unit << lsb;
	}
      return CONST_FIXED_FROM_FIXED_VALUE (f, mode);
    }

  return NULL_RTX;
}
/* Simplify a byte offset BYTE into CONST_VECTOR X.  The main purpose
   is to convert a runtime BYTE value into a constant one.  */
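/* For example, if X is a duplicate of a single 4-byte element, any
   runtime BYTE offset that is a multiple of 4 simplifies to the
   constant offset 0.  */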
static poly_uint64
simplify_const_vector_byte_offset (rtx x, poly_uint64 byte)
{
  /* Cope with MODE_VECTOR_BOOL by operating on bits rather than bytes.  */
  machine_mode mode = GET_MODE (x);
  unsigned int elt_bits = vector_element_size (GET_MODE_BITSIZE (mode),
					       GET_MODE_NUNITS (mode));
  /* The number of bits needed to encode one element from each pattern.  */
  unsigned int sequence_bits = CONST_VECTOR_NPATTERNS (x) * elt_bits;

  /* Identify the start point in terms of a sequence number and a byte offset
     within that sequence.  */
  poly_uint64 first_sequence;
  unsigned HOST_WIDE_INT subbit;
  if (can_div_trunc_p (byte * BITS_PER_UNIT, sequence_bits,
		       &first_sequence, &subbit))
    {
      unsigned int nelts_per_pattern = CONST_VECTOR_NELTS_PER_PATTERN (x);
      if (nelts_per_pattern == 1)
	/* This is a duplicated vector, so the value of FIRST_SEQUENCE
	   doesn't matter.  */
	byte = subbit / BITS_PER_UNIT;
      else if (nelts_per_pattern == 2 && known_gt (first_sequence, 0U))
	{
	  /* The subreg drops the first element from each pattern and
	     only uses the second element.  Find the first sequence
	     that starts on a byte boundary.  */
	  subbit += least_common_multiple (sequence_bits, BITS_PER_UNIT);
	  byte = subbit / BITS_PER_UNIT;
	}
    }
  return byte;
}
/* Subroutine of simplify_subreg in which:

   - X is known to be a CONST_VECTOR
   - OUTERMODE is known to be a vector mode

   Try to handle the subreg by operating on the CONST_VECTOR encoding
   rather than on each individual element of the CONST_VECTOR.

   Return the simplified subreg on success, otherwise return NULL_RTX.  */
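/* For example, the low half of a stepped constant { 0, 1, 2, 3, ... }
   taken in a narrower vector mode with the same element mode can be
   re-encoded directly as the stepped constant { 0, 1, 2, 3, ... },
   without expanding the individual elements.  */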
static rtx
simplify_const_vector_subreg (machine_mode outermode, rtx x,
			      machine_mode innermode, unsigned int first_byte)
{
  /* Paradoxical subregs of vectors have dubious semantics.  */
  if (paradoxical_subreg_p (outermode, innermode))
    return NULL_RTX;

  /* We can only preserve the semantics of a stepped pattern if the new
     vector element is the same as the original one.  */
  if (CONST_VECTOR_STEPPED_P (x)
      && GET_MODE_INNER (outermode) != GET_MODE_INNER (innermode))
    return NULL_RTX;

  /* Cope with MODE_VECTOR_BOOL by operating on bits rather than bytes.  */
  unsigned int x_elt_bits
    = vector_element_size (GET_MODE_BITSIZE (innermode),
			   GET_MODE_NUNITS (innermode));
  unsigned int out_elt_bits
    = vector_element_size (GET_MODE_BITSIZE (outermode),
			   GET_MODE_NUNITS (outermode));

  /* The number of bits needed to encode one element from every pattern
     of the original vector.  */
  unsigned int x_sequence_bits = CONST_VECTOR_NPATTERNS (x) * x_elt_bits;

  /* The number of bits needed to encode one element from every pattern
     of the result.  */
  unsigned int out_sequence_bits
    = least_common_multiple (x_sequence_bits, out_elt_bits);

  /* Work out the number of interleaved patterns in the output vector
     and the number of encoded elements per pattern.  */
  unsigned int out_npatterns = out_sequence_bits / out_elt_bits;
  unsigned int nelts_per_pattern = CONST_VECTOR_NELTS_PER_PATTERN (x);

  /* The encoding scheme requires the number of elements to be a multiple
     of the number of patterns, so that each pattern appears at least once
     and so that the same number of elements appear from each pattern.  */
  bool ok_p = multiple_p (GET_MODE_NUNITS (outermode), out_npatterns);
  unsigned int const_nunits;
  if (GET_MODE_NUNITS (outermode).is_constant (&const_nunits)
      && (!ok_p || out_npatterns * nelts_per_pattern > const_nunits))
    {
      /* Either the encoding is invalid, or applying it would give us
	 more elements than we need.  Just encode each element directly.  */
      out_npatterns = const_nunits;
      nelts_per_pattern = 1;
    }
  else if (!ok_p)
    return NULL_RTX;

  /* Get enough bytes of X to form the new encoding.  */
  unsigned int buffer_bits = out_npatterns * nelts_per_pattern * out_elt_bits;
  unsigned int buffer_bytes = CEIL (buffer_bits, BITS_PER_UNIT);
  auto_vec<target_unit, 128> buffer (buffer_bytes);
  if (!native_encode_rtx (innermode, x, buffer, first_byte, buffer_bytes))
    return NULL_RTX;

  /* Reencode the bytes as OUTERMODE.  */
  return native_decode_vector_rtx (outermode, buffer, 0, out_npatterns,
				   nelts_per_pattern);
}
/* Try to simplify a subreg of a constant by encoding the subreg region
   as a sequence of target bytes and reading them back in the new mode.
   Return the new value on success, otherwise return null.

   The subreg has outer mode OUTERMODE, inner mode INNERMODE, inner value X
   and byte offset FIRST_BYTE.  */
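/* For example, on a little-endian target a QImode subreg of
   (const_int 0x1234) at byte 0 encodes the low byte of the HImode
   image and decodes it back as (const_int 0x34).  */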
static rtx
simplify_immed_subreg (fixed_size_mode outermode, rtx x,
		       machine_mode innermode, unsigned int first_byte)
{
  unsigned int buffer_bytes = GET_MODE_SIZE (outermode);
  auto_vec<target_unit, 128> buffer (buffer_bytes);

  /* Some ports misuse CCmode.  */
  if (GET_MODE_CLASS (outermode) == MODE_CC && CONST_INT_P (x))
    return x;

  /* Paradoxical subregs read undefined values for bytes outside of the
     inner value.  However, we have traditionally always sign-extended
     integer constants and zero-extended others.  */
  unsigned int inner_bytes = buffer_bytes;
  if (paradoxical_subreg_p (outermode, innermode))
    {
      if (!GET_MODE_SIZE (innermode).is_constant (&inner_bytes))
	return NULL_RTX;

      target_unit filler = 0;
      if (CONST_SCALAR_INT_P (x) && wi::neg_p (rtx_mode_t (x, innermode)))
	filler = -1;

      /* Add any leading bytes due to big-endian layout.  The number of
	 bytes must be constant because both modes have constant size.  */
      unsigned int leading_bytes
	= -byte_lowpart_offset (outermode, innermode).to_constant ();
      for (unsigned int i = 0; i < leading_bytes; ++i)
	buffer.quick_push (filler);

      if (!native_encode_rtx (innermode, x, buffer, first_byte, inner_bytes))
	return NULL_RTX;

      /* Add any trailing bytes due to little-endian layout.  */
      while (buffer.length () < buffer_bytes)
	buffer.quick_push (filler);
    }
  else
    {
      if (!native_encode_rtx (innermode, x, buffer, first_byte, inner_bytes))
	return NULL_RTX;
    }

  return native_decode_rtx (outermode, buffer, 0);
}
/* Simplify SUBREG:OUTERMODE(OP:INNERMODE, BYTE)
   Return 0 if no simplifications are possible.  */
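/* For example, a subreg that selects one whole element of a
   (vec_duplicate X) simplifies to X, and a SUBREG of a SUBREG folds
   to a single SUBREG of the innermost value when the offsets allow
   it.  */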
rtx
simplify_subreg (machine_mode outermode, rtx op,
		 machine_mode innermode, poly_uint64 byte)
{
  /* Little bit of sanity checking.  */
  gcc_assert (innermode != VOIDmode);
  gcc_assert (outermode != VOIDmode);
  gcc_assert (innermode != BLKmode);
  gcc_assert (outermode != BLKmode);

  gcc_assert (GET_MODE (op) == innermode
	      || GET_MODE (op) == VOIDmode);

  poly_uint64 outersize = GET_MODE_SIZE (outermode);
  if (!multiple_p (byte, outersize))
    return NULL_RTX;

  poly_uint64 innersize = GET_MODE_SIZE (innermode);
  if (maybe_ge (byte, innersize))
    return NULL_RTX;

  if (outermode == innermode && known_eq (byte, 0U))
    return op;

  if (GET_CODE (op) == CONST_VECTOR)
    byte = simplify_const_vector_byte_offset (op, byte);

  if (multiple_p (byte, GET_MODE_UNIT_SIZE (innermode)))
    {
      rtx elt;

      if (VECTOR_MODE_P (outermode)
	  && GET_MODE_INNER (outermode) == GET_MODE_INNER (innermode)
	  && vec_duplicate_p (op, &elt))
	return gen_vec_duplicate (outermode, elt);

      if (outermode == GET_MODE_INNER (innermode)
	  && vec_duplicate_p (op, &elt))
	return elt;
    }

  if (CONST_SCALAR_INT_P (op)
      || CONST_DOUBLE_AS_FLOAT_P (op)
      || CONST_FIXED_P (op)
      || GET_CODE (op) == CONST_VECTOR)
    {
      unsigned HOST_WIDE_INT cbyte;
      if (byte.is_constant (&cbyte))
	{
	  if (GET_CODE (op) == CONST_VECTOR && VECTOR_MODE_P (outermode))
	    {
	      rtx tmp = simplify_const_vector_subreg (outermode, op,
						      innermode, cbyte);
	      if (tmp)
		return tmp;
	    }

	  fixed_size_mode fs_outermode;
	  if (is_a <fixed_size_mode> (outermode, &fs_outermode))
	    return simplify_immed_subreg (fs_outermode, op, innermode, cbyte);
	}
    }
  /* Changing mode twice with SUBREG => just change it once,
     or not at all if changing back to OP's starting mode.  */
  if (GET_CODE (op) == SUBREG)
    {
      machine_mode innermostmode = GET_MODE (SUBREG_REG (op));
      poly_uint64 innermostsize = GET_MODE_SIZE (innermostmode);
      rtx newx;

      if (outermode == innermostmode
	  && known_eq (byte, 0U)
	  && known_eq (SUBREG_BYTE (op), 0))
	return SUBREG_REG (op);

      /* Work out the memory offset of the final OUTERMODE value relative
	 to the inner value of OP.  */
      poly_int64 mem_offset = subreg_memory_offset (outermode,
						    innermode, byte);
      poly_int64 op_mem_offset = subreg_memory_offset (op);
      poly_int64 final_offset = mem_offset + op_mem_offset;

      /* See whether resulting subreg will be paradoxical.  */
      if (!paradoxical_subreg_p (outermode, innermostmode))
	{
	  /* Bail out in case resulting subreg would be incorrect.  */
	  if (maybe_lt (final_offset, 0)
	      || maybe_ge (poly_uint64 (final_offset), innermostsize)
	      || !multiple_p (final_offset, outersize))
	    return NULL_RTX;
	}
      else
	{
	  poly_int64 required_offset = subreg_memory_offset (outermode,
							     innermostmode, 0);
	  if (maybe_ne (final_offset, required_offset))
	    return NULL_RTX;
	  /* Paradoxical subregs always have byte offset 0.  */
	  final_offset = 0;
	}

      /* Recurse for further possible simplifications.  */
      newx = simplify_subreg (outermode, SUBREG_REG (op), innermostmode,
			      final_offset);
      if (newx)
	return newx;
      if (validate_subreg (outermode, innermostmode,
			   SUBREG_REG (op), final_offset))
	{
	  newx = gen_rtx_SUBREG (outermode, SUBREG_REG (op), final_offset);
	  if (SUBREG_PROMOTED_VAR_P (op)
	      && SUBREG_PROMOTED_SIGN (op) >= 0
	      && GET_MODE_CLASS (outermode) == MODE_INT
	      && known_ge (outersize, innersize)
	      && known_le (outersize, innermostsize)
	      && subreg_lowpart_p (newx))
	    {
	      SUBREG_PROMOTED_VAR_P (newx) = 1;
	      SUBREG_PROMOTED_SET (newx, SUBREG_PROMOTED_GET (op));
	    }
	  return newx;
	}
      return NULL_RTX;
    }
  /* SUBREG of a hard register => just change the register number
     and/or mode.  If the hard register is not valid in that mode,
     suppress this simplification.  If the hard register is the stack,
     frame, or argument pointer, leave this as a SUBREG.  */

  if (REG_P (op) && HARD_REGISTER_P (op))
    {
      unsigned int regno, final_regno;

      regno = REGNO (op);
      final_regno = simplify_subreg_regno (regno, innermode, byte, outermode);
      if (HARD_REGISTER_NUM_P (final_regno))
	{
	  rtx x = gen_rtx_REG_offset (op, outermode, final_regno,
				      subreg_memory_offset (outermode,
							    innermode, byte));

	  /* Propagate original regno.  We don't have any way to specify
	     the offset inside original regno, so do so only for lowpart.
	     The information is used only by alias analysis that cannot
	     grok partial registers anyway.  */

	  if (known_eq (subreg_lowpart_offset (outermode, innermode), byte))
	    ORIGINAL_REGNO (x) = ORIGINAL_REGNO (op);
	  return x;
	}
    }

  /* If we have a SUBREG of a register that we are replacing and we are
     replacing it with a MEM, make a new MEM and try replacing the
     SUBREG with it.  Don't do this if the MEM has a mode-dependent address
     or if we would be widening it.  */

  if (MEM_P (op)
      && ! mode_dependent_address_p (XEXP (op, 0), MEM_ADDR_SPACE (op))
      /* Allow splitting of volatile memory references in case we don't
	 have an instruction to move the whole thing.  */
      && (! MEM_VOLATILE_P (op)
	  || ! have_insn_for (SET, innermode))
      && known_le (outersize, innersize))
    return adjust_address_nv (op, outermode, byte);
  /* Handle complex or vector values represented as CONCAT or VEC_CONCAT
     of two parts.  */
  if (GET_CODE (op) == CONCAT
      || GET_CODE (op) == VEC_CONCAT)
    {
      poly_uint64 final_offset;
      rtx part, res;

      machine_mode part_mode = GET_MODE (XEXP (op, 0));
      if (part_mode == VOIDmode)
	part_mode = GET_MODE_INNER (GET_MODE (op));
      poly_uint64 part_size = GET_MODE_SIZE (part_mode);
      if (known_lt (byte, part_size))
	{
	  part = XEXP (op, 0);
	  final_offset = byte;
	}
      else if (known_ge (byte, part_size))
	{
	  part = XEXP (op, 1);
	  final_offset = byte - part_size;
	}
      else
	return NULL_RTX;

      if (maybe_gt (final_offset + outersize, part_size))
	return NULL_RTX;

      part_mode = GET_MODE (part);
      if (part_mode == VOIDmode)
	part_mode = GET_MODE_INNER (GET_MODE (op));
      res = simplify_subreg (outermode, part, part_mode, final_offset);
      if (res)
	return res;
      if (validate_subreg (outermode, part_mode, part, final_offset))
	return gen_rtx_SUBREG (outermode, part, final_offset);
      return NULL_RTX;
    }

  /* Simplify
	(subreg (vec_merge (X)
			   (vector)
			   (const_int ((1 << N) | M)))
		(N * sizeof (outermode)))
     to
	(subreg (X) (N * sizeof (outermode)))
   */
  unsigned int idx;
  if (constant_multiple_p (byte, GET_MODE_SIZE (outermode), &idx)
      && idx < HOST_BITS_PER_WIDE_INT
      && GET_CODE (op) == VEC_MERGE
      && GET_MODE_INNER (innermode) == outermode
      && CONST_INT_P (XEXP (op, 2))
      && (UINTVAL (XEXP (op, 2)) & (HOST_WIDE_INT_1U << idx)) != 0)
    return simplify_gen_subreg (outermode, XEXP (op, 0), innermode, byte);
  /* A SUBREG resulting from a zero extension may fold to zero if
     it extracts higher bits than the ZERO_EXTEND's source bits.  */
  if (GET_CODE (op) == ZERO_EXTEND && SCALAR_INT_MODE_P (innermode))
    {
      poly_uint64 bitpos = subreg_lsb_1 (outermode, innermode, byte);
      if (known_ge (bitpos, GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))))
	return CONST0_RTX (outermode);
    }

  scalar_int_mode int_outermode, int_innermode;
  if (is_a <scalar_int_mode> (outermode, &int_outermode)
      && is_a <scalar_int_mode> (innermode, &int_innermode)
      && known_eq (byte, subreg_lowpart_offset (int_outermode, int_innermode)))
    {
      /* Handle polynomial integers.  The upper bits of a paradoxical
	 subreg are undefined, so this is safe regardless of whether
	 we're truncating or extending.  */
      if (CONST_POLY_INT_P (op))
	{
	  poly_wide_int val
	    = poly_wide_int::from (const_poly_int_value (op),
				   GET_MODE_PRECISION (int_outermode),
				   SIGNED);
	  return immed_wide_int_const (val, int_outermode);
	}

      if (GET_MODE_PRECISION (int_outermode)
	  < GET_MODE_PRECISION (int_innermode))
	{
	  rtx tem = simplify_truncation (int_outermode, op, int_innermode);
	  if (tem)
	    return tem;
	}
    }

  /* If OP is a vector comparison and the subreg is not changing the
     number of elements or the size of the elements, change the result
     of the comparison to the new mode.  */
  if (COMPARISON_P (op)
      && VECTOR_MODE_P (outermode)
      && VECTOR_MODE_P (innermode)
      && known_eq (GET_MODE_NUNITS (outermode), GET_MODE_NUNITS (innermode))
      && known_eq (GET_MODE_UNIT_SIZE (outermode),
		   GET_MODE_UNIT_SIZE (innermode)))
    return simplify_gen_relational (GET_CODE (op), outermode, innermode,
				    XEXP (op, 0), XEXP (op, 1));

  return NULL_RTX;
}
/* Make a SUBREG operation or equivalent if it folds.  */

rtx
simplify_gen_subreg (machine_mode outermode, rtx op,
		     machine_mode innermode, poly_uint64 byte)
{
  rtx newx;

  newx = simplify_subreg (outermode, op, innermode, byte);
  if (newx)
    return newx;

  if (GET_CODE (op) == SUBREG
      || GET_CODE (op) == CONCAT
      || GET_MODE (op) == VOIDmode)
    return NULL_RTX;

  if (validate_subreg (outermode, innermode, op, byte))
    return gen_rtx_SUBREG (outermode, op, byte);

  return NULL_RTX;
}
/* Generates a subreg to get the least significant part of EXPR (in mode
   INNER_MODE) to OUTER_MODE.  */
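/* For example, with 8-bit bytes and 4-byte SImode,
   lowpart_subreg (SImode, x, DImode) uses byte offset 0 on
   little-endian targets and byte offset 4 on big-endian targets,
   and may fold the subreg away entirely (e.g. when X is a constant).  */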
rtx
lowpart_subreg (machine_mode outer_mode, rtx expr,
		machine_mode inner_mode)
{
  return simplify_gen_subreg (outer_mode, expr, inner_mode,
			      subreg_lowpart_offset (outer_mode, inner_mode));
}
/* Simplify X, an rtx expression.

   Return the simplified expression or NULL if no simplifications
   were possible.

   This is the preferred entry point into the simplification routines;
   however, we still allow passes to call the more specific routines.

   Right now GCC has three (yes, three) major bodies of RTL simplification
   code that need to be unified.

	1. fold_rtx in cse.c.  This code uses various CSE specific
	   information to aid in RTL simplification.

	2. simplify_rtx in combine.c.  Similar to fold_rtx, except that
	   it uses combine specific information to aid in RTL
	   simplification.

	3. The routines in this file.

   Long term we want to only have one body of simplification code; to
   get to that state I recommend the following steps:

	1. Pore over fold_rtx & simplify_rtx and move any simplifications
	   which are not pass dependent state into these routines.

	2. As code is moved by #1, change fold_rtx & simplify_rtx to
	   use this routine whenever possible.

	3. Allow for pass dependent state to be provided to these
	   routines and add simplifications based on the pass dependent
	   state.  Remove code from cse.c & combine.c that becomes
	   redundant/dead.

    It will take time, but ultimately the compiler will be easier to
    maintain and improve.  It's totally silly that when we add a
    simplification it needs to be added to 4 places (3 for RTL
    simplification and 1 for tree simplification).  */
rtx
simplify_rtx (const_rtx x)
{
  const enum rtx_code code = GET_CODE (x);
  const machine_mode mode = GET_MODE (x);

  switch (GET_RTX_CLASS (code))
    {
    case RTX_UNARY:
      return simplify_unary_operation (code, mode,
				       XEXP (x, 0), GET_MODE (XEXP (x, 0)));
    case RTX_COMM_ARITH:
      if (swap_commutative_operands_p (XEXP (x, 0), XEXP (x, 1)))
	return simplify_gen_binary (code, mode, XEXP (x, 1), XEXP (x, 0));

      /* Fall through.  */

    case RTX_BIN_ARITH:
      return simplify_binary_operation (code, mode, XEXP (x, 0), XEXP (x, 1));

    case RTX_TERNARY:
    case RTX_BITFIELD_OPS:
      return simplify_ternary_operation (code, mode, GET_MODE (XEXP (x, 0)),
					 XEXP (x, 0), XEXP (x, 1),
					 XEXP (x, 2));

    case RTX_COMPARE:
    case RTX_COMM_COMPARE:
      return simplify_relational_operation (code, mode,
					    ((GET_MODE (XEXP (x, 0))
					      != VOIDmode)
					     ? GET_MODE (XEXP (x, 0))
					     : GET_MODE (XEXP (x, 1))),
					    XEXP (x, 0),
					    XEXP (x, 1));

    case RTX_EXTRA:
      if (code == SUBREG)
	return simplify_subreg (mode, SUBREG_REG (x),
				GET_MODE (SUBREG_REG (x)),
				SUBREG_BYTE (x));
      break;

    case RTX_OBJ:
      if (code == LO_SUM)
	{
	  /* Convert (lo_sum (high FOO) FOO) to FOO.  */
	  if (GET_CODE (XEXP (x, 0)) == HIGH
	      && rtx_equal_p (XEXP (XEXP (x, 0), 0), XEXP (x, 1)))
	    return XEXP (x, 1);
	}
      break;

    default:
      break;
    }
  return NULL;
}

#if CHECKING_P
namespace selftest {

/* Make a unique pseudo REG of mode MODE for use by selftests.  */

static rtx
make_test_reg (machine_mode mode)
{
  static int test_reg_num = LAST_VIRTUAL_REGISTER + 1;

  return gen_rtx_REG (mode, test_reg_num++);
}
/* Test vector simplifications involving VEC_DUPLICATE in which the
   operands and result have vector mode MODE.  SCALAR_REG is a pseudo
   register that holds one element of MODE.  */
static void
test_vector_ops_duplicate (machine_mode mode, rtx scalar_reg)
{
  scalar_mode inner_mode = GET_MODE_INNER (mode);
  rtx duplicate = gen_rtx_VEC_DUPLICATE (mode, scalar_reg);
  poly_uint64 nunits = GET_MODE_NUNITS (mode);
  if (GET_MODE_CLASS (mode) == MODE_VECTOR_INT)
    {
      /* Test some simple unary cases with VEC_DUPLICATE arguments.  */
      rtx not_scalar_reg = gen_rtx_NOT (inner_mode, scalar_reg);
      rtx duplicate_not = gen_rtx_VEC_DUPLICATE (mode, not_scalar_reg);
      ASSERT_RTX_EQ (duplicate,
		     simplify_unary_operation (NOT, mode,
					       duplicate_not, mode));

      rtx neg_scalar_reg = gen_rtx_NEG (inner_mode, scalar_reg);
      rtx duplicate_neg = gen_rtx_VEC_DUPLICATE (mode, neg_scalar_reg);
      ASSERT_RTX_EQ (duplicate,
		     simplify_unary_operation (NEG, mode,
					       duplicate_neg, mode));

      /* Test some simple binary cases with VEC_DUPLICATE arguments.  */
      ASSERT_RTX_EQ (duplicate,
		     simplify_binary_operation (PLUS, mode, duplicate,
						CONST0_RTX (mode)));

      ASSERT_RTX_EQ (duplicate,
		     simplify_binary_operation (MINUS, mode, duplicate,
						CONST0_RTX (mode)));

      ASSERT_RTX_PTR_EQ (CONST0_RTX (mode),
			 simplify_binary_operation (MINUS, mode, duplicate,
						    duplicate));
    }

  /* Test a scalar VEC_SELECT of a VEC_DUPLICATE.  */
  rtx zero_par = gen_rtx_PARALLEL (VOIDmode, gen_rtvec (1, const0_rtx));
  ASSERT_RTX_PTR_EQ (scalar_reg,
		     simplify_binary_operation (VEC_SELECT, inner_mode,
						duplicate, zero_par));

  unsigned HOST_WIDE_INT const_nunits;
  if (nunits.is_constant (&const_nunits))
    {
      /* And again with the final element.  */
      rtx last_index = gen_int_mode (const_nunits - 1, word_mode);
      rtx last_par = gen_rtx_PARALLEL (VOIDmode, gen_rtvec (1, last_index));
      ASSERT_RTX_PTR_EQ (scalar_reg,
			 simplify_binary_operation (VEC_SELECT, inner_mode,
						    duplicate, last_par));

      /* Test a scalar subreg of a VEC_MERGE of a VEC_DUPLICATE.  */
      rtx vector_reg = make_test_reg (mode);
      for (unsigned HOST_WIDE_INT i = 0; i < const_nunits; i++)
	{
	  if (i >= HOST_BITS_PER_WIDE_INT)
	    break;
	  rtx mask = GEN_INT ((HOST_WIDE_INT_1U << i) | (i + 1));
	  rtx vm = gen_rtx_VEC_MERGE (mode, duplicate, vector_reg, mask);
	  poly_uint64 offset = i * GET_MODE_SIZE (inner_mode);
	  ASSERT_RTX_EQ (scalar_reg,
			 simplify_gen_subreg (inner_mode, vm,
					      mode, offset));
	}
    }

  /* Test a scalar subreg of a VEC_DUPLICATE.  */
  poly_uint64 offset = subreg_lowpart_offset (inner_mode, mode);
  ASSERT_RTX_EQ (scalar_reg,
		 simplify_gen_subreg (inner_mode, duplicate,
				      mode, offset));

  machine_mode narrower_mode;
  if (maybe_ne (nunits, 2U)
      && multiple_p (nunits, 2)
      && mode_for_vector (inner_mode, 2).exists (&narrower_mode)
      && VECTOR_MODE_P (narrower_mode))
    {
      /* Test VEC_DUPLICATE of a vector.  */
      rtx_vector_builder nbuilder (narrower_mode, 2, 1);
      nbuilder.quick_push (const0_rtx);
      nbuilder.quick_push (const1_rtx);
      rtx_vector_builder builder (mode, 2, 1);
      builder.quick_push (const0_rtx);
      builder.quick_push (const1_rtx);
      ASSERT_RTX_EQ (builder.build (),
		     simplify_unary_operation (VEC_DUPLICATE, mode,
					       nbuilder.build (),
					       narrower_mode));

      /* Test VEC_SELECT of a vector.  */
      rtx vec_par
	= gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, const1_rtx, const0_rtx));
      rtx narrower_duplicate
	= gen_rtx_VEC_DUPLICATE (narrower_mode, scalar_reg);
      ASSERT_RTX_EQ (narrower_duplicate,
		     simplify_binary_operation (VEC_SELECT, narrower_mode,
						duplicate, vec_par));

      /* Test a vector subreg of a VEC_DUPLICATE.  */
      poly_uint64 offset = subreg_lowpart_offset (narrower_mode, mode);
      ASSERT_RTX_EQ (narrower_duplicate,
		     simplify_gen_subreg (narrower_mode, duplicate,
					  mode, offset));
    }
}
/* Test vector simplifications involving VEC_SERIES in which the
   operands and result have vector mode MODE.  SCALAR_REG is a pseudo
   register that holds one element of MODE.  */
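/* A (vec_series:m BASE STEP) represents the vector
   { BASE, BASE + STEP, BASE + 2 * STEP, ... }, so for example
   series_0_1 below is { 0, 1, 2, ... } and series_r_m1 is
   { r, r - 1, r - 2, ... }.  */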
static void
test_vector_ops_series (machine_mode mode, rtx scalar_reg)
{
  /* Test unary cases with VEC_SERIES arguments.  */
  scalar_mode inner_mode = GET_MODE_INNER (mode);
  rtx duplicate = gen_rtx_VEC_DUPLICATE (mode, scalar_reg);
  rtx neg_scalar_reg = gen_rtx_NEG (inner_mode, scalar_reg);
  rtx series_0_r = gen_rtx_VEC_SERIES (mode, const0_rtx, scalar_reg);
  rtx series_0_nr = gen_rtx_VEC_SERIES (mode, const0_rtx, neg_scalar_reg);
  rtx series_nr_1 = gen_rtx_VEC_SERIES (mode, neg_scalar_reg, const1_rtx);
  rtx series_r_m1 = gen_rtx_VEC_SERIES (mode, scalar_reg, constm1_rtx);
  rtx series_r_r = gen_rtx_VEC_SERIES (mode, scalar_reg, scalar_reg);
  rtx series_nr_nr = gen_rtx_VEC_SERIES (mode, neg_scalar_reg,
					 neg_scalar_reg);
  ASSERT_RTX_EQ (series_0_r,
		 simplify_unary_operation (NEG, mode, series_0_nr, mode));
  ASSERT_RTX_EQ (series_r_m1,
		 simplify_unary_operation (NEG, mode, series_nr_1, mode));
  ASSERT_RTX_EQ (series_r_r,
		 simplify_unary_operation (NEG, mode, series_nr_nr, mode));

  /* Test that a VEC_SERIES with a zero step is simplified away.  */
  ASSERT_RTX_EQ (duplicate,
		 simplify_binary_operation (VEC_SERIES, mode,
					    scalar_reg, const0_rtx));

  /* Test PLUS and MINUS with VEC_SERIES.  */
  rtx series_0_1 = gen_const_vec_series (mode, const0_rtx, const1_rtx);
  rtx series_0_m1 = gen_const_vec_series (mode, const0_rtx, constm1_rtx);
  rtx series_r_1 = gen_rtx_VEC_SERIES (mode, scalar_reg, const1_rtx);
  ASSERT_RTX_EQ (series_r_r,
		 simplify_binary_operation (PLUS, mode, series_0_r,
					    duplicate));
  ASSERT_RTX_EQ (series_r_1,
		 simplify_binary_operation (PLUS, mode, duplicate,
					    series_0_1));
  ASSERT_RTX_EQ (series_r_m1,
		 simplify_binary_operation (PLUS, mode, duplicate,
					    series_0_m1));
  ASSERT_RTX_EQ (series_0_r,
		 simplify_binary_operation (MINUS, mode, series_r_r,
					    duplicate));
  ASSERT_RTX_EQ (series_r_m1,
		 simplify_binary_operation (MINUS, mode, duplicate,
					    series_0_1));
  ASSERT_RTX_EQ (series_r_1,
		 simplify_binary_operation (MINUS, mode, duplicate,
					    series_0_m1));
  ASSERT_RTX_EQ (series_0_m1,
		 simplify_binary_operation (VEC_SERIES, mode, const0_rtx,
					    constm1_rtx));

  /* Test NEG on constant vector series.  */
  ASSERT_RTX_EQ (series_0_m1,
		 simplify_unary_operation (NEG, mode, series_0_1, mode));
  ASSERT_RTX_EQ (series_0_1,
		 simplify_unary_operation (NEG, mode, series_0_m1, mode));

  /* Test PLUS and MINUS on constant vector series.  */
  rtx scalar2 = gen_int_mode (2, inner_mode);
  rtx scalar3 = gen_int_mode (3, inner_mode);
  rtx series_1_1 = gen_const_vec_series (mode, const1_rtx, const1_rtx);
  rtx series_0_2 = gen_const_vec_series (mode, const0_rtx, scalar2);
  rtx series_1_3 = gen_const_vec_series (mode, const1_rtx, scalar3);
  ASSERT_RTX_EQ (series_1_1,
		 simplify_binary_operation (PLUS, mode, series_0_1,
					    CONST1_RTX (mode)));
  ASSERT_RTX_EQ (series_0_m1,
		 simplify_binary_operation (PLUS, mode, CONST0_RTX (mode),
					    series_0_m1));
  ASSERT_RTX_EQ (series_1_3,
		 simplify_binary_operation (PLUS, mode, series_1_1,
					    series_0_2));
  ASSERT_RTX_EQ (series_0_1,
		 simplify_binary_operation (MINUS, mode, series_1_1,
					    CONST1_RTX (mode)));
  ASSERT_RTX_EQ (series_1_1,
		 simplify_binary_operation (MINUS, mode, CONST1_RTX (mode),
					    series_0_m1));
  ASSERT_RTX_EQ (series_1_1,
		 simplify_binary_operation (MINUS, mode, series_1_3,
					    series_0_2));

  /* Test MULT between constant vectors.  */
  rtx vec2 = gen_const_vec_duplicate (mode, scalar2);
  rtx vec3 = gen_const_vec_duplicate (mode, scalar3);
  rtx scalar9 = gen_int_mode (9, inner_mode);
  rtx series_3_9 = gen_const_vec_series (mode, scalar3, scalar9);
  ASSERT_RTX_EQ (series_0_2,
		 simplify_binary_operation (MULT, mode, series_0_1, vec2));
  ASSERT_RTX_EQ (series_3_9,
		 simplify_binary_operation (MULT, mode, vec3, series_1_3));
  if (!GET_MODE_NUNITS (mode).is_constant ())
    ASSERT_FALSE (simplify_binary_operation (MULT, mode, series_0_1,
					     series_0_1));

  /* Test ASHIFT between constant vectors.  */
  ASSERT_RTX_EQ (series_0_2,
		 simplify_binary_operation (ASHIFT, mode, series_0_1,
					    CONST1_RTX (mode)));
  if (!GET_MODE_NUNITS (mode).is_constant ())
    ASSERT_FALSE (simplify_binary_operation (ASHIFT, mode, CONST1_RTX (mode),
					     series_0_1));
}
/* Verify simplify_merge_mask works correctly.  */

static void
test_vec_merge (machine_mode mode)
{
  rtx op0 = make_test_reg (mode);
  rtx op1 = make_test_reg (mode);
  rtx op2 = make_test_reg (mode);
  rtx op3 = make_test_reg (mode);
  rtx op4 = make_test_reg (mode);
  rtx op5 = make_test_reg (mode);
  rtx mask1 = make_test_reg (SImode);
  rtx mask2 = make_test_reg (SImode);
  rtx vm1 = gen_rtx_VEC_MERGE (mode, op0, op1, mask1);
  rtx vm2 = gen_rtx_VEC_MERGE (mode, op2, op3, mask1);
  rtx vm3 = gen_rtx_VEC_MERGE (mode, op4, op5, mask1);

  /* Simple vec_merge.  */
  ASSERT_EQ (op0, simplify_merge_mask (vm1, mask1, 0));
  ASSERT_EQ (op1, simplify_merge_mask (vm1, mask1, 1));
  ASSERT_EQ (NULL_RTX, simplify_merge_mask (vm1, mask2, 0));
  ASSERT_EQ (NULL_RTX, simplify_merge_mask (vm1, mask2, 1));

  /* Nested vec_merge.
     It's tempting to make this simplify right down to opN, but we don't
     because all the simplify_* functions assume that the operands have
     already been simplified.  */
  rtx nvm = gen_rtx_VEC_MERGE (mode, vm1, vm2, mask1);
  ASSERT_EQ (vm1, simplify_merge_mask (nvm, mask1, 0));
  ASSERT_EQ (vm2, simplify_merge_mask (nvm, mask1, 1));

  /* Intermediate unary op.  */
  rtx unop = gen_rtx_NOT (mode, vm1);
  ASSERT_RTX_EQ (gen_rtx_NOT (mode, op0),
		 simplify_merge_mask (unop, mask1, 0));
  ASSERT_RTX_EQ (gen_rtx_NOT (mode, op1),
		 simplify_merge_mask (unop, mask1, 1));

  /* Intermediate binary op.  */
  rtx binop = gen_rtx_PLUS (mode, vm1, vm2);
  ASSERT_RTX_EQ (gen_rtx_PLUS (mode, op0, op2),
		 simplify_merge_mask (binop, mask1, 0));
  ASSERT_RTX_EQ (gen_rtx_PLUS (mode, op1, op3),
		 simplify_merge_mask (binop, mask1, 1));

  /* Intermediate ternary op.  */
  rtx tenop = gen_rtx_FMA (mode, vm1, vm2, vm3);
  ASSERT_RTX_EQ (gen_rtx_FMA (mode, op0, op2, op4),
		 simplify_merge_mask (tenop, mask1, 0));
  ASSERT_RTX_EQ (gen_rtx_FMA (mode, op1, op3, op5),
		 simplify_merge_mask (tenop, mask1, 1));

  /* Side effects.  */
  rtx badop0 = gen_rtx_PRE_INC (mode, op0);
  rtx badvm = gen_rtx_VEC_MERGE (mode, badop0, op1, mask1);
  ASSERT_EQ (badop0, simplify_merge_mask (badvm, mask1, 0));
  ASSERT_EQ (NULL_RTX, simplify_merge_mask (badvm, mask1, 1));

  /* Called indirectly.  */
  ASSERT_RTX_EQ (gen_rtx_VEC_MERGE (mode, op0, op3, mask1),
		 simplify_rtx (nvm));
}
/* Test subregs of integer vector constant X, trying elements in
   the range [ELT_BIAS, ELT_BIAS + constant_lower_bound (NELTS)),
   where NELTS is the number of elements in X.  Subregs involving
   elements [ELT_BIAS, ELT_BIAS + FIRST_VALID) are expected to fail.  */
static void
test_vector_subregs_modes (rtx x, poly_uint64 elt_bias = 0,
			   unsigned int first_valid = 0)
{
  machine_mode inner_mode = GET_MODE (x);
  scalar_mode int_mode = GET_MODE_INNER (inner_mode);

  for (unsigned int modei = 0; modei < NUM_MACHINE_MODES; ++modei)
    {
      machine_mode outer_mode = (machine_mode) modei;
      if (!VECTOR_MODE_P (outer_mode))
	continue;

      unsigned int outer_nunits;
      if (GET_MODE_INNER (outer_mode) == int_mode
	  && GET_MODE_NUNITS (outer_mode).is_constant (&outer_nunits)
	  && multiple_p (GET_MODE_NUNITS (inner_mode), outer_nunits))
	{
	  /* Test subregs in which the outer mode is a smaller,
	     constant-sized vector of the same element type.  */
	  unsigned int limit
	    = constant_lower_bound (GET_MODE_NUNITS (inner_mode));
	  for (unsigned int elt = 0; elt < limit; elt += outer_nunits)
	    {
	      rtx expected = NULL_RTX;
	      if (elt >= first_valid)
		{
		  rtx_vector_builder builder (outer_mode, outer_nunits, 1);
		  for (unsigned int i = 0; i < outer_nunits; ++i)
		    builder.quick_push (CONST_VECTOR_ELT (x, elt + i));
		  expected = builder.build ();
		}
	      poly_uint64 byte = (elt_bias + elt) * GET_MODE_SIZE (int_mode);
	      ASSERT_RTX_EQ (expected,
			     simplify_subreg (outer_mode, x,
					      inner_mode, byte));
	    }
	}
      else if (known_eq (GET_MODE_SIZE (outer_mode),
			 GET_MODE_SIZE (inner_mode))
	       && known_eq (elt_bias, 0U)
	       && (GET_MODE_CLASS (outer_mode) != MODE_VECTOR_BOOL
		   || known_eq (GET_MODE_BITSIZE (outer_mode),
				GET_MODE_NUNITS (outer_mode)))
	       && (!FLOAT_MODE_P (outer_mode)
		   || (FLOAT_MODE_FORMAT (outer_mode)->ieee_bits
		       == GET_MODE_UNIT_PRECISION (outer_mode)))
	       && (GET_MODE_SIZE (inner_mode).is_constant ()
		   || !CONST_VECTOR_STEPPED_P (x)))
	{
	  /* Try converting to OUTER_MODE and back.  */
	  rtx outer_x = simplify_subreg (outer_mode, x, inner_mode, 0);
	  ASSERT_TRUE (outer_x != NULL_RTX);
	  ASSERT_RTX_EQ (x, simplify_subreg (inner_mode, outer_x,
					     outer_mode, 0));
	}
    }

  if (BYTES_BIG_ENDIAN == WORDS_BIG_ENDIAN)
    {
      /* Test each byte in the element range.  */
      unsigned int limit
	= constant_lower_bound (GET_MODE_SIZE (inner_mode));
      for (unsigned int i = 0; i < limit; ++i)
	{
	  unsigned int elt = i / GET_MODE_SIZE (int_mode);
	  rtx expected = NULL_RTX;
	  if (elt >= first_valid)
	    {
	      unsigned int byte_shift = i % GET_MODE_SIZE (int_mode);
	      if (BYTES_BIG_ENDIAN)
		byte_shift = GET_MODE_SIZE (int_mode) - byte_shift - 1;
	      rtx_mode_t vec_elt (CONST_VECTOR_ELT (x, elt), int_mode);
	      wide_int shifted_elt
		= wi::lrshift (vec_elt, byte_shift * BITS_PER_UNIT);
	      expected = immed_wide_int_const (shifted_elt, QImode);
	    }
	  poly_uint64 byte = elt_bias * GET_MODE_SIZE (int_mode) + i;
	  ASSERT_RTX_EQ (expected,
			 simplify_subreg (QImode, x, inner_mode, byte));
	}
    }
}
/* Test constant subregs of integer vector mode INNER_MODE, using 1
   element per pattern.  */
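/* For example, with COUNT == 8 the vector built below is
   { 8, 7, 6, 5, 4, 3, 2, 1, 8, 7, 6, 5, ... }.  */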
static void
test_vector_subregs_repeating (machine_mode inner_mode)
{
  poly_uint64 nunits = GET_MODE_NUNITS (inner_mode);
  unsigned int min_nunits = constant_lower_bound (nunits);
  scalar_mode int_mode = GET_MODE_INNER (inner_mode);
  unsigned int count = gcd (min_nunits, 8);

  rtx_vector_builder builder (inner_mode, count, 1);
  for (unsigned int i = 0; i < count; ++i)
    builder.quick_push (gen_int_mode (8 - i, int_mode));
  rtx x = builder.build ();

  test_vector_subregs_modes (x);
  if (!nunits.is_constant ())
    test_vector_subregs_modes (x, nunits - min_nunits);
}
/* Test constant subregs of integer vector mode INNER_MODE, using 2
   elements per pattern.  */
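/* For example, with COUNT == 4 the vector built below is
   { 0, 1, 2, 3, 0, -1, -2, -3, 0, -1, -2, -3, ... }: the first
   element of each pattern comes from the first group and all later
   elements repeat the second group.  */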
static void
test_vector_subregs_fore_back (machine_mode inner_mode)
{
  poly_uint64 nunits = GET_MODE_NUNITS (inner_mode);
  unsigned int min_nunits = constant_lower_bound (nunits);
  scalar_mode int_mode = GET_MODE_INNER (inner_mode);
  unsigned int count = gcd (min_nunits, 4);

  rtx_vector_builder builder (inner_mode, count, 2);
  for (unsigned int i = 0; i < count; ++i)
    builder.quick_push (gen_int_mode (i, int_mode));
  for (unsigned int i = 0; i < count; ++i)
    builder.quick_push (gen_int_mode (-(int) i, int_mode));
  rtx x = builder.build ();

  test_vector_subregs_modes (x);
  if (!nunits.is_constant ())
    test_vector_subregs_modes (x, nunits - min_nunits, count);
}
/* Test constant subregs of integer vector mode INNER_MODE, using 3
   elements per pattern.  */

static void
test_vector_subregs_stepped (machine_mode inner_mode)
{
  /* Build { 0, 1, 2, 3, ... }.  */
  scalar_mode int_mode = GET_MODE_INNER (inner_mode);
  rtx_vector_builder builder (inner_mode, 1, 3);
  for (unsigned int i = 0; i < 3; ++i)
    builder.quick_push (gen_int_mode (i, int_mode));
  rtx x = builder.build ();

  test_vector_subregs_modes (x);
}
/* Test constant subregs of integer vector mode INNER_MODE.  */

static void
test_vector_subregs (machine_mode inner_mode)
{
  test_vector_subregs_repeating (inner_mode);
  test_vector_subregs_fore_back (inner_mode);
  test_vector_subregs_stepped (inner_mode);
}
/* Verify some simplifications involving vectors.  */

static void
test_vector_ops ()
{
  for (unsigned int i = 0; i < NUM_MACHINE_MODES; ++i)
    {
      machine_mode mode = (machine_mode) i;
      if (VECTOR_MODE_P (mode))
	{
	  rtx scalar_reg = make_test_reg (GET_MODE_INNER (mode));
	  test_vector_ops_duplicate (mode, scalar_reg);
	  if (GET_MODE_CLASS (mode) == MODE_VECTOR_INT
	      && maybe_gt (GET_MODE_NUNITS (mode), 2))
	    {
	      test_vector_ops_series (mode, scalar_reg);
	      test_vector_subregs (mode);
	    }
	  test_vec_merge (mode);
	}
    }
}
template<unsigned int N>
struct simplify_const_poly_int_tests
{
  static void run ();
};

template<>
struct simplify_const_poly_int_tests<1>
{
  static void run () {}
};

/* Test various CONST_POLY_INT properties.  */

template<unsigned int N>
void
simplify_const_poly_int_tests<N>::run ()
{
  rtx x1 = gen_int_mode (poly_int64 (1, 1), QImode);
  rtx x2 = gen_int_mode (poly_int64 (-80, 127), QImode);
  rtx x3 = gen_int_mode (poly_int64 (-79, -128), QImode);
  rtx x4 = gen_int_mode (poly_int64 (5, 4), QImode);
  rtx x5 = gen_int_mode (poly_int64 (30, 24), QImode);
  rtx x6 = gen_int_mode (poly_int64 (20, 16), QImode);
  rtx x7 = gen_int_mode (poly_int64 (7, 4), QImode);
  rtx x8 = gen_int_mode (poly_int64 (30, 24), HImode);
  rtx x9 = gen_int_mode (poly_int64 (-30, -24), HImode);
  rtx x10 = gen_int_mode (poly_int64 (-31, -24), HImode);
  rtx two = GEN_INT (2);
  rtx six = GEN_INT (6);
  poly_uint64 offset = subreg_lowpart_offset (QImode, HImode);

  /* These tests only try limited operation combinations.  Fuller arithmetic
     testing is done directly on poly_ints.  */
  ASSERT_EQ (simplify_unary_operation (NEG, HImode, x8, HImode), x9);
  ASSERT_EQ (simplify_unary_operation (NOT, HImode, x8, HImode), x10);
  ASSERT_EQ (simplify_unary_operation (TRUNCATE, QImode, x8, HImode), x5);
  ASSERT_EQ (simplify_binary_operation (PLUS, QImode, x1, x2), x3);
  ASSERT_EQ (simplify_binary_operation (MINUS, QImode, x3, x1), x2);
  ASSERT_EQ (simplify_binary_operation (MULT, QImode, x4, six), x5);
  ASSERT_EQ (simplify_binary_operation (MULT, QImode, six, x4), x5);
  ASSERT_EQ (simplify_binary_operation (ASHIFT, QImode, x4, two), x6);
  ASSERT_EQ (simplify_binary_operation (IOR, QImode, x4, two), x7);
  ASSERT_EQ (simplify_subreg (HImode, x5, QImode, 0), x8);
  ASSERT_EQ (simplify_subreg (QImode, x8, HImode, offset), x5);
}
/* Run all of the selftests within this file.  */

void
simplify_rtx_c_tests ()
{
  test_vector_ops ();
  simplify_const_poly_int_tests<NUM_POLY_INT_COEFFS>::run ();
}

} // namespace selftest

#endif /* CHECKING_P */