gcc/config/aarch64/aarch64-sve.md

   1 ;; Machine description for AArch64 SVE.
   2 ;; Copyright (C) 2009-2016 Free Software Foundation, Inc.
   3 ;; Contributed by ARM Ltd.
   4 ;;
   5 ;; This file is part of GCC.
   6 ;;
   7 ;; GCC is free software; you can redistribute it and/or modify it
   8 ;; under the terms of the GNU General Public License as published by
   9 ;; the Free Software Foundation; either version 3, or (at your option)
  10 ;; any later version.
  11 ;;
  12 ;; GCC is distributed in the hope that it will be useful, but
  13 ;; WITHOUT ANY WARRANTY; without even the implied warranty of
  14 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15 ;; General Public License for more details.
  16 ;;
  17 ;; You should have received a copy of the GNU General Public License
  18 ;; along with GCC; see the file COPYING3.  If not see
  19 ;; <http://www.gnu.org/licenses/>.
  20
  21 ;; Note on the handling of big-endian SVE
  22 ;; --------------------------------------
  23 ;;
  24 ;; On big-endian systems, Advanced SIMD mov<mode> patterns act in the
  25 ;; same way as movdi or movti would: the first byte of memory goes
  26 ;; into the most significant byte of the register and the last byte
  27 ;; of memory goes into the least significant byte of the register.
  28 ;; This is the most natural ordering for Advanced SIMD and matches
  29 ;; the ABI layout for 64-bit and 128-bit vector types.
  30 ;;
  31 ;; As a result, the order of bytes within the register is what GCC
  32 ;; expects for a big-endian target, and subreg offsets therefore work
  33 ;; as expected, with the first element in memory having subreg offset 0
  34 ;; and the last element in memory having the subreg offset associated
  35 ;; with a big-endian lowpart.  However, this ordering also means that
  36 ;; GCC's lane numbering does not match the architecture's numbering:
  37 ;; GCC always treats the element at the lowest address in memory
  38 ;; (subreg offset 0) as element 0, while the architecture treats
  39 ;; the least significant end of the register as element 0.
  40 ;;
  41 ;; The situation for SVE is different.  We want the layout of the
   42 ;; SVE register to be the same for mov<mode> as it is for maskload<mode>:
  43 ;; logically, a mov<mode> load must be indistinguishable from a
  44 ;; maskload<mode> whose mask is all true.  We therefore need the
  45 ;; register layout to match LD1 rather than LDR.  The ABI layout of
  46 ;; SVE types also matches LD1 byte ordering rather than LDR byte ordering.
  47 ;;
  48 ;; As a result, the architecture lane numbering matches GCC's lane
  49 ;; numbering, with element 0 always being the first in memory.
  50 ;; However:
  51 ;;
  52 ;; - Applying a subreg offset to a register does not give the element
  53 ;;   that GCC expects: the first element in memory has the subreg offset
  54 ;;   associated with a big-endian lowpart while the last element in memory
  55 ;;   has subreg offset 0.  We handle this via TARGET_CAN_CHANGE_MODE_CLASS.
  56 ;;
  57 ;; - We cannot use LDR and STR for spill slots that might be accessed
  58 ;;   via subregs, since although the elements have the order GCC expects,
  59 ;;   the order of the bytes within the elements is different.  We instead
  60 ;;   access spill slots via LD1 and ST1, using secondary reloads to
  61 ;;   reserve a predicate register.
  62
  63
   64 ;; SVE data moves.
      ;; Expander for moves between operands of any SVE_ALL mode.  The
      ;; preparation code tries three special cases in turn (predicated
      ;; memory move, constant source, big-endian subreg move); each one
      ;; that applies ends the expansion with DONE.  The plain SET below
      ;; is emitted only when none of them applies.
   65 (define_expand "mov<mode>"
   66   [(set (match_operand:SVE_ALL 0 "nonimmediate_operand")
   67         (match_operand:SVE_ALL 1 "general_operand"))]
   68   "TARGET_SVE"
   69   {
   70     /* Use the predicated load and store patterns where possible.
   71        This is required for big-endian targets (see the comment at the
   72        head of the file) and increases the addressing choices for
   73        little-endian.  */
   74     if ((MEM_P (operands[0]) || MEM_P (operands[1]))
   75         && can_create_pseudo_p ())
   76       {
   77         aarch64_expand_sve_mem_move (operands[0], operands[1], <VPRED>mode);
   78         DONE;
   79       }
   80
          /* Constant sources are handed to aarch64_expand_mov_immediate,
             which is given gen_vec_duplicate<mode> as a generator.  */
   81     if (CONSTANT_P (operands[1]))
   82       {
   83         aarch64_expand_mov_immediate (operands[0], operands[1],
   84                                       gen_vec_duplicate<mode>);
   85         DONE;
   86       }
   87
   88     /* Optimize subregs on big-endian targets: we can use REV[BHW]
   89        instead of going through memory.  */
   90     if (BYTES_BIG_ENDIAN
   91         && aarch64_maybe_expand_sve_subreg_move (operands[0], operands[1]))
   92       DONE;
   93   }
   94 )
  95
   96 ;; A pattern for optimizing SUBREGs that have a reinterpreting effect
   97 ;; on big-endian targets; see aarch64_maybe_expand_sve_subreg_move
   98 ;; for details.  We use a special predicate for operand 2 to reduce
   99 ;; the number of patterns.
      ;; The insn is always output as "#" and is split once reload has
      ;; completed; the split body hands all three operands to
      ;; aarch64_split_sve_subreg_move.  Operand 1 is a VNx16BI predicate
      ;; register and operand 2 is matched without a mode.
  100 (define_insn_and_split "*aarch64_sve_mov<mode>_subreg_be"
  101   [(set (match_operand:SVE_ALL 0 "aarch64_sve_nonimmediate_operand" "=w")
  102         (unspec:SVE_ALL
  103           [(match_operand:VNx16BI 1 "register_operand" "Upl")
  104            (match_operand 2 "aarch64_any_register_operand" "w")]
  105           UNSPEC_REV_SUBREG))]
  106   "TARGET_SVE && BYTES_BIG_ENDIAN"
  107   "#"
  108   "&& reload_completed"
  109   [(const_int 0)]
  110   {
  111     aarch64_split_sve_subreg_move (operands[0], operands[1], operands[2]);
  112     DONE;
  113   }
  114 )
 115
  116 ;; Unpredicated moves (little-endian).  Only allow memory operations
  117 ;; during and after RA; before RA we want the predicated load and
  118 ;; store patterns to be used instead.
      ;; The four alternatives are, in order: LDR from memory, STR to
      ;; memory, a register-to-register MOV, and an immediate whose
      ;; assembly text is produced by aarch64_output_sve_mov_immediate.
      ;; Outside LRA/reload the condition only accepts a register
      ;; destination with a non-memory source.
  119 (define_insn "*aarch64_sve_mov<mode>_le"
  120   [(set (match_operand:SVE_ALL 0 "aarch64_sve_nonimmediate_operand" "=w, Utr, w, w")
  121         (match_operand:SVE_ALL 1 "aarch64_sve_general_operand" "Utr, w, w, Dn"))]
  122   "TARGET_SVE
  123    && !BYTES_BIG_ENDIAN
  124    && ((lra_in_progress || reload_completed)
  125        || (register_operand (operands[0], <MODE>mode)
  126            && nonmemory_operand (operands[1], <MODE>mode)))"
  127   "@
  128    ldr\t%0, %1
  129    str\t%1, %0
  130    mov\t%0.d, %1.d
  131    * return aarch64_output_sve_mov_immediate (operands[1]);"
  132 )
 133
  134 ;; Unpredicated moves (big-endian).  Memory accesses require secondary
  135 ;; reloads.
      ;; Only register destinations and non-memory sources are matched.
      ;; The two alternatives are a register-to-register MOV and an
      ;; immediate printed by aarch64_output_sve_mov_immediate.
  136 (define_insn "*aarch64_sve_mov<mode>_be"
  137   [(set (match_operand:SVE_ALL 0 "register_operand" "=w, w")
  138         (match_operand:SVE_ALL 1 "aarch64_nonmemory_operand" "w, Dn"))]
  139   "TARGET_SVE && BYTES_BIG_ENDIAN"
  140   "@
  141    mov\t%0.d, %1.d
  142    * return aarch64_output_sve_mov_immediate (operands[1]);"
  143 )
 144
 145 ;; Handle big-endian memory reloads.  We use byte PTRUE for all modes
 146 ;; to try to encourage reuse.
 147 (define_expand "aarch64_sve_reload_be"
 148   [(parallel
 149      [(set (match_operand 0)
 150            (match_operand 1))
 151       (clobber (match_operand:VNx16BI 2 "register_operand" "=Upl"))])]
 152   "TARGET_SVE && BYTES_BIG_ENDIAN"
 153   {
 154     /* Create a PTRUE.  */
 155     emit_move_insn (operands[2], CONSTM1_RTX (VNx16BImode));
 156
 157     /* Refer to the PTRUE in the appropriate mode for this move.  */
 158     machine_mode mode = GET_MODE (operands[0]);
 159     machine_mode pred_mode
 160       = aarch64_sve_pred_mode (GET_MODE_UNIT_SIZE (mode)).require ();
 161     rtx pred = gen_lowpart (pred_mode, operands[2]);
 162
 163     /* Emit a predicated load or store.  */
 164     aarch64_emit_sve_pred_move (operands[0], pred, operands[1]);
 165     DONE;
 166   }
 167 )
 168
  169 ;; A predicated load or store for which the predicate is known to be
  170 ;; all-true.  Note that this pattern is generated directly by
  171 ;; aarch64_emit_sve_pred_move, so changes to this pattern will
  172 ;; need changes there as well.
      ;; The insn condition requires operand 0 or operand 2 to be a
      ;; register, so memory-to-memory moves never match.  Alternative 0
      ;; is a load (LD1 with /z predication) and alternative 1 is a store
      ;; (ST1); operand 1 is the governing predicate in both.
  173 (define_insn "*pred_mov<mode>"
  174   [(set (match_operand:SVE_ALL 0 "nonimmediate_operand" "=w, m")
  175         (unspec:SVE_ALL
  176           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
  177            (match_operand:SVE_ALL 2 "nonimmediate_operand" "m, w")]
  178           UNSPEC_MERGE_PTRUE))]
  179   "TARGET_SVE
  180    && (register_operand (operands[0], <MODE>mode)
  181        || register_operand (operands[2], <MODE>mode))"
  182   "@
  183    ld1<Vesize>\t%0.<Vetype>, %1/z, %2
  184    st1<Vesize>\t%2.<Vetype>, %1, %0"
  185 )
 186
  187 (define_expand "movmisalign<mode>"
      ;; Misaligned move for SVE_ALL modes.  The expansion forwards both
      ;; operands unchanged to emit_move_insn.
  188   [(set (match_operand:SVE_ALL 0 "nonimmediate_operand")
  189         (match_operand:SVE_ALL 1 "general_operand"))]
  190   "TARGET_SVE"
  191   {
  192     /* Equivalent to a normal move for our purposes.  */
  193     emit_move_insn (operands[0], operands[1]);
  194     DONE;
  195   }
  196 )
 197
  198 (define_insn "maskload<mode><vpred>"
      ;; Predicated contiguous load.  Operand 0 is the destination
      ;; register, operand 1 the memory source and operand 2 the governing
      ;; predicate.  Emitted as LD1 with /z predication.
  199   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
  200         (unspec:SVE_ALL
  201           [(match_operand:<VPRED> 2 "register_operand" "Upl")
  202            (match_operand:SVE_ALL 1 "memory_operand" "m")]
  203           UNSPEC_LD1_SVE))]
  204   "TARGET_SVE"
  205   "ld1<Vesize>\t%0.<Vetype>, %2/z, %1"
  206 )
 207
  208 (define_insn "maskstore<mode><vpred>"
      ;; Predicated contiguous store.  Operand 0 is the memory
      ;; destination; it is marked read-write ("+m") and also appears as an
      ;; input of the unspec through (match_dup 0).  Operand 1 is the
      ;; register holding the data and operand 2 the governing predicate.
  209   [(set (match_operand:SVE_ALL 0 "memory_operand" "+m")
  210         (unspec:SVE_ALL [(match_operand:<VPRED> 2 "register_operand" "Upl")
  211                          (match_operand:SVE_ALL 1 "register_operand" "w")
  212                          (match_dup 0)]
  213                         UNSPEC_ST1_SVE))]
  214   "TARGET_SVE"
  215   "st1<Vesize>\t%1.<Vetype>, %2, %0"
  216 )
 217
  218 ;; Unpredicated gather loads.
      ;; Operand 5 is not supplied by the caller: the preparation
      ;; statement sets it to a register holding CONSTM1_RTX
      ;; (<VPRED>mode), i.e. an all-true predicate.  The emitted RTL then
      ;; has the same UNSPEC_LD1_GATHER shape as the mask_gather_load<mode>
      ;; insns.
  219 (define_expand "gather_load<mode>"
  220   [(set (match_operand:SVE_SD 0 "register_operand")
  221         (unspec:SVE_SD
  222           [(match_dup 5)
  223            (match_operand:DI 1 "aarch64_reg_or_zero")
  224            (match_operand:<V_INT_EQUIV> 2 "register_operand")
  225            (match_operand:DI 3 "const_int_operand")
  226            (match_operand:DI 4 "aarch64_gather_scale_operand_<Vesize>")
  227            (mem:BLK (scratch))]
  228           UNSPEC_LD1_GATHER))]
  229   "TARGET_SVE"
  230   {
  231     operands[5] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
  232   }
  233 )
 234
  235 ;; Predicated gather loads for 32-bit elements.  Operand 3 is true for
  236 ;; unsigned extension and false for signed extension.
      ;; The five alternatives are, in order: a vector of addresses with no
      ;; scalar base (operand 1 is zero); scalar base plus sign-extended
      ;; (SXTW) vector offsets; scalar base plus zero-extended (UXTW)
      ;; vector offsets; and the SXTW and UXTW forms again with the scale
      ;; operand 4 printed through %p4.  Operand 5 is the governing
      ;; predicate.
  237 (define_insn "mask_gather_load<mode>"
  238   [(set (match_operand:SVE_S 0 "register_operand" "=w, w, w, w, w")
  239         (unspec:SVE_S
  240           [(match_operand:<VPRED> 5 "register_operand" "Upl, Upl, Upl, Upl, Upl")
  241            (match_operand:DI 1 "aarch64_reg_or_zero" "Z, rk, rk, rk, rk")
  242            (match_operand:<V_INT_EQUIV> 2 "register_operand" "w, w, w, w, w")
  243            (match_operand:DI 3 "const_int_operand" "i, Z, Ui1, Z, Ui1")
  244            (match_operand:DI 4 "aarch64_gather_scale_operand_w" "Ui1, Ui1, Ui1, i, i")
  245            (mem:BLK (scratch))]
  246           UNSPEC_LD1_GATHER))]
  247   "TARGET_SVE"
  248   "@
  249    ld1w\t%0.s, %5/z, [%2.s]
  250    ld1w\t%0.s, %5/z, [%1, %2.s, sxtw]
  251    ld1w\t%0.s, %5/z, [%1, %2.s, uxtw]
  252    ld1w\t%0.s, %5/z, [%1, %2.s, sxtw %p4]
  253    ld1w\t%0.s, %5/z, [%1, %2.s, uxtw %p4]"
  254 )
 255
  256 ;; Predicated gather loads for 64-bit elements.  The value of operand 3
  257 ;; doesn't matter in this case.
      ;; The three alternatives are, in order: a vector of addresses with
      ;; no scalar base (operand 1 is zero); scalar base plus vector
      ;; offsets; and scalar base plus vector offsets with an LSL whose
      ;; amount is operand 4 printed through %p4.  Operand 5 is the
      ;; governing predicate.
  258 (define_insn "mask_gather_load<mode>"
  259   [(set (match_operand:SVE_D 0 "register_operand" "=w, w, w")
  260         (unspec:SVE_D
  261           [(match_operand:<VPRED> 5 "register_operand" "Upl, Upl, Upl")
  262            (match_operand:DI 1 "aarch64_reg_or_zero" "Z, rk, rk")
  263            (match_operand:<V_INT_EQUIV> 2 "register_operand" "w, w, w")
  264            (match_operand:DI 3 "const_int_operand")
  265            (match_operand:DI 4 "aarch64_gather_scale_operand_d" "Ui1, Ui1, i")
  266            (mem:BLK (scratch))]
  267           UNSPEC_LD1_GATHER))]
  268   "TARGET_SVE"
  269   "@
  270    ld1d\t%0.d, %5/z, [%2.d]
  271    ld1d\t%0.d, %5/z, [%1, %2.d]
  272    ld1d\t%0.d, %5/z, [%1, %2.d, lsl %p4]"
  273 )
 274
  275 ;; Unpredicated scatter store.
      ;; Operand 5 is not supplied by the caller: the preparation
      ;; statement sets it to a register holding CONSTM1_RTX
      ;; (<VPRED>mode), i.e. an all-true predicate.  The emitted RTL then
      ;; has the same UNSPEC_ST1_SCATTER shape as the
      ;; mask_scatter_store<mode> insns.  Operand 4 is the data to store.
  276 (define_expand "scatter_store<mode>"
  277   [(set (mem:BLK (scratch))
  278         (unspec:BLK
  279           [(match_dup 5)
  280            (match_operand:DI 0 "aarch64_reg_or_zero")
  281            (match_operand:<V_INT_EQUIV> 1 "register_operand")
  282            (match_operand:DI 2 "const_int_operand")
  283            (match_operand:DI 3 "aarch64_gather_scale_operand_<Vesize>")
  284            (match_operand:SVE_SD 4 "register_operand")]
  285           UNSPEC_ST1_SCATTER))]
  286   "TARGET_SVE"
  287   {
  288     operands[5] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
  289   }
  290 )
 291
  292 ;; Predicated scatter stores for 32-bit elements.  Operand 2 is true for
  293 ;; unsigned extension and false for signed extension.
      ;; The five alternatives are, in order: a vector of addresses with no
      ;; scalar base (operand 0 is zero); scalar base plus sign-extended
      ;; (SXTW) vector offsets; scalar base plus zero-extended (UXTW)
      ;; vector offsets; and the SXTW and UXTW forms again with the scale
      ;; operand 3 printed through %p3.  Operand 4 is the data to store and
      ;; operand 5 the governing predicate.
  294 (define_insn "mask_scatter_store<mode>"
  295   [(set (mem:BLK (scratch))
  296         (unspec:BLK
  297           [(match_operand:<VPRED> 5 "register_operand" "Upl, Upl, Upl, Upl, Upl")
  298            (match_operand:DI 0 "aarch64_reg_or_zero" "Z, rk, rk, rk, rk")
  299            (match_operand:<V_INT_EQUIV> 1 "register_operand" "w, w, w, w, w")
  300            (match_operand:DI 2 "const_int_operand" "i, Z, Ui1, Z, Ui1")
  301            (match_operand:DI 3 "aarch64_gather_scale_operand_w" "Ui1, Ui1, Ui1, i, i")
  302            (match_operand:SVE_S 4 "register_operand" "w, w, w, w, w")]
  303           UNSPEC_ST1_SCATTER))]
  304   "TARGET_SVE"
  305   "@
  306    st1w\t%4.s, %5, [%1.s]
  307    st1w\t%4.s, %5, [%0, %1.s, sxtw]
  308    st1w\t%4.s, %5, [%0, %1.s, uxtw]
  309    st1w\t%4.s, %5, [%0, %1.s, sxtw %p3]
  310    st1w\t%4.s, %5, [%0, %1.s, uxtw %p3]"
  311 )
 312
  313 ;; Predicated scatter stores for 64-bit elements.  The value of operand 2
  314 ;; doesn't matter in this case.
      ;; The three alternatives are, in order: a vector of addresses with
      ;; no scalar base (operand 0 is zero); scalar base plus vector
      ;; offsets; and scalar base plus vector offsets with an LSL whose
      ;; amount is operand 3 printed through %p3.  Operand 4 is the data to
      ;; store and operand 5 the governing predicate.
  315 (define_insn "mask_scatter_store<mode>"
  316   [(set (mem:BLK (scratch))
  317         (unspec:BLK
  318           [(match_operand:<VPRED> 5 "register_operand" "Upl, Upl, Upl")
  319            (match_operand:DI 0 "aarch64_reg_or_zero" "Z, rk, rk")
  320            (match_operand:<V_INT_EQUIV> 1 "register_operand" "w, w, w")
  321            (match_operand:DI 2 "const_int_operand")
  322            (match_operand:DI 3 "aarch64_gather_scale_operand_d" "Ui1, Ui1, i")
  323            (match_operand:SVE_D 4 "register_operand" "w, w, w")]
  324           UNSPEC_ST1_SCATTER))]
  325   "TARGET_SVE"
  326   "@
  327    st1d\t%4.d, %5, [%1.d]
  328    st1d\t%4.d, %5, [%0, %1.d]
  329    st1d\t%4.d, %5, [%0, %1.d, lsl %p3]"
  330 )
 331
  332 ;; SVE structure moves.
      ;; Expander for moves of SVE_STRUCT modes.  Big-endian memory moves
      ;; go through aarch64_expand_sve_mem_move and constant sources
      ;; through aarch64_expand_mov_immediate; anything else falls through
      ;; to the plain SET below.
  333 (define_expand "mov<mode>"
  334   [(set (match_operand:SVE_STRUCT 0 "nonimmediate_operand")
  335         (match_operand:SVE_STRUCT 1 "general_operand"))]
  336   "TARGET_SVE"
  337   {
  338     /* Big-endian loads and stores need to be done via LD1 and ST1;
  339        see the comment at the head of the file for details.  */
  340     if ((MEM_P (operands[0]) || MEM_P (operands[1]))
  341         && BYTES_BIG_ENDIAN)
  342       {
            /* This path asserts that new pseudos can still be created
               rather than testing for it.  */
  343         gcc_assert (can_create_pseudo_p ());
  344         aarch64_expand_sve_mem_move (operands[0], operands[1], <VPRED>mode);
  345         DONE;
  346       }
  347
  348     if (CONSTANT_P (operands[1]))
  349       {
  350         aarch64_expand_mov_immediate (operands[0], operands[1]);
  351         DONE;
  352       }
  353   }
  354 )
 355
  356 ;; Unpredicated structure moves (little-endian).
      ;; The operand predicates and constraints mirror the single-vector
      ;; little-endian move, but the insn is always output as "#"; the
      ;; SVE_STRUCT define_split in this file breaks it into pieces after
      ;; reload.  The length attribute is taken from <insn_length>.
  357 (define_insn "*aarch64_sve_mov<mode>_le"
  358   [(set (match_operand:SVE_STRUCT 0 "aarch64_sve_nonimmediate_operand" "=w, Utr, w, w")
  359         (match_operand:SVE_STRUCT 1 "aarch64_sve_general_operand" "Utr, w, w, Dn"))]
  360   "TARGET_SVE && !BYTES_BIG_ENDIAN"
  361   "#"
  362   [(set_attr "length" "<insn_length>")]
  363 )
 364
 365 ;; Unpredicated structure moves (big-endian).  Memory accesses require
 366 ;; secondary reloads.
 367 (define_insn "*aarch64_sve_mov<mode>_le"
 368   [(set (match_operand:SVE_STRUCT 0 "register_operand" "=w, w")
 369         (match_operand:SVE_STRUCT 1 "aarch64_nonmemory_operand" "w, Dn"))]
 370   "TARGET_SVE && BYTES_BIG_ENDIAN"
 371   "#"
 372   [(set_attr "length" "<insn_length>")]
 373 )
 374
 375 ;; Split unpredicated structure moves into pieces.  This is the same
 376 ;; for both big-endian and little-endian code, although it only needs
 377 ;; to handle memory operands for little-endian code.
 378 (define_split
 379   [(set (match_operand:SVE_STRUCT 0 "aarch64_sve_nonimmediate_operand")
 380         (match_operand:SVE_STRUCT 1 "aarch64_sve_general_operand"))]
 381   "TARGET_SVE && reload_completed"
 382   [(const_int 0)]
 383   {
 384     rtx dest = operands[0];
 385     rtx src = operands[1];
 386     if (REG_P (dest) && REG_P (src))
 387       aarch64_simd_emit_reg_reg_move (operands, <VSINGLE>mode, <vector_count>);
 388     else
 389       for (unsigned int i = 0; i < <vector_count>; ++i)
 390         {
 391           rtx subdest = simplify_gen_subreg (<VSINGLE>mode, dest, <MODE>mode,
 392                                              i * BYTES_PER_SVE_VECTOR);
 393           rtx subsrc = simplify_gen_subreg (<VSINGLE>mode, src, <MODE>mode,
 394                                             i * BYTES_PER_SVE_VECTOR);
 395           emit_insn (gen_rtx_SET (subdest, subsrc));
 396         }
 397     DONE;
 398   }
 399 )
 400
 401 ;; Predicated structure moves.  This works for both endiannesses but in
 402 ;; practice is only useful for big-endian.
 403 (define_insn_and_split "pred_mov<mode>"
 404   [(set (match_operand:SVE_STRUCT 0 "aarch64_sve_struct_nonimmediate_operand" "=w, Utx")
 405         (unspec:SVE_STRUCT
 406           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
 407            (match_operand:SVE_STRUCT 2 "aarch64_sve_struct_nonimmediate_operand" "Utx, w")]
 408           UNSPEC_MERGE_PTRUE))]
 409   "TARGET_SVE
 410    && (register_operand (operands[0], <MODE>mode)
 411        || register_operand (operands[2], <MODE>mode))"
 412   "#"
 413   "&& reload_completed"
 414   [(const_int 0)]
 415   {
 416     for (unsigned int i = 0; i < <vector_count>; ++i)
 417       {
 418         rtx subdest = simplify_gen_subreg (<VSINGLE>mode, operands[0],
 419                                            <MODE>mode,
 420                                            i * BYTES_PER_SVE_VECTOR);
 421         rtx subsrc = simplify_gen_subreg (<VSINGLE>mode, operands[2],
 422                                           <MODE>mode,
 423                                           i * BYTES_PER_SVE_VECTOR);
 424         aarch64_emit_sve_pred_move (subdest, operands[1], subsrc);
 425       }
 426     DONE;
 427   }
 428   [(set_attr "length" "<insn_length>")]
 429 )
 430
 431 (define_expand "mov<mode>"
 432   [(set (match_operand:PRED_ALL 0 "nonimmediate_operand")
 433         (match_operand:PRED_ALL 1 "general_operand"))]
 434   "TARGET_SVE"
 435   {
 436     if (GET_CODE (operands[0]) == MEM)
 437       operands[1] = force_reg (<MODE>mode, operands[1]);
 438   }
 439 )
 440
  441 (define_insn "*aarch64_sve_mov<mode>"
      ;; Predicate moves.  The condition requires operand 0 or operand 1
      ;; to be a register.  The alternatives are, in order: predicate
      ;; register copy, STR to memory, LDR from memory, PFALSE for the "Dz"
      ;; constraint, and, for "Dm", whatever aarch64_output_ptrue returns.
  442   [(set (match_operand:PRED_ALL 0 "nonimmediate_operand" "=Upa, m, Upa, Upa, Upa")
  443         (match_operand:PRED_ALL 1 "general_operand" "Upa, Upa, m, Dz, Dm"))]
  444   "TARGET_SVE
  445    && (register_operand (operands[0], <MODE>mode)
  446        || register_operand (operands[1], <MODE>mode))"
  447   "@
  448    mov\t%0.b, %1.b
  449    str\t%1, %0
  450    ldr\t%0, %1
  451    pfalse\t%0.b
  452    * return aarch64_output_ptrue (<MODE>mode, '<Vetype>');"
  453 )
 454
 455 ;; Handle extractions from a predicate by converting to an integer vector
 456 ;; and extracting from there.
 457 (define_expand "vec_extract<vpred><Vel>"
 458   [(match_operand:<VEL> 0 "register_operand")
 459    (match_operand:<VPRED> 1 "register_operand")
 460    (match_operand:SI 2 "nonmemory_operand")
 461    ;; Dummy operand to which we can attach the iterator.
 462    (reg:SVE_I V0_REGNUM)]
 463   "TARGET_SVE"
 464   {
 465     rtx tmp = gen_reg_rtx (<MODE>mode);
 466     emit_insn (gen_aarch64_sve_dup<mode>_const (tmp, operands[1],
 467                                                 CONST1_RTX (<MODE>mode),
 468                                                 CONST0_RTX (<MODE>mode)));
 469     emit_insn (gen_vec_extract<mode><Vel> (operands[0], tmp, operands[2]));
 470     DONE;
 471   }
 472 )
 473
 474 (define_expand "vec_extract<mode><Vel>"
 475   [(set (match_operand:<VEL> 0 "register_operand")
 476         (vec_select:<VEL>
 477           (match_operand:SVE_ALL 1 "register_operand")
 478           (parallel [(match_operand:SI 2 "nonmemory_operand")])))]
 479   "TARGET_SVE"
 480   {
 481     poly_int64 val;
 482     if (poly_int_rtx_p (operands[2], &val)
 483         && known_eq (val, GET_MODE_NUNITS (<MODE>mode) - 1))
 484       {
 485         /* The last element can be extracted with a LASTB and a false
 486            predicate.  */
 487         rtx sel = force_reg (<VPRED>mode, CONST0_RTX (<VPRED>mode));
 488         emit_insn (gen_extract_last_<mode> (operands[0], sel, operands[1]));
 489         DONE;
 490       }
 491     if (!CONST_INT_P (operands[2]))
 492       {
 493         /* Create an index with operand[2] as the base and -1 as the step.
 494            It will then be zero for the element we care about.  */
 495         rtx index = gen_lowpart (<VEL_INT>mode, operands[2]);
 496         index = force_reg (<VEL_INT>mode, index);
 497         rtx series = gen_reg_rtx (<V_INT_EQUIV>mode);
 498         emit_insn (gen_vec_series<v_int_equiv> (series, index, constm1_rtx));
 499
 500         /* Get a predicate that is true for only that element.  */
 501         rtx zero = CONST0_RTX (<V_INT_EQUIV>mode);
 502         rtx cmp = gen_rtx_EQ (<V_INT_EQUIV>mode, series, zero);
 503         rtx sel = gen_reg_rtx (<VPRED>mode);
 504         emit_insn (gen_vec_cmp<v_int_equiv><vpred> (sel, cmp, series, zero));
 505
 506         /* Select the element using LASTB.  */
 507         emit_insn (gen_extract_last_<mode> (operands[0], sel, operands[1]));
 508         DONE;
 509       }
 510   }
 511 )
 512
 513 ;; Extract element zero.  This is a special case because we want to force
 514 ;; the registers to be the same for the second alternative, and then
 515 ;; split the instruction into nothing after RA.
 516 (define_insn_and_split "*vec_extract<mode><Vel>_0"
 517   [(set (match_operand:<VEL> 0 "aarch64_simd_nonimmediate_operand" "=r, w, Utv")
 518         (vec_select:<VEL>
 519           (match_operand:SVE_ALL 1 "register_operand" "w, 0, w")
 520           (parallel [(const_int 0)])))]
 521   "TARGET_SVE"
 522   {
 523     operands[1] = gen_rtx_REG (<V128>mode, REGNO (operands[1]));
 524     switch (which_alternative)
 525       {
 526         case 0:
 527           return "umov\\t%<vwcore>0, %1.<Vetype>[0]";
 528         case 1:
 529           return "#";
 530         case 2:
 531           return "st1\\t{%1.<Vetype>}[0], %0";
 532         default:
 533           gcc_unreachable ();
 534       }
 535   }
 536   "&& reload_completed
 537    && REG_P (operands[0])
 538    && REGNO (operands[0]) == REGNO (operands[1])"
 539   [(const_int 0)]
 540   {
 541     emit_note (NOTE_INSN_DELETED);
 542     DONE;
 543   }
 544   [(set_attr "type" "neon_to_gp_q, untyped, neon_store1_one_lane_q")]
 545 )
 546
 547 ;; Extract an element from the Advanced SIMD portion of the register.
 548 ;; We don't just reuse the aarch64-simd.md pattern because we don't
 549 ;; want any change in lane number on big-endian targets.
 550 (define_insn "*vec_extract<mode><Vel>_v128"
 551   [(set (match_operand:<VEL> 0 "aarch64_simd_nonimmediate_operand" "=r, w, Utv")
 552         (vec_select:<VEL>
 553           (match_operand:SVE_ALL 1 "register_operand" "w, w, w")
 554           (parallel [(match_operand:SI 2 "const_int_operand")])))]
 555   "TARGET_SVE
 556    && IN_RANGE (INTVAL (operands[2]) * GET_MODE_SIZE (<VEL>mode), 1, 15)"
 557   {
 558     operands[1] = gen_rtx_REG (<V128>mode, REGNO (operands[1]));
 559     switch (which_alternative)
 560       {
 561         case 0:
 562           return "umov\\t%<vwcore>0, %1.<Vetype>[%2]";
 563         case 1:
 564           return "dup\\t%<Vetype>0, %1.<Vetype>[%2]";
 565         case 2:
 566           return "st1\\t{%1.<Vetype>}[%2], %0";
 567         default:
 568           gcc_unreachable ();
 569       }
 570   }
 571   [(set_attr "type" "neon_to_gp_q, neon_dup_q, neon_store1_one_lane_q")]
 572 )
 573
  574 ;; Extract an element in the range of DUP.  This pattern allows the
  575 ;; source and destination to be different.
      ;; The condition restricts the element's byte offset to 16..63.
  576 (define_insn "*vec_extract<mode><Vel>_dup"
  577   [(set (match_operand:<VEL> 0 "register_operand" "=w")
  578         (vec_select:<VEL>
  579           (match_operand:SVE_ALL 1 "register_operand" "w")
  580           (parallel [(match_operand:SI 2 "const_int_operand")])))]
  581   "TARGET_SVE
  582    && IN_RANGE (INTVAL (operands[2]) * GET_MODE_SIZE (<VEL>mode), 16, 63)"
  583   {
          /* Re-express the scalar destination as a <MODE>mode register so
             that it can be printed with a vector element suffix.  */
  584     operands[0] = gen_rtx_REG (<MODE>mode, REGNO (operands[0]));
  585     return "dup\t%0.<Vetype>, %1.<Vetype>[%2]";
  586   }
  587 )
 588
  589 ;; Extract an element outside the range of DUP.  This pattern requires the
  590 ;; source and destination to be the same.
      ;; The condition requires the element's byte offset to be at least
      ;; 64.  Operand 1 is tied to operand 0 through the "0" constraint.
  591 (define_insn "*vec_extract<mode><Vel>_ext"
  592   [(set (match_operand:<VEL> 0 "register_operand" "=w")
  593         (vec_select:<VEL>
  594           (match_operand:SVE_ALL 1 "register_operand" "0")
  595           (parallel [(match_operand:SI 2 "const_int_operand")])))]
  596   "TARGET_SVE && INTVAL (operands[2]) * GET_MODE_SIZE (<VEL>mode) >= 64"
  597   {
          /* Print the destination as a <MODE>mode register.  */
  598     operands[0] = gen_rtx_REG (<MODE>mode, REGNO (operands[0]));
          /* Convert the element index into a byte offset; that is what is
             printed as the EXT immediate.  */
  599     operands[2] = GEN_INT (INTVAL (operands[2]) * GET_MODE_SIZE (<VEL>mode));
  600     return "ext\t%0.b, %0.b, %0.b, #%2";
  601   }
  602 )
 603
  604 ;; Extract the last active element of operand 1 into operand 0.
  605 ;; If no elements are active, extract the last inactive element instead.
      ;; NOTE(review): in the RTL below the predicate is operand 1 and the
      ;; data vector is operand 2, so "operand 1" in the sentence above
      ;; appears to refer to the data vector -- confirm.
      ;; The two alternatives differ only in the destination: a general
      ;; register ("r") or a vector register ("w").
  606 (define_insn "extract_last_<mode>"
  607   [(set (match_operand:<VEL> 0 "register_operand" "=r, w")
  608         (unspec:<VEL>
  609           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
  610            (match_operand:SVE_ALL 2 "register_operand" "w, w")]
  611           UNSPEC_LASTB))]
  612   "TARGET_SVE"
  613   "@
  614    lastb\t%<vwcore>0, %1, %2.<Vetype>
  615    lastb\t%<Vetype>0, %1, %2.<Vetype>"
  616 )
 617
  618 (define_expand "vec_duplicate<mode>"
      ;; Broadcast scalar operand 1 to every element of operand 0.  The
      ;; generic form carries a <VPRED> scratch clobber.  Memory sources
      ;; are expanded directly to sve_ld1r<mode> instead.
  619   [(parallel
  620     [(set (match_operand:SVE_ALL 0 "register_operand")
  621           (vec_duplicate:SVE_ALL
  622             (match_operand:<VEL> 1 "aarch64_sve_dup_operand")))
  623      (clobber (scratch:<VPRED>))])]
  624   "TARGET_SVE"
  625   {
  626     if (MEM_P (operands[1]))
  627       {
              /* Load-and-replicate under an all-true predicate, passing a
                 zero vector as the last operand of sve_ld1r<mode>.  */
  628         rtx ptrue = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
  629         emit_insn (gen_sve_ld1r<mode> (operands[0], ptrue, operands[1],
  630                                        CONST0_RTX (<MODE>mode)));
  631         DONE;
  632       }
  633   }
  634 )
 635
  636 ;; Accept memory operands for the benefit of combine, and also in case
  637 ;; the scalar input gets spilled to memory during RA.  We want to split
  638 ;; the load at the first opportunity in order to allow the PTRUE to be
  639 ;; optimized with surrounding code.
      ;; Alternatives: duplicate from a general register, duplicate from a
      ;; vector register, and a memory source ("Uty") that is output as "#"
      ;; and split.  Only the memory alternative asks for a real predicate
      ;; scratch ("Upl"); the other two use "X".
  640 (define_insn_and_split "*vec_duplicate<mode>_reg"
  641   [(set (match_operand:SVE_ALL 0 "register_operand" "=w, w, w")
  642         (vec_duplicate:SVE_ALL
  643           (match_operand:<VEL> 1 "aarch64_sve_dup_operand" "r, w, Uty")))
  644    (clobber (match_scratch:<VPRED> 2 "=X, X, Upl"))]
  645   "TARGET_SVE"
  646   "@
  647    mov\t%0.<Vetype>, %<vwcore>1
  648    mov\t%0.<Vetype>, %<Vetype>1
  649    #"
  650   "&& MEM_P (operands[1])"
  651   [(const_int 0)]
  652   {
          /* If operand 2 is still a SCRATCH, allocate a fresh predicate
             register for it.  */
  653     if (GET_CODE (operands[2]) == SCRATCH)
  654       operands[2] = gen_reg_rtx (<VPRED>mode);
          /* Set the predicate to all-true, then load and replicate.  */
  655     emit_move_insn (operands[2], CONSTM1_RTX (<VPRED>mode));
  656     emit_insn (gen_sve_ld1r<mode> (operands[0], operands[2], operands[1],
  657                                    CONST0_RTX (<MODE>mode)));
  658     DONE;
  659   }
  660   [(set_attr "length" "4,4,8")]
  661 )
 662
  663 ;; This is used for vec_duplicate<mode>s from memory, but can also
  664 ;; be used by combine to optimize selects of a vec_duplicate<mode>
  665 ;; with zero.
      ;; Operand 1 is the governing predicate, operand 2 the scalar memory
      ;; source and operand 3 must satisfy aarch64_simd_imm_zero.  Emitted
      ;; as LD1R with /z predication.
  666 (define_insn "sve_ld1r<mode>"
  667   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
  668         (unspec:SVE_ALL
  669           [(match_operand:<VPRED> 1 "register_operand" "Upl")
  670            (vec_duplicate:SVE_ALL
  671              (match_operand:<VEL> 2 "aarch64_sve_ld1r_operand" "Uty"))
  672            (match_operand:SVE_ALL 3 "aarch64_simd_imm_zero")]
  673           UNSPEC_SEL))]
  674   "TARGET_SVE"
  675   "ld1r<Vesize>\t%0.<Vetype>, %1/z, %2"
  676 )
 677
  678 ;; Load 128 bits from memory and duplicate to fill a vector.  Since there
  679 ;; are so few operations on 128-bit "elements", we don't define a VNx1TI
  680 ;; and simply use vectors of bytes instead.
      ;; Operand 1 is the governing predicate and operand 2 the TImode
      ;; memory source.  Emitted as LD1RQ with /z predication.
  681 (define_insn "*sve_ld1rq<Vesize>"
  682   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
  683         (unspec:SVE_ALL
  684           [(match_operand:<VPRED> 1 "register_operand" "Upl")
  685            (match_operand:TI 2 "aarch64_sve_ld1r_operand" "Uty")]
  686           UNSPEC_LD1RQ))]
  687   "TARGET_SVE"
  688   "ld1rq<Vesize>\t%0.<Vetype>, %1/z, %2"
  689 )
 690
 691 ;; Implement a predicate broadcast by shifting the low bit of the scalar
 692 ;; input into the top bit and using a WHILELO.  An alternative would be to
 693 ;; duplicate the input and do a compare with zero.
 694 (define_expand "vec_duplicate<mode>"
 695   [(set (match_operand:PRED_ALL 0 "register_operand")
 696         (vec_duplicate:PRED_ALL (match_operand 1 "register_operand")))]
 697   "TARGET_SVE"
 698   {
 699     rtx tmp = gen_reg_rtx (DImode);
 700     rtx op1 = gen_lowpart (DImode, operands[1]);
 701     emit_insn (gen_ashldi3 (tmp, op1, gen_int_mode (63, DImode)));
 702     emit_insn (gen_while_ultdi<mode> (operands[0], const0_rtx, tmp));
 703     DONE;
 704   }
 705 )
 706
  707 (define_insn "vec_series<mode>"
      ;; Linear series: operand 1 is the base and operand 2 the step.
      ;; The alternatives are immediate base with register step, register
      ;; base with immediate step, and both in registers.  All three map
      ;; to INDEX.
  708   [(set (match_operand:SVE_I 0 "register_operand" "=w, w, w")
  709         (vec_series:SVE_I
  710           (match_operand:<VEL> 1 "aarch64_sve_index_operand" "Usi, r, r")
  711           (match_operand:<VEL> 2 "aarch64_sve_index_operand" "r, Usi, r")))]
  712   "TARGET_SVE"
  713   "@
  714    index\t%0.<Vetype>, #%1, %<vw>2
  715    index\t%0.<Vetype>, %<vw>1, #%2
  716    index\t%0.<Vetype>, %<vw>1, %<vw>2"
  717 )
 718
  719 ;; Optimize {x, x, x, x, ...} + {0, n, 2*n, 3*n, ...} if n is in range
  720 ;; of an INDEX instruction.
      ;; aarch64_check_zero_based_sve_index_immediate is used twice: as
      ;; part of the insn condition, and in the output code, where its
      ;; return value replaces operand 2 and is printed as the INDEX step.
  721 (define_insn "*vec_series<mode>_plus"
  722   [(set (match_operand:SVE_I 0 "register_operand" "=w")
  723         (plus:SVE_I
  724           (vec_duplicate:SVE_I
  725             (match_operand:<VEL> 1 "register_operand" "r"))
  726           (match_operand:SVE_I 2 "immediate_operand")))]
  727   "TARGET_SVE && aarch64_check_zero_based_sve_index_immediate (operands[2])"
  728   {
  729     operands[2] = aarch64_check_zero_based_sve_index_immediate (operands[2]);
  730     return "index\t%0.<Vetype>, %<vw>1, #%2";
  731   }
  732 )
 733
  734 ;; Unpredicated LD[234].
      ;; Operand 2 is not supplied by the caller: the preparation
      ;; statement sets it to a register holding CONSTM1_RTX
      ;; (<VPRED>mode), i.e. an all-true predicate.  The emitted RTL then
      ;; has the same UNSPEC_LDN shape as vec_mask_load_lanes<mode><vsingle>.
  735 (define_expand "vec_load_lanes<mode><vsingle>"
  736   [(set (match_operand:SVE_STRUCT 0 "register_operand")
  737         (unspec:SVE_STRUCT
  738           [(match_dup 2)
  739            (match_operand:SVE_STRUCT 1 "memory_operand")]
  740           UNSPEC_LDN))]
  741   "TARGET_SVE"
  742   {
  743     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
  744   }
  745 )
 746
  747 ;; Predicated LD[234].
      ;; Operand 0 is the destination structure register, operand 1 the
      ;; memory source and operand 2 the governing predicate.  The
      ;; mnemonic is "ld" followed by <vector_count> and <Vesize>.
  748 (define_insn "vec_mask_load_lanes<mode><vsingle>"
  749   [(set (match_operand:SVE_STRUCT 0 "register_operand" "=w")
  750         (unspec:SVE_STRUCT
  751           [(match_operand:<VPRED> 2 "register_operand" "Upl")
  752            (match_operand:SVE_STRUCT 1 "memory_operand" "m")]
  753           UNSPEC_LDN))]
  754   "TARGET_SVE"
  755   "ld<vector_count><Vesize>\t%0, %2/z, %1"
  756 )
 757
  758 ;; Unpredicated ST[234].  This is always a full update, so the dependence
  759 ;; on the old value of the memory location (via (match_dup 0)) is redundant.
  760 ;; There doesn't seem to be any obvious benefit to treating the all-true
  761 ;; case differently though.  In particular, it's very unlikely that we'll
  762 ;; only find out during RTL that a store_lanes is dead.
      ;; Operand 2 is not supplied by the caller: the preparation
      ;; statement sets it to a register holding CONSTM1_RTX
      ;; (<VPRED>mode), i.e. an all-true predicate.
  763 (define_expand "vec_store_lanes<mode><vsingle>"
  764   [(set (match_operand:SVE_STRUCT 0 "memory_operand")
  765         (unspec:SVE_STRUCT
  766           [(match_dup 2)
  767            (match_operand:SVE_STRUCT 1 "register_operand")
  768            (match_dup 0)]
  769           UNSPEC_STN))]
  770   "TARGET_SVE"
  771   {
  772     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
  773   }
  774 )
 775
 776 ;; Predicated ST[234].
     ;; Operand 2 is the governing predicate and operand 1 the register tuple
     ;; to store.  The memory operand is read-write ("+m") and also appears
     ;; as an input through (match_dup 0).
 777 (define_insn "vec_mask_store_lanes<mode><vsingle>"
 778   [(set (match_operand:SVE_STRUCT 0 "memory_operand" "+m")
 779         (unspec:SVE_STRUCT
 780           [(match_operand:<VPRED> 2 "register_operand" "Upl")
 781            (match_operand:SVE_STRUCT 1 "register_operand" "w")
 782            (match_dup 0)]
 783           UNSPEC_STN))]
 784   "TARGET_SVE"
 785   "st<vector_count><Vesize>\t%1, %2, %0"
 786 )
 787
     ;; Permute expander.  Operand 0 is the destination, operands 1 and 2
     ;; are vector inputs and operand 3 has the integer-equivalent mode.
     ;; Only enabled when the number of units in <MODE>mode is a compile-time
     ;; constant; all of the work is delegated to aarch64_expand_sve_vec_perm.
 788 (define_expand "vec_perm<mode>"
 789   [(match_operand:SVE_ALL 0 "register_operand")
 790    (match_operand:SVE_ALL 1 "register_operand")
 791    (match_operand:SVE_ALL 2 "register_operand")
 792    (match_operand:<V_INT_EQUIV> 3 "aarch64_sve_vec_perm_operand")]
 793   "TARGET_SVE && GET_MODE_NUNITS (<MODE>mode).is_constant ()"
 794   {
 795     aarch64_expand_sve_vec_perm (operands[0], operands[1],
 796                                  operands[2], operands[3]);
 797     DONE;
 798   }
 799 )
 800
     ;; TBL.  Operand 1 has the vector mode itself and operand 2 the
     ;; integer-equivalent mode (presumably the vector of indices -- confirm
     ;; against the code that generates UNSPEC_TBL).
 801 (define_insn "*aarch64_sve_tbl<mode>"
 802   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
 803         (unspec:SVE_ALL
 804           [(match_operand:SVE_ALL 1 "register_operand" "w")
 805            (match_operand:<V_INT_EQUIV> 2 "register_operand" "w")]
 806           UNSPEC_TBL))]
 807   "TARGET_SVE"
 808   "tbl\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
 809 )
 810
     ;; Two-input permutes of predicate registers, one instance per PERMUTE
     ;; unspec.  The mnemonic is assembled from <perm_insn> and <perm_hilo>.
 811 (define_insn "*aarch64_sve_<perm_insn><perm_hilo><mode>"
 812   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
 813         (unspec:PRED_ALL [(match_operand:PRED_ALL 1 "register_operand" "Upa")
 814                           (match_operand:PRED_ALL 2 "register_operand" "Upa")]
 815                          PERMUTE))]
 816   "TARGET_SVE"
 817   "<perm_insn><perm_hilo>\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
 818 )
 819
     ;; Two-input permutes of data vectors, one instance per PERMUTE unspec.
     ;; Same shape and output template as the predicate version, but on the
     ;; SVE_ALL modes and "w" registers.
 820 (define_insn "*aarch64_sve_<perm_insn><perm_hilo><mode>"
 821   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
 822         (unspec:SVE_ALL [(match_operand:SVE_ALL 1 "register_operand" "w")
 823                          (match_operand:SVE_ALL 2 "register_operand" "w")]
 824                         PERMUTE))]
 825   "TARGET_SVE"
 826   "<perm_insn><perm_hilo>\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
 827 )
 828
     ;; UNSPEC_REV64 on the SVE_BHS modes, wrapped in UNSPEC_MERGE_PTRUE.
     ;; The instruction is printed on .d elements, so the governing predicate
     ;; (operand 1) is always VNx2BI regardless of <MODE>; <Vesize> selects
     ;; the REVB/REVH/... variant.
 829 (define_insn "*aarch64_sve_rev64<mode>"
 830   [(set (match_operand:SVE_BHS 0 "register_operand" "=w")
 831         (unspec:SVE_BHS
 832           [(match_operand:VNx2BI 1 "register_operand" "Upl")
 833            (unspec:SVE_BHS [(match_operand:SVE_BHS 2 "register_operand" "w")]
 834                            UNSPEC_REV64)]
 835           UNSPEC_MERGE_PTRUE))]
 836   "TARGET_SVE"
 837   "rev<Vesize>\t%0.d, %1/m, %2.d"
 838 )
 839
     ;; UNSPEC_REV32 on the SVE_BH modes, wrapped in UNSPEC_MERGE_PTRUE.
     ;; The instruction is printed on .s elements, so the governing predicate
     ;; (operand 1) is always VNx4BI.
 840 (define_insn "*aarch64_sve_rev32<mode>"
 841   [(set (match_operand:SVE_BH 0 "register_operand" "=w")
 842         (unspec:SVE_BH
 843           [(match_operand:VNx4BI 1 "register_operand" "Upl")
 844            (unspec:SVE_BH [(match_operand:SVE_BH 2 "register_operand" "w")]
 845                           UNSPEC_REV32)]
 846           UNSPEC_MERGE_PTRUE))]
 847   "TARGET_SVE"
 848   "rev<Vesize>\t%0.s, %1/m, %2.s"
 849 )
 850
     ;; UNSPEC_REV16 on VNx16QI only, wrapped in UNSPEC_MERGE_PTRUE.  Printed
     ;; as REVB on .h elements, with a VNx8BI governing predicate (operand 1).
 851 (define_insn "*aarch64_sve_rev16vnx16qi"
 852   [(set (match_operand:VNx16QI 0 "register_operand" "=w")
 853         (unspec:VNx16QI
 854           [(match_operand:VNx8BI 1 "register_operand" "Upl")
 855            (unspec:VNx16QI [(match_operand:VNx16QI 2 "register_operand" "w")]
 856                            UNSPEC_REV16)]
 857           UNSPEC_MERGE_PTRUE))]
 858   "TARGET_SVE"
 859   "revb\t%0.h, %1/m, %2.h"
 860 )
 861
     ;; Unpredicated REV of a whole vector (UNSPEC_REV), printed with the
     ;; element size of <MODE>.
 862 (define_insn "*aarch64_sve_rev<mode>"
 863   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
 864         (unspec:SVE_ALL [(match_operand:SVE_ALL 1 "register_operand" "w")]
 865                         UNSPEC_REV))]
 866   "TARGET_SVE"
 867   "rev\t%0.<Vetype>, %1.<Vetype>")
 868
     ;; Duplicate lane operand 2 of operand 1 across the whole result.
     ;; Operand 2 is a lane index; the pattern only matches when the
     ;; corresponding byte offset (index * element size) is in [0, 63].
 869 (define_insn "*aarch64_sve_dup_lane<mode>"
 870   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
 871         (vec_duplicate:SVE_ALL
 872           (vec_select:<VEL>
 873             (match_operand:SVE_ALL 1 "register_operand" "w")
 874             (parallel [(match_operand:SI 2 "const_int_operand")]))))]
 875   "TARGET_SVE
 876    && IN_RANGE (INTVAL (operands[2]) * GET_MODE_SIZE (<VEL>mode), 0, 63)"
 877   "dup\t%0.<Vetype>, %1.<Vetype>[%2]"
 878 )
 879
 880 ;; Note that the immediate (third) operand is the lane index not
 881 ;; the byte index.
     ;; The insn condition requires the equivalent byte offset (lane index *
     ;; element size) to be in [0, 255], and the output code rewrites
     ;; operand 3 to that byte offset before printing, since EXT is always
     ;; emitted on .b elements.  Operand 1 is tied to the destination.
 882 (define_insn "*aarch64_sve_ext<mode>"
 883   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
 884         (unspec:SVE_ALL [(match_operand:SVE_ALL 1 "register_operand" "0")
 885                          (match_operand:SVE_ALL 2 "register_operand" "w")
 886                          (match_operand:SI 3 "const_int_operand")]
 887                         UNSPEC_EXT))]
 888   "TARGET_SVE
 889    && IN_RANGE (INTVAL (operands[3]) * GET_MODE_SIZE (<VEL>mode), 0, 255)"
 890   {
 891     operands[3] = GEN_INT (INTVAL (operands[3]) * GET_MODE_SIZE (<VEL>mode));
 892     return "ext\\t%0.b, %0.b, %2.b, #%3";
 893   }
 894 )
 895
     ;; Unpredicated integer vector addition.  The alternatives are:
     ;;   1. ADD of an immediate (printed with %D2);
     ;;   2. SUB of an immediate (printed with %N2, presumably the negated
     ;;      value);
     ;;   3. whatever aarch64_output_sve_inc_dec_immediate returns for
     ;;      operand 2;
     ;;   4. ADD of two registers.
     ;; The first three alternatives tie operand 1 to the destination.
 896 (define_insn "add<mode>3"
 897   [(set (match_operand:SVE_I 0 "register_operand" "=w, w, w, w")
 898         (plus:SVE_I
 899           (match_operand:SVE_I 1 "register_operand" "%0, 0, 0, w")
 900           (match_operand:SVE_I 2 "aarch64_sve_add_operand" "vsa, vsn, vsi, w")))]
 901   "TARGET_SVE"
 902   "@
 903    add\t%0.<Vetype>, %0.<Vetype>, #%D2
 904    sub\t%0.<Vetype>, %0.<Vetype>, #%N2
 905    * return aarch64_output_sve_inc_dec_immediate (\"%0.<Vetype>\", operands[2]);
 906    add\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
 907 )
 908
     ;; Unpredicated integer vector subtraction (operand 1 - operand 2).
     ;; The first alternative is a register SUB.  The second handles an
     ;; immediate minuend: operand 2 is tied to the destination and SUBR is
     ;; emitted with the immediate from operand 1.
 909 (define_insn "sub<mode>3"
 910   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
 911         (minus:SVE_I
 912           (match_operand:SVE_I 1 "aarch64_sve_arith_operand" "w, vsa")
 913           (match_operand:SVE_I 2 "register_operand" "w, 0")))]
 914   "TARGET_SVE"
 915   "@
 916    sub\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>
 917    subr\t%0.<Vetype>, %0.<Vetype>, #%D1"
 918 )
 919
 920 ;; Unpredicated multiplication.
     ;; Wraps the MULT in UNSPEC_MERGE_PTRUE.  Operand 3, the predicate, is
     ;; created here as CONSTM1_RTX of the predicate mode, forced into a
     ;; register.
 921 (define_expand "mul<mode>3"
 922   [(set (match_operand:SVE_I 0 "register_operand")
 923         (unspec:SVE_I
 924           [(match_dup 3)
 925            (mult:SVE_I
 926              (match_operand:SVE_I 1 "register_operand")
 927              (match_operand:SVE_I 2 "aarch64_sve_mul_operand"))]
 928           UNSPEC_MERGE_PTRUE))]
 929   "TARGET_SVE"
 930   {
 931     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
 932   }
 933 )
 934
 935 ;; Multiplication predicated with a PTRUE.  We don't actually need the
 936 ;; predicate for the first alternative, but using Upa or X isn't likely
 937 ;; to gain much and would make the instruction seem less uniform to the
 938 ;; register allocator.
     ;; Alternative 1 multiplies by an immediate and does not print the
     ;; predicate; alternative 2 is the predicated register form.  Both tie
     ;; operand 2 to the destination.
 939 (define_insn "*mul<mode>3"
 940   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
 941         (unspec:SVE_I
 942           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
 943            (mult:SVE_I
 944              (match_operand:SVE_I 2 "register_operand" "%0, 0")
 945              (match_operand:SVE_I 3 "aarch64_sve_mul_operand" "vsm, w"))]
 946           UNSPEC_MERGE_PTRUE))]
 947   "TARGET_SVE"
 948   "@
 949    mul\t%0.<Vetype>, %0.<Vetype>, #%3
 950    mul\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
 951 )
 952
     ;; Integer multiply-add: (operand 2 * operand 3) + operand 4, where the
     ;; multiplication is predicated by operand 1.
     ;;   Alternative 1 ties a multiplicand (operand 2) to the destination
     ;;   and emits MAD with operands 3 and 4.
     ;;   Alternative 2 ties the addend (operand 4) to the destination and
     ;;   emits MLA with operands 2 and 3.
 953 (define_insn "*madd<mode>"
 954   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
 955         (plus:SVE_I
 956           (unspec:SVE_I
 957             [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
 958              (mult:SVE_I (match_operand:SVE_I 2 "register_operand" "%0, w")
 959                          (match_operand:SVE_I 3 "register_operand" "w, w"))]
 960             UNSPEC_MERGE_PTRUE)
 961           (match_operand:SVE_I 4 "register_operand" "w, 0")))]
 962   "TARGET_SVE"
 963   "@
 964    mad\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>
 965    mla\t%0.<Vetype>, %1/m, %2.<Vetype>, %3.<Vetype>"
 966 )
 967
     ;; Integer multiply-subtract: operand 4 - (operand 2 * operand 3), where
     ;; the multiplication is predicated by operand 1.
     ;;   Alternative 1 ties a multiplicand (operand 2) to the destination
     ;;   and emits MSB with operands 3 and 4.
     ;;   Alternative 2 ties the minuend (operand 4) to the destination and
     ;;   emits MLS with operands 2 and 3.
 968 (define_insn "*msub<mode>3"
 969   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
 970         (minus:SVE_I
 971           (match_operand:SVE_I 4 "register_operand" "w, 0")
 972           (unspec:SVE_I
 973             [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
 974              (mult:SVE_I (match_operand:SVE_I 2 "register_operand" "%0, w")
 975                          (match_operand:SVE_I 3 "register_operand" "w, w"))]
 976             UNSPEC_MERGE_PTRUE)))]
 977   "TARGET_SVE"
 978   "@
 979    msb\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>
 980    mls\t%0.<Vetype>, %1/m, %2.<Vetype>, %3.<Vetype>"
 981 )
 982
 983 ;; Unpredicated NEG, NOT and POPCOUNT.
     ;; One expander per SVE_INT_UNARY code.  The operation is wrapped in
     ;; UNSPEC_MERGE_PTRUE, with operand 2 created here as CONSTM1_RTX of the
     ;; predicate mode, forced into a register.
 984 (define_expand "<optab><mode>2"
 985   [(set (match_operand:SVE_I 0 "register_operand")
 986         (unspec:SVE_I
 987           [(match_dup 2)
 988            (SVE_INT_UNARY:SVE_I (match_operand:SVE_I 1 "register_operand"))]
 989           UNSPEC_MERGE_PTRUE))]
 990   "TARGET_SVE"
 991   {
 992     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
 993   }
 994 )
 995
 996 ;; NEG, NOT and POPCOUNT predicated with a PTRUE.
     ;; Operand 1 is the governing predicate (merging, %1/m) and operand 2
     ;; the input vector.  The mnemonic comes from <sve_int_op>.
 997 (define_insn "*<optab><mode>2"
 998   [(set (match_operand:SVE_I 0 "register_operand" "=w")
 999         (unspec:SVE_I
1000           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1001            (SVE_INT_UNARY:SVE_I
1002              (match_operand:SVE_I 2 "register_operand" "w"))]
1003           UNSPEC_MERGE_PTRUE))]
1004   "TARGET_SVE"
1005   "<sve_int_op>\t%0.<Vetype>, %1/m, %2.<Vetype>"
1006 )
1007
1008 ;; Vector AND, ORR and XOR.
     ;; Alternative 1 takes an immediate (printed with %C2) and ties
     ;; operand 1 to the destination; it is printed with the element size of
     ;; <MODE>.  Alternative 2 is the register form, which is always printed
     ;; on .d elements (presumably because a bitwise operation gives the same
     ;; result for every element size).
1009 (define_insn "<optab><mode>3"
1010   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
1011         (LOGICAL:SVE_I
1012           (match_operand:SVE_I 1 "register_operand" "%0, w")
1013           (match_operand:SVE_I 2 "aarch64_sve_logical_operand" "vsl, w")))]
1014   "TARGET_SVE"
1015   "@
1016    <logical>\t%0.<Vetype>, %0.<Vetype>, #%C2
1017    <logical>\t%0.d, %1.d, %2.d"
1018 )
1019
1020 ;; Vector AND, ORR and XOR on floating-point modes.  We avoid subregs
1021 ;; by providing this, but we need to use UNSPECs since rtx logical ops
1022 ;; aren't defined for floating-point modes.
     ;; One instance per LOGICALF unspec; register operands only, always
     ;; printed on .d elements.
1023 (define_insn "*<optab><mode>3"
1024   [(set (match_operand:SVE_F 0 "register_operand" "=w")
1025         (unspec:SVE_F [(match_operand:SVE_F 1 "register_operand" "w")
1026                        (match_operand:SVE_F 2 "register_operand" "w")]
1027                       LOGICALF))]
1028   "TARGET_SVE"
1029   "<logicalf_op>\t%0.d, %1.d, %2.d"
1030 )
1031
1032 ;; REG_EQUAL notes on the unpredicated NOT expansion ("<optab><mode>2"
1033 ;; above) should ensure that we can generate this pattern even though the
     ;; NOT instruction itself is predicated.
     ;; Computes operand 2 AND (NOT operand 1); note that the assembly
     ;; operands are printed in the opposite order (%2 before %1).
1034 (define_insn "bic<mode>3"
1035   [(set (match_operand:SVE_I 0 "register_operand" "=w")
1036         (and:SVE_I
1037           (not:SVE_I (match_operand:SVE_I 1 "register_operand" "w"))
1038           (match_operand:SVE_I 2 "register_operand" "w")))]
1039   "TARGET_SVE"
1040   "bic\t%0.d, %2.d, %1.d"
1041 )
1042
1043 ;; Predicate AND.  We can reuse one of the inputs as the GP.
     ;; Operand 1 is printed twice: as the governing predicate (%1/z) and as
     ;; the first source.
1044 (define_insn "and<mode>3"
1045   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1046         (and:PRED_ALL (match_operand:PRED_ALL 1 "register_operand" "Upa")
1047                       (match_operand:PRED_ALL 2 "register_operand" "Upa")))]
1048   "TARGET_SVE"
1049   "and\t%0.b, %1/z, %1.b, %2.b"
1050 )
1051
1052 ;; Unpredicated predicate ORR and XOR.
     ;; The operation is expressed as (and (op 1 2) 3), where operand 3 is
     ;; created here as CONSTM1_RTX of the predicate mode, forced into a
     ;; register.  This gives the same RTL shape as the predicated pattern.
1053 (define_expand "<optab><mode>3"
1054   [(set (match_operand:PRED_ALL 0 "register_operand")
1055         (and:PRED_ALL
1056           (LOGICAL_OR:PRED_ALL
1057             (match_operand:PRED_ALL 1 "register_operand")
1058             (match_operand:PRED_ALL 2 "register_operand"))
1059           (match_dup 3)))]
1060   "TARGET_SVE"
1061   {
1062     operands[3] = force_reg (<MODE>mode, CONSTM1_RTX (<MODE>mode));
1063   }
1064 )
1065
1066 ;; Predicated predicate AND, ORR and XOR.
     ;; Operand 1 is the governing predicate (zeroing, %1/z); operands 2 and
     ;; 3 are the inputs.  This is a named pattern: the cbranch expander in
     ;; this file calls gen_pred_xor<mode>3.
1067 (define_insn "pred_<optab><mode>3"
1068   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1069         (and:PRED_ALL
1070           (LOGICAL:PRED_ALL
1071             (match_operand:PRED_ALL 2 "register_operand" "Upa")
1072             (match_operand:PRED_ALL 3 "register_operand" "Upa"))
1073           (match_operand:PRED_ALL 1 "register_operand" "Upa")))]
1074   "TARGET_SVE"
1075   "<logical>\t%0.b, %1/z, %2.b, %3.b"
1076 )
1077
1078 ;; Perform a logical operation on operands 2 and 3, using operand 1 as
1079 ;; the GP (which is known to be a PTRUE).  Store the result in operand 0
1080 ;; and set the flags in the same way as for PTEST.  The (and ...) in the
1081 ;; UNSPEC_PTEST_PTRUE is logically redundant, but means that the tested
1082 ;; value is structurally equivalent to rhs of the second set.
     ;; The output is the same instruction as the non-flag-setting pattern
     ;; with an "s" suffix on the mnemonic.
1083 (define_insn "*<optab><mode>3_cc"
1084   [(set (reg:CC CC_REGNUM)
1085         (compare:CC
1086           (unspec:SI [(match_operand:PRED_ALL 1 "register_operand" "Upa")
1087                       (and:PRED_ALL
1088                         (LOGICAL:PRED_ALL
1089                           (match_operand:PRED_ALL 2 "register_operand" "Upa")
1090                           (match_operand:PRED_ALL 3 "register_operand" "Upa"))
1091                         (match_dup 1))]
1092                      UNSPEC_PTEST_PTRUE)
1093           (const_int 0)))
1094    (set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1095         (and:PRED_ALL (LOGICAL:PRED_ALL (match_dup 2) (match_dup 3))
1096                       (match_dup 1)))]
1097   "TARGET_SVE"
1098   "<logical>s\t%0.b, %1/z, %2.b, %3.b"
1099 )
1100
1101 ;; Unpredicated predicate inverse.
     ;; Expressed as (and (not 1) 2), where operand 2 is created here as
     ;; CONSTM1_RTX of the predicate mode, forced into a register.
1102 (define_expand "one_cmpl<mode>2"
1103   [(set (match_operand:PRED_ALL 0 "register_operand")
1104         (and:PRED_ALL
1105           (not:PRED_ALL (match_operand:PRED_ALL 1 "register_operand"))
1106           (match_dup 2)))]
1107   "TARGET_SVE"
1108   {
1109     operands[2] = force_reg (<MODE>mode, CONSTM1_RTX (<MODE>mode));
1110   }
1111 )
1112
1113 ;; Predicated predicate inverse.
     ;; Operand 1 is the governing predicate (zeroing, %1/z) and operand 2
     ;; the predicate being inverted.
1114 (define_insn "*one_cmpl<mode>3"
1115   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1116         (and:PRED_ALL
1117           (not:PRED_ALL (match_operand:PRED_ALL 2 "register_operand" "Upa"))
1118           (match_operand:PRED_ALL 1 "register_operand" "Upa")))]
1119   "TARGET_SVE"
1120   "not\t%0.b, %1/z, %2.b"
1121 )
1122
1123 ;; Predicated predicate BIC and ORN.
     ;; Operand 1 is the governing predicate.  Operand 2 is the input that
     ;; is inverted in the RTL; it is printed as the last assembly operand,
     ;; after operand 3.
1124 (define_insn "*<nlogical><mode>3"
1125   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1126         (and:PRED_ALL
1127           (NLOGICAL:PRED_ALL
1128             (not:PRED_ALL (match_operand:PRED_ALL 2 "register_operand" "Upa"))
1129             (match_operand:PRED_ALL 3 "register_operand" "Upa"))
1130           (match_operand:PRED_ALL 1 "register_operand" "Upa")))]
1131   "TARGET_SVE"
1132   "<nlogical>\t%0.b, %1/z, %3.b, %2.b"
1133 )
1134
1135 ;; Predicated predicate NAND and NOR.
     ;; Matches an NLOGICAL operation in which both inputs (operands 2 and 3)
     ;; are inverted; operand 1 is the governing predicate.  The mnemonic
     ;; comes from <logical_nn>.
1136 (define_insn "*<logical_nn><mode>3"
1137   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1138         (and:PRED_ALL
1139           (NLOGICAL:PRED_ALL
1140             (not:PRED_ALL (match_operand:PRED_ALL 2 "register_operand" "Upa"))
1141             (not:PRED_ALL (match_operand:PRED_ALL 3 "register_operand" "Upa")))
1142           (match_operand:PRED_ALL 1 "register_operand" "Upa")))]
1143   "TARGET_SVE"
1144   "<logical_nn>\t%0.b, %1/z, %2.b, %3.b"
1145 )
1146
1147 ;; Unpredicated LSL, LSR and ASR by a vector.
     ;; Operand 2 is a vector of shift amounts that must satisfy
     ;; aarch64_sve_<lr>shift_operand.  The shift is wrapped in
     ;; UNSPEC_MERGE_PTRUE, with operand 3 created here as CONSTM1_RTX of the
     ;; predicate mode, forced into a register.
1148 (define_expand "v<optab><mode>3"
1149   [(set (match_operand:SVE_I 0 "register_operand")
1150         (unspec:SVE_I
1151           [(match_dup 3)
1152            (ASHIFT:SVE_I
1153              (match_operand:SVE_I 1 "register_operand")
1154              (match_operand:SVE_I 2 "aarch64_sve_<lr>shift_operand"))]
1155           UNSPEC_MERGE_PTRUE))]
1156   "TARGET_SVE"
1157   {
1158     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1159   }
1160 )
1161
1162 ;; LSL, LSR and ASR by a vector, predicated with a PTRUE.  We don't
1163 ;; actually need the predicate for the first alternative, but using Upa
1164 ;; or X isn't likely to gain much and would make the instruction seem
1165 ;; less uniform to the register allocator.
     ;; Alternative 1 shifts by an immediate and is not destructive (the
     ;; input can be any register).  Alternative 2 shifts by a register
     ;; vector and ties operand 2 to the destination.
1166 (define_insn "*v<optab><mode>3"
1167   [(set (match_operand:SVE_I 0 "register_operand" "=w, w")
1168         (unspec:SVE_I
1169           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1170            (ASHIFT:SVE_I
1171              (match_operand:SVE_I 2 "register_operand" "w, 0")
1172              (match_operand:SVE_I 3 "aarch64_sve_<lr>shift_operand" "D<lr>, w"))]
1173           UNSPEC_MERGE_PTRUE))]
1174   "TARGET_SVE"
1175   "@
1176    <shift>\t%0.<Vetype>, %2.<Vetype>, #%3
1177    <shift>\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
1178 )
1179
1180 ;; LSL, LSR and ASR by a scalar, which expands into one of the vector
1181 ;; shifts above.
     ;; Operand 1 is the vector to shift and operand 2 the scalar amount.
     ;; A CONST_INT amount is turned into a constant vector, which is passed
     ;; on unchanged if it is a valid operand for the vector shift pattern
     ;; and forced into a register otherwise.  Any other amount is converted
     ;; to the element mode and broadcast into a new register.
1182 (define_expand "<ASHIFT:optab><mode>3"
1183   [(set (match_operand:SVE_I 0 "register_operand")
1184         (ASHIFT:SVE_I (match_operand:SVE_I 1 "register_operand")
1185                       (match_operand:<VEL> 2 "general_operand")))]
1186   "TARGET_SVE"
1187   {
1188     rtx amount;
1189     if (CONST_INT_P (operands[2]))
1190       {
1191         amount = gen_const_vec_duplicate (<MODE>mode, operands[2]);
             /* Test the vector constant rather than the scalar operands[2]:
                the predicate is being applied in <MODE>mode, and it is
                AMOUNT that is passed to the vector shift pattern.  */
1192         if (!aarch64_sve_<lr>shift_operand (amount, <MODE>mode))
1193           amount = force_reg (<MODE>mode, amount);
1194       }
1195     else
1196       {
1197         amount = gen_reg_rtx (<MODE>mode);
1198         emit_insn (gen_vec_duplicate<mode> (amount,
1199                                             convert_to_mode (<VEL>mode,
1200                                                              operands[2], 0)));
1201       }
1202     emit_insn (gen_v<optab><mode>3 (operands[0], operands[1], amount));
1203     DONE;
1204   }
1205 )
1206
1207 ;; Test all bits of operand 1.  Operand 0 is a GP that is known to hold PTRUE.
1208 ;;
1209 ;; Using UNSPEC_PTEST_PTRUE allows combine patterns to assume that the GP
1210 ;; is a PTRUE even if the optimizers haven't yet been able to propagate
1211 ;; the constant.  We would use a separate unspec code for PTESTs involving
1212 ;; GPs that might not be PTRUEs.
     ;;
     ;; The only result is the CC register; no predicate register is written.
1213 (define_insn "ptest_ptrue<mode>"
1214   [(set (reg:CC CC_REGNUM)
1215         (compare:CC
1216           (unspec:SI [(match_operand:PRED_ALL 0 "register_operand" "Upa")
1217                       (match_operand:PRED_ALL 1 "register_operand" "Upa")]
1218                      UNSPEC_PTEST_PTRUE)
1219           (const_int 0)))]
1220   "TARGET_SVE"
1221   "ptest\t%0, %1.b"
1222 )
1223
1224 ;; Set element I of the result if operand1 + J < operand2 for all J in [0, I],
1225 ;; with the comparison being unsigned.
     ;; Operands 1 and 2 are scalars in a GPI mode (register or zero).  The
     ;; pattern clobbers the CC register; its value is not described here.
1226 (define_insn "while_ult<GPI:mode><PRED_ALL:mode>"
1227   [(set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1228         (unspec:PRED_ALL [(match_operand:GPI 1 "aarch64_reg_or_zero" "rZ")
1229                           (match_operand:GPI 2 "aarch64_reg_or_zero" "rZ")]
1230                          UNSPEC_WHILE_LO))
1231    (clobber (reg:CC CC_REGNUM))]
1232   "TARGET_SVE"
1233   "whilelo\t%0.<PRED_ALL:Vetype>, %<w>1, %<w>2"
1234 )
1235
1236 ;; WHILELO sets the flags in the same way as a PTEST with a PTRUE GP.
1237 ;; Handle the case in which both results are useful.  The GP operand
1238 ;; to the PTEST isn't needed, so we allow it to be anything.
     ;;
     ;; Operand 0 is the predicate result, operand 1 the unused GP of the
     ;; PTEST, and operands 2 and 3 the scalar inputs.  The split replaces a
     ;; non-constant operand 1 with the constant CONSTM1_RTX of the predicate
     ;; mode; the result is then constant and is not split again.  The mode
     ;; is written as <PRED_ALL:MODE> because this pattern uses two mode
     ;; iterators (GPI and PRED_ALL), which makes a bare <MODE> ambiguous.
1239 (define_insn_and_split "while_ult<GPI:mode><PRED_ALL:mode>_cc"
1240   [(set (reg:CC CC_REGNUM)
1241         (compare:CC
1242           (unspec:SI [(match_operand:PRED_ALL 1)
1243                       (unspec:PRED_ALL
1244                         [(match_operand:GPI 2 "aarch64_reg_or_zero" "rZ")
1245                          (match_operand:GPI 3 "aarch64_reg_or_zero" "rZ")]
1246                         UNSPEC_WHILE_LO)]
1247                      UNSPEC_PTEST_PTRUE)
1248           (const_int 0)))
1249    (set (match_operand:PRED_ALL 0 "register_operand" "=Upa")
1250         (unspec:PRED_ALL [(match_dup 2)
1251                           (match_dup 3)]
1252                          UNSPEC_WHILE_LO))]
1253   "TARGET_SVE"
1254   "whilelo\t%0.<PRED_ALL:Vetype>, %<w>2, %<w>3"
1255   ;; Force the compiler to drop the unused predicate operand, so that we
1256   ;; don't have an unnecessary PTRUE.
1257   "&& !CONSTANT_P (operands[1])"
1258   [(const_int 0)]
1259   {
1260     emit_insn (gen_while_ult<GPI:mode><PRED_ALL:mode>_cc
1261                (operands[0], CONSTM1_RTX (<PRED_ALL:MODE>mode),
1262                 operands[2], operands[3]));
1263     DONE;
1264   }
1265 )
1266
1267 ;; Predicated integer comparison.
     ;; One instance per SVE_COND_INT_CMP unspec.  Operand 1 is the governing
     ;; predicate (zeroing), operand 2 a register and operand 3 either an
     ;; immediate accepted by the <imm_con> constraint or a register.  The
     ;; CC register is clobbered.
1268 (define_insn "*vec_cmp<cmp_op>_<mode>"
1269   [(set (match_operand:<VPRED> 0 "register_operand" "=Upa, Upa")
1270         (unspec:<VPRED>
1271           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1272            (match_operand:SVE_I 2 "register_operand" "w, w")
1273            (match_operand:SVE_I 3 "aarch64_sve_cmp_<imm_con>_operand" "<imm_con>, w")]
1274           SVE_COND_INT_CMP))
1275    (clobber (reg:CC CC_REGNUM))]
1276   "TARGET_SVE"
1277   "@
1278    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, #%3
1279    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
1280 )
1281
1282 ;; Predicated integer comparison in which only the flags result is interesting.
     ;; Matches a PTEST (UNSPEC_PTEST_PTRUE) of a comparison result in which
     ;; the PTEST and the comparison use the same predicate (operand 1).
     ;; The predicate result is written to a scratch register (operand 0).
1283 (define_insn "*vec_cmp<cmp_op>_<mode>_ptest"
1284   [(set (reg:CC CC_REGNUM)
1285         (compare:CC
1286           (unspec:SI
1287             [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1288              (unspec:<VPRED>
1289                [(match_dup 1)
1290                 (match_operand:SVE_I 2 "register_operand" "w, w")
1291                 (match_operand:SVE_I 3 "aarch64_sve_cmp_<imm_con>_operand" "<imm_con>, w")]
1292                SVE_COND_INT_CMP)]
1293             UNSPEC_PTEST_PTRUE)
1294           (const_int 0)))
1295    (clobber (match_scratch:<VPRED> 0 "=Upa, Upa"))]
1296   "TARGET_SVE"
1297   "@
1298    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, #%3
1299    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
1300 )
1301
1302 ;; Predicated comparison in which both the flag and predicate results
1303 ;; are interesting.
     ;; The first set describes the flags as a PTEST of the comparison
     ;; result; the second set stores the same comparison in operand 0.
     ;; The output templates are identical to the flag-less pattern.
1304 (define_insn "*vec_cmp<cmp_op>_<mode>_cc"
1305   [(set (reg:CC CC_REGNUM)
1306         (compare:CC
1307           (unspec:SI
1308             [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1309              (unspec:<VPRED>
1310                [(match_dup 1)
1311                 (match_operand:SVE_I 2 "register_operand" "w, w")
1312                 (match_operand:SVE_I 3 "aarch64_sve_cmp_<imm_con>_operand" "<imm_con>, w")]
1313                SVE_COND_INT_CMP)]
1314             UNSPEC_PTEST_PTRUE)
1315           (const_int 0)))
1316    (set (match_operand:<VPRED> 0 "register_operand" "=Upa, Upa")
1317         (unspec:<VPRED>
1318           [(match_dup 1)
1319            (match_dup 2)
1320            (match_dup 3)]
1321           SVE_COND_INT_CMP))]
1322   "TARGET_SVE"
1323   "@
1324    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, #%3
1325    cmp<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
1326 )
1327
1328 ;; Predicated floating-point comparison (excluding FCMUO, which doesn't
1329 ;; allow #0.0 as an operand).
     ;; One instance per SVE_COND_FP_CMP unspec.  Alternative 1 compares
     ;; operand 2 against a literal #0.0 (operand 3 is not printed);
     ;; alternative 2 compares two registers.  Unlike the integer
     ;; comparisons, this pattern has no CC clobber.
1330 (define_insn "*vec_fcm<cmp_op><mode>"
1331   [(set (match_operand:<VPRED> 0 "register_operand" "=Upa, Upa")
1332         (unspec:<VPRED>
1333           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1334            (match_operand:SVE_F 2 "register_operand" "w, w")
1335            (match_operand:SVE_F 3 "aarch64_simd_reg_or_zero" "Dz, w")]
1336           SVE_COND_FP_CMP))]
1337   "TARGET_SVE"
1338   "@
1339    fcm<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, #0.0
1340    fcm<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
1341 )
1342
1343 ;; Predicated FCMUO.
     ;; Register operands only (UNSPEC_COND_UO); operand 1 is the governing
     ;; predicate (zeroing).
1344 (define_insn "*vec_fcmuo<mode>"
1345   [(set (match_operand:<VPRED> 0 "register_operand" "=Upa")
1346         (unspec:<VPRED>
1347           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1348            (match_operand:SVE_F 2 "register_operand" "w")
1349            (match_operand:SVE_F 3 "register_operand" "w")]
1350           UNSPEC_COND_UO))]
1351   "TARGET_SVE"
1352   "fcmuo\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
1353 )
1354
1355 ;; vcond_mask operand order: true, false, mask
1356 ;; UNSPEC_SEL operand order: mask, true, false (as for VEC_COND_EXPR)
1357 ;; SEL operand order:        mask, true, false
     ;;
     ;; Operand numbers follow the vcond_mask order (1 = true value,
     ;; 2 = false value, 3 = mask), so the UNSPEC_SEL vector and the output
     ;; template both list operand 3 first.
1358 (define_insn "vcond_mask_<mode><vpred>"
1359   [(set (match_operand:SVE_ALL 0 "register_operand" "=w")
1360         (unspec:SVE_ALL
1361           [(match_operand:<VPRED> 3 "register_operand" "Upa")
1362            (match_operand:SVE_ALL 1 "register_operand" "w")
1363            (match_operand:SVE_ALL 2 "register_operand" "w")]
1364           UNSPEC_SEL))]
1365   "TARGET_SVE"
1366   "sel\t%0.<Vetype>, %3, %1.<Vetype>, %2.<Vetype>"
1367 )
1368
1369 ;; Selects between a duplicated immediate and zero.
     ;; Operand 1 is the predicate, operand 2 the duplicated immediate and
     ;; operand 3 the zero vector.  Operand 3 is not printed: the zeroing
     ;; form of MOV (%1/z) supplies the zero for unselected elements.
1370 (define_insn "aarch64_sve_dup<mode>_const"
1371   [(set (match_operand:SVE_I 0 "register_operand" "=w")
1372         (unspec:SVE_I
1373           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1374            (match_operand:SVE_I 2 "aarch64_sve_dup_immediate")
1375            (match_operand:SVE_I 3 "aarch64_simd_imm_zero")]
1376           UNSPEC_SEL))]
1377   "TARGET_SVE"
1378   "mov\t%0.<Vetype>, %1/z, #%2"
1379 )
1380
1381 ;; Integer (signed) vcond.  Don't enforce an immediate range here, since it
1382 ;; depends on the comparison; leave it to aarch64_expand_sve_vcond instead.
     ;; Operand 0 is the result, operands 1 and 2 the values selected from,
     ;; operand 3 the comparison operator and operands 4 and 5 the values
     ;; compared (in the integer-equivalent mode).  The RTL template is
     ;; never emitted: aarch64_expand_sve_vcond generates the code and the
     ;; expander finishes with DONE.
1383 (define_expand "vcond<mode><v_int_equiv>"
1384   [(set (match_operand:SVE_ALL 0 "register_operand")
1385         (if_then_else:SVE_ALL
1386           (match_operator 3 "comparison_operator"
1387             [(match_operand:<V_INT_EQUIV> 4 "register_operand")
1388              (match_operand:<V_INT_EQUIV> 5 "nonmemory_operand")])
1389           (match_operand:SVE_ALL 1 "register_operand")
1390           (match_operand:SVE_ALL 2 "register_operand")))]
1391   "TARGET_SVE"
1392   {
1393     aarch64_expand_sve_vcond (<MODE>mode, <V_INT_EQUIV>mode, operands);
1394     DONE;
1395   }
1396 )
1397
1398 ;; Integer vcondu.  Don't enforce an immediate range here, since it
1399 ;; depends on the comparison; leave it to aarch64_expand_sve_vcond instead.
     ;; Same operand layout and expansion as the signed vcond pattern; the
     ;; two differ only in the pattern name.
1400 (define_expand "vcondu<mode><v_int_equiv>"
1401   [(set (match_operand:SVE_ALL 0 "register_operand")
1402         (if_then_else:SVE_ALL
1403           (match_operator 3 "comparison_operator"
1404             [(match_operand:<V_INT_EQUIV> 4 "register_operand")
1405              (match_operand:<V_INT_EQUIV> 5 "nonmemory_operand")])
1406           (match_operand:SVE_ALL 1 "register_operand")
1407           (match_operand:SVE_ALL 2 "register_operand")))]
1408   "TARGET_SVE"
1409   {
1410     aarch64_expand_sve_vcond (<MODE>mode, <V_INT_EQUIV>mode, operands);
1411     DONE;
1412   }
1413 )
1414
1415 ;; Floating-point vcond.  All comparisons except FCMUO allow a zero
1416 ;; operand; aarch64_expand_sve_vcond handles the case of an FCMUO
1417 ;; with zero.
     ;; The result and the selected values use an SVE_SD mode, while the
     ;; compared values (operands 4 and 5) use the floating-point equivalent
     ;; mode <V_FP_EQUIV>.  Operand 5 may be a register or zero.
1418 (define_expand "vcond<mode><v_fp_equiv>"
1419   [(set (match_operand:SVE_SD 0 "register_operand")
1420         (if_then_else:SVE_SD
1421           (match_operator 3 "comparison_operator"
1422             [(match_operand:<V_FP_EQUIV> 4 "register_operand")
1423              (match_operand:<V_FP_EQUIV> 5 "aarch64_simd_reg_or_zero")])
1424           (match_operand:SVE_SD 1 "register_operand")
1425           (match_operand:SVE_SD 2 "register_operand")))]
1426   "TARGET_SVE"
1427   {
1428     aarch64_expand_sve_vcond (<MODE>mode, <V_FP_EQUIV>mode, operands);
1429     DONE;
1430   }
1431 )
1432
1433 ;; Signed integer comparisons.  Don't enforce an immediate range here, since
1434 ;; it depends on the comparison; leave it to aarch64_expand_sve_vec_cmp_int
1435 ;; instead.
     ;; Operand 0 is the predicate result, operand 1 the comparison operator
     ;; and operands 2 and 3 the values compared.  Only the rtx code of
     ;; operand 1 is passed to aarch64_expand_sve_vec_cmp_int, which
     ;; generates all of the code.
1436 (define_expand "vec_cmp<mode><vpred>"
1437   [(parallel
1438     [(set (match_operand:<VPRED> 0 "register_operand")
1439           (match_operator:<VPRED> 1 "comparison_operator"
1440             [(match_operand:SVE_I 2 "register_operand")
1441              (match_operand:SVE_I 3 "nonmemory_operand")]))
1442      (clobber (reg:CC CC_REGNUM))])]
1443   "TARGET_SVE"
1444   {
1445     aarch64_expand_sve_vec_cmp_int (operands[0], GET_CODE (operands[1]),
1446                                     operands[2], operands[3]);
1447     DONE;
1448   }
1449 )
1450
1451 ;; Unsigned integer comparisons.  Don't enforce an immediate range here, since
1452 ;; it depends on the comparison; leave it to aarch64_expand_sve_vec_cmp_int
1453 ;; instead.
     ;; Same operand layout and expansion as the signed vec_cmp pattern; the
     ;; two differ only in the pattern name.
1454 (define_expand "vec_cmpu<mode><vpred>"
1455   [(parallel
1456     [(set (match_operand:<VPRED> 0 "register_operand")
1457           (match_operator:<VPRED> 1 "comparison_operator"
1458             [(match_operand:SVE_I 2 "register_operand")
1459              (match_operand:SVE_I 3 "nonmemory_operand")]))
1460      (clobber (reg:CC CC_REGNUM))])]
1461   "TARGET_SVE"
1462   {
1463     aarch64_expand_sve_vec_cmp_int (operands[0], GET_CODE (operands[1]),
1464                                     operands[2], operands[3]);
1465     DONE;
1466   }
1467 )
1468
1469 ;; Floating-point comparisons.  All comparisons except FCMUO allow a zero
1470 ;; operand; aarch64_expand_sve_vec_cmp_float handles the case of an FCMUO
1471 ;; with zero.
     ;; Unlike the integer expanders there is no CC clobber in the template.
     ;; The final "false" argument to aarch64_expand_sve_vec_cmp_float is
     ;; defined outside this file -- NOTE(review): check its meaning against
     ;; the function's declaration.
1472 (define_expand "vec_cmp<mode><vpred>"
1473   [(set (match_operand:<VPRED> 0 "register_operand")
1474         (match_operator:<VPRED> 1 "comparison_operator"
1475           [(match_operand:SVE_F 2 "register_operand")
1476            (match_operand:SVE_F 3 "aarch64_simd_reg_or_zero")]))]
1477   "TARGET_SVE"
1478   {
1479     aarch64_expand_sve_vec_cmp_float (operands[0], GET_CODE (operands[1]),
1480                                       operands[2], operands[3], false);
1481     DONE;
1482   }
1483 )
1484
1485 ;; Branch based on predicate equality or inequality.
     ;; Operand 0 is the equality operator, operands 1 and 2 the predicates
     ;; compared (operand 2 may be zero) and operand 3 the branch target.
     ;; The preparation code emits a PTEST of either operand 1 itself (when
     ;; comparing against zero) or the XOR of operands 1 and 2, then rewrites
     ;; operands 1 and 2 so that the branch template tests the CC register
     ;; against zero.  There is no DONE, so the template is emitted.
     ;; NOTE(review): the insn condition is empty rather than "TARGET_SVE";
     ;; presumably the PRED_ALL modes can only be used when SVE is enabled --
     ;; confirm.
1486 (define_expand "cbranch<mode>4"
1487   [(set (pc)
1488         (if_then_else
1489           (match_operator 0 "aarch64_equality_operator"
1490             [(match_operand:PRED_ALL 1 "register_operand")
1491              (match_operand:PRED_ALL 2 "aarch64_simd_reg_or_zero")])
1492           (label_ref (match_operand 3 ""))
1493           (pc)))]
1494   ""
1495   {
1496     rtx ptrue = force_reg (<MODE>mode, CONSTM1_RTX (<MODE>mode));
1497     rtx pred;
1498     if (operands[2] == CONST0_RTX (<MODE>mode))
1499       pred = operands[1];
1500     else
1501       {
1502         pred = gen_reg_rtx (<MODE>mode);
1503         emit_insn (gen_pred_xor<mode>3 (pred, ptrue, operands[1],
1504                                         operands[2]));
1505       }
1506     emit_insn (gen_ptest_ptrue<mode> (ptrue, pred));
1507     operands[1] = gen_rtx_REG (CCmode, CC_REGNUM);
1508     operands[2] = const0_rtx;
1509   }
1510 )
1511
1512 ;; Unpredicated integer MIN/MAX.
     ;; One expander per MAXMIN code.  The operation is wrapped in
     ;; UNSPEC_MERGE_PTRUE, with operand 3 created here as CONSTM1_RTX of the
     ;; predicate mode, forced into a register.
1513 (define_expand "<su><maxmin><mode>3"
1514   [(set (match_operand:SVE_I 0 "register_operand")
1515         (unspec:SVE_I
1516           [(match_dup 3)
1517            (MAXMIN:SVE_I (match_operand:SVE_I 1 "register_operand")
1518                          (match_operand:SVE_I 2 "register_operand"))]
1519           UNSPEC_MERGE_PTRUE))]
1520   "TARGET_SVE"
1521   {
1522     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1523   }
1524 )
1525
1526 ;; Integer MIN/MAX predicated with a PTRUE.
     ;; Operand 1 is the governing predicate ("Upl").  Operand 2 is tied to
     ;; the destination ("%0"; the "%" allows operands 2 and 3 to be swapped),
     ;; which is why the output template prints %0 as the first source.
1527 (define_insn "*<su><maxmin><mode>3"
1528   [(set (match_operand:SVE_I 0 "register_operand" "=w")
1529         (unspec:SVE_I
1530           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1531            (MAXMIN:SVE_I (match_operand:SVE_I 2 "register_operand" "%0")
1532                          (match_operand:SVE_I 3 "register_operand" "w"))]
1533           UNSPEC_MERGE_PTRUE))]
1534   "TARGET_SVE"
1535   "<su><maxmin>\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
1536 )
1537
1538 ;; Unpredicated floating-point MIN/MAX.
     ;; Same shape as the integer expander but over SVE_F modes and the
     ;; FMAXMIN codes: operand 3 is an all-ones <VPRED> constant forced into
     ;; a register and supplied to UNSPEC_MERGE_PTRUE.
1539 (define_expand "<su><maxmin><mode>3"
1540   [(set (match_operand:SVE_F 0 "register_operand")
1541         (unspec:SVE_F
1542           [(match_dup 3)
1543            (FMAXMIN:SVE_F (match_operand:SVE_F 1 "register_operand")
1544                           (match_operand:SVE_F 2 "register_operand"))]
1545           UNSPEC_MERGE_PTRUE))]
1546   "TARGET_SVE"
1547   {
1548     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1549   }
1550 )
1551
1552 ;; Floating-point MIN/MAX predicated with a PTRUE.
     ;; Emits the "f<maxmin>nm" mnemonic.  Operand 2 is tied to the
     ;; destination and is commutative with operand 3 ("%0"), so the template
     ;; prints %0 for both the destination and the first source.
1553 (define_insn "*<su><maxmin><mode>3"
1554   [(set (match_operand:SVE_F 0 "register_operand" "=w")
1555         (unspec:SVE_F
1556           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1557            (FMAXMIN:SVE_F (match_operand:SVE_F 2 "register_operand" "%0")
1558                           (match_operand:SVE_F 3 "register_operand" "w"))]
1559           UNSPEC_MERGE_PTRUE))]
1560   "TARGET_SVE"
1561   "f<maxmin>nm\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
1562 )
1563
1564 ;; Unpredicated fmin/fmax.
     ;; Unlike the FMAXMIN patterns, the operation here is an inner unspec
     ;; taken from the FMAXMIN_UNS iterator.  Operand 3 is an all-ones <VPRED>
     ;; constant forced into a register by the preparation statement.
1565 (define_expand "<maxmin_uns><mode>3"
1566   [(set (match_operand:SVE_F 0 "register_operand")
1567         (unspec:SVE_F
1568           [(match_dup 3)
1569            (unspec:SVE_F [(match_operand:SVE_F 1 "register_operand")
1570                           (match_operand:SVE_F 2 "register_operand")]
1571                          FMAXMIN_UNS)]
1572           UNSPEC_MERGE_PTRUE))]
1573   "TARGET_SVE"
1574   {
1575     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1576   }
1577 )
1578
1579 ;; fmin/fmax predicated with a PTRUE.
     ;; The mnemonic comes from <maxmin_uns_op>.  Operand 2 is tied to the
     ;; destination ("%0", commutative with operand 3); operand 1 is the
     ;; governing predicate.
1580 (define_insn "*<maxmin_uns><mode>3"
1581   [(set (match_operand:SVE_F 0 "register_operand" "=w")
1582         (unspec:SVE_F
1583           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1584            (unspec:SVE_F [(match_operand:SVE_F 2 "register_operand" "%0")
1585                           (match_operand:SVE_F 3 "register_operand" "w")]
1586                          FMAXMIN_UNS)]
1587           UNSPEC_MERGE_PTRUE))]
1588   "TARGET_SVE"
1589   "<maxmin_uns_op>\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
1590 )
1591
1592 ;; Predicated integer operations.
     ;; Operand 1 is a caller-supplied predicate, printed with "/m" in the
     ;; output template.  Operand 2 must be in the destination register
     ;; (constraint "0"); operand 3 is the other input.  The operation itself
     ;; is selected by the SVE_COND_INT_OP unspec iterator.
1593 (define_insn "cond_<optab><mode>"
1594   [(set (match_operand:SVE_I 0 "register_operand" "=w")
1595         (unspec:SVE_I
1596           [(match_operand:<VPRED> 1 "register_operand" "Upl")
1597            (match_operand:SVE_I 2 "register_operand" "0")
1598            (match_operand:SVE_I 3 "register_operand" "w")]
1599           SVE_COND_INT_OP))]
1600   "TARGET_SVE"
1601   "<sve_int_op>\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
1602 )
1603
1604 ;; Set operand 0 to the last active element in operand 3, or to tied
1605 ;; operand 1 if no elements are active.
     ;; Operand 2 is the predicate that defines which elements are active.
     ;; There are two alternatives: the scalar lives in a general register
     ;; ("r", printed with the <vwcore> prefix) or in an FP/SIMD register
     ;; ("w", printed with the <vw> prefix).  Both emit CLASTB.
1606 (define_insn "fold_extract_last_<mode>"
1607   [(set (match_operand:<VEL> 0 "register_operand" "=r, w")
1608         (unspec:<VEL>
1609           [(match_operand:<VEL> 1 "register_operand" "0, 0")
1610            (match_operand:<VPRED> 2 "register_operand" "Upl, Upl")
1611            (match_operand:SVE_ALL 3 "register_operand" "w, w")]
1612           UNSPEC_CLASTB))]
1613   "TARGET_SVE"
1614   "@
1615    clastb\t%<vwcore>0, %2, %<vwcore>0, %3.<Vetype>
1616    clastb\t%<vw>0, %2, %<vw>0, %3.<Vetype>"
1617 )
1618
1619 ;; Unpredicated integer add reduction.
     ;; Reduces the SVE_I vector in operand 1 to a scalar of mode <VEL>.
     ;; Operand 2 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement and passed to UNSPEC_ADDV.
1620 (define_expand "reduc_plus_scal_<mode>"
1621   [(set (match_operand:<VEL> 0 "register_operand")
1622         (unspec:<VEL> [(match_dup 2)
1623                        (match_operand:SVE_I 1 "register_operand")]
1624                       UNSPEC_ADDV))]
1625   "TARGET_SVE"
1626   {
1627     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1628   }
1629 )
1630
1631 ;; Predicated integer add reduction.  The result is always 64 bits wide,
     ;; so the destination is printed with the "%d0" modifier whatever the
     ;; element size of the input vector (operand 2).  Operand 1 is the
     ;; governing predicate.
1632 (define_insn "*reduc_plus_scal_<mode>"
1633   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1634         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1635                        (match_operand:SVE_I 2 "register_operand" "w")]
1636                       UNSPEC_ADDV))]
1637   "TARGET_SVE"
1638   "uaddv\t%d0, %1, %2.<Vetype>"
1639 )
1640
1641 ;; Unpredicated floating-point add reduction.
     ;; Reduces the SVE_F vector in operand 1 to a <VEL> scalar through
     ;; UNSPEC_FADDV.  Operand 2 is an all-ones <VPRED> constant forced into
     ;; a register by the preparation statement.
1642 (define_expand "reduc_plus_scal_<mode>"
1643   [(set (match_operand:<VEL> 0 "register_operand")
1644         (unspec:<VEL> [(match_dup 2)
1645                        (match_operand:SVE_F 1 "register_operand")]
1646                       UNSPEC_FADDV))]
1647   "TARGET_SVE"
1648   {
1649     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1650   }
1651 )
1652
1653 ;; Predicated floating-point add reduction.
     ;; Emits FADDV.  The scalar destination is printed with the element-size
     ;; prefix (%<Vetype>0); operand 1 is the governing predicate and
     ;; operand 2 the vector being reduced.
1654 (define_insn "*reduc_plus_scal_<mode>"
1655   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1656         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1657                        (match_operand:SVE_F 2 "register_operand" "w")]
1658                       UNSPEC_FADDV))]
1659   "TARGET_SVE"
1660   "faddv\t%<Vetype>0, %1, %2.<Vetype>"
1661 )
1662
1663 ;; Unpredicated integer MIN/MAX reduction.
     ;; One expander per member of the MAXMINV unspec iterator.  Operand 2 is
     ;; an all-ones <VPRED> constant forced into a register by the
     ;; preparation statement.
1664 (define_expand "reduc_<maxmin_uns>_scal_<mode>"
1665   [(set (match_operand:<VEL> 0 "register_operand")
1666         (unspec:<VEL> [(match_dup 2)
1667                        (match_operand:SVE_I 1 "register_operand")]
1668                       MAXMINV))]
1669   "TARGET_SVE"
1670   {
1671     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1672   }
1673 )
1674
1675 ;; Predicated integer MIN/MAX reduction.
     ;; The mnemonic is <maxmin_uns_op> with a "v" suffix.  Operand 1 is the
     ;; governing predicate, operand 2 the vector being reduced, and the
     ;; scalar result is written to an FP/SIMD register ("=w").
1676 (define_insn "*reduc_<maxmin_uns>_scal_<mode>"
1677   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1678         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1679                        (match_operand:SVE_I 2 "register_operand" "w")]
1680                       MAXMINV))]
1681   "TARGET_SVE"
1682   "<maxmin_uns_op>v\t%<Vetype>0, %1, %2.<Vetype>"
1683 )
1684
1685 ;; Unpredicated floating-point MIN/MAX reduction.
     ;; One expander per member of the FMAXMINV unspec iterator.  Operand 2
     ;; is an all-ones <VPRED> constant forced into a register by the
     ;; preparation statement.
1686 (define_expand "reduc_<maxmin_uns>_scal_<mode>"
1687   [(set (match_operand:<VEL> 0 "register_operand")
1688         (unspec:<VEL> [(match_dup 2)
1689                        (match_operand:SVE_F 1 "register_operand")]
1690                       FMAXMINV))]
1691   "TARGET_SVE"
1692   {
1693     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1694   }
1695 )
1696
1697 ;; Predicated floating-point MIN/MAX reduction.
     ;; Same shape as the integer form but over SVE_F vectors and the
     ;; FMAXMINV iterator; the mnemonic is <maxmin_uns_op> with a "v" suffix.
1698 (define_insn "*reduc_<maxmin_uns>_scal_<mode>"
1699   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1700         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1701                        (match_operand:SVE_F 2 "register_operand" "w")]
1702                       FMAXMINV))]
1703   "TARGET_SVE"
1704   "<maxmin_uns_op>v\t%<Vetype>0, %1, %2.<Vetype>"
1705 )
1706
     ;; Unpredicated integer reduction over the BITWISEV unspec iterator
     ;; (presumably the bitwise AND/OR/XOR reductions -- confirm against the
     ;; iterator definition).  Operand 2 is an all-ones <VPRED> constant
     ;; forced into a register by the preparation statement.
1707 (define_expand "reduc_<optab>_scal_<mode>"
1708   [(set (match_operand:<VEL> 0 "register_operand")
1709         (unspec:<VEL> [(match_dup 2)
1710                        (match_operand:SVE_I 1 "register_operand")]
1711                       BITWISEV))]
1712   "TARGET_SVE"
1713   {
1714     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1715   }
1716 )
1717
     ;; Predicated form of the BITWISEV integer reduction.  The mnemonic
     ;; comes from <bit_reduc_op>; operand 1 is the governing predicate and
     ;; operand 2 the vector being reduced to a <VEL> scalar.
1718 (define_insn "*reduc_<optab>_scal_<mode>"
1719   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1720         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1721                        (match_operand:SVE_I 2 "register_operand" "w")]
1722                       BITWISEV))]
1723   "TARGET_SVE"
1724   "<bit_reduc_op>\t%<Vetype>0, %1, %2.<Vetype>"
1725 )
1726
1727 ;; Unpredicated in-order FP reductions.
     ;; Operand 1 is the scalar <VEL> starting value and operand 2 the SVE_F
     ;; vector to fold into it.  Operand 3 is an all-ones <VPRED> constant
     ;; forced into a register and placed first in the UNSPEC_FADDA vector.
1728 (define_expand "fold_left_plus_<mode>"
1729   [(set (match_operand:<VEL> 0 "register_operand")
1730         (unspec:<VEL> [(match_dup 3)
1731                        (match_operand:<VEL> 1 "register_operand")
1732                        (match_operand:SVE_F 2 "register_operand")]
1733                       UNSPEC_FADDA))]
1734   "TARGET_SVE"
1735   {
1736     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1737   }
1738 )
1739
1740 ;; In-order FP reductions predicated with PTRUE.
     ;; The scalar accumulator (operand 2) is tied to the destination ("0"),
     ;; so FADDA reads and writes %0.  Operand 1 is the predicate and
     ;; operand 3 the vector being accumulated.
1741 (define_insn "*fold_left_plus_<mode>"
1742   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1743         (unspec:<VEL> [(match_operand:<VPRED> 1 "register_operand" "Upl")
1744                        (match_operand:<VEL> 2 "register_operand" "0")
1745                        (match_operand:SVE_F 3 "register_operand" "w")]
1746                       UNSPEC_FADDA))]
1747   "TARGET_SVE"
1748   "fadda\t%<Vetype>0, %1, %<Vetype>0, %3.<Vetype>"
1749 )
1750
1751 ;; Predicated form of the above in-order reduction.
     ;; Matches an UNSPEC_FADDA whose vector input is an UNSPEC_SEL between
     ;; operand 3 and a zero vector (operand 4) under predicate operand 2.
     ;; The select is folded into the FADDA by using operand 2 as its
     ;; governing predicate; operand 4 does not appear in the output.
1752 (define_insn "*pred_fold_left_plus_<mode>"
1753   [(set (match_operand:<VEL> 0 "register_operand" "=w")
1754         (unspec:<VEL>
1755           [(match_operand:<VEL> 1 "register_operand" "0")
1756            (unspec:SVE_F
1757              [(match_operand:<VPRED> 2 "register_operand" "Upl")
1758               (match_operand:SVE_F 3 "register_operand" "w")
1759               (match_operand:SVE_F 4 "aarch64_simd_imm_zero")]
1760              UNSPEC_SEL)]
1761           UNSPEC_FADDA))]
1762   "TARGET_SVE"
1763   "fadda\t%<Vetype>0, %2, %<Vetype>0, %3.<Vetype>"
1764 )
1765
1766 ;; Unpredicated floating-point addition.
     ;; Operand 2 may be anything accepted by
     ;; aarch64_sve_float_arith_with_sub_operand, not only a register.
     ;; Operand 3 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement.
1767 (define_expand "add<mode>3"
1768   [(set (match_operand:SVE_F 0 "register_operand")
1769         (unspec:SVE_F
1770           [(match_dup 3)
1771            (plus:SVE_F
1772              (match_operand:SVE_F 1 "register_operand")
1773              (match_operand:SVE_F 2 "aarch64_sve_float_arith_with_sub_operand"))]
1774           UNSPEC_MERGE_PTRUE))]
1775   "TARGET_SVE"
1776   {
1777     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1778   }
1779 )
1780
1781 ;; Floating-point addition predicated with a PTRUE.
     ;; Three alternatives, in template order:
     ;;   1. operand 3 matches "vsA": predicated FADD with immediate #%3,
     ;;      operand 2 tied to the destination;
     ;;   2. operand 3 matches "vsN": predicated FSUB with immediate #%N3,
     ;;      operand 2 tied to the destination;
     ;;   3. both inputs in registers: three-operand FADD that does not
     ;;      mention the predicate.
1782 (define_insn "*add<mode>3"
1783   [(set (match_operand:SVE_F 0 "register_operand" "=w, w, w")
1784         (unspec:SVE_F
1785           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl, Upl")
1786            (plus:SVE_F
1787               (match_operand:SVE_F 2 "register_operand" "%0, 0, w")
1788               (match_operand:SVE_F 3 "aarch64_sve_float_arith_with_sub_operand" "vsA, vsN, w"))]
1789           UNSPEC_MERGE_PTRUE))]
1790   "TARGET_SVE"
1791   "@
1792    fadd\t%0.<Vetype>, %1/m, %0.<Vetype>, #%3
1793    fsub\t%0.<Vetype>, %1/m, %0.<Vetype>, #%N3
1794    fadd\t%0.<Vetype>, %2.<Vetype>, %3.<Vetype>"
1795 )
1796
1797 ;; Unpredicated floating-point subtraction.
     ;; Here it is the minuend (operand 1) that may be a non-register
     ;; aarch64_sve_float_arith_operand; the subtrahend must be a register.
     ;; Operand 3 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement.
1798 (define_expand "sub<mode>3"
1799   [(set (match_operand:SVE_F 0 "register_operand")
1800         (unspec:SVE_F
1801           [(match_dup 3)
1802            (minus:SVE_F
1803              (match_operand:SVE_F 1 "aarch64_sve_float_arith_operand")
1804              (match_operand:SVE_F 2 "register_operand"))]
1805           UNSPEC_MERGE_PTRUE))]
1806   "TARGET_SVE"
1807   {
1808     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1809   }
1810 )
1811
1812 ;; Floating-point subtraction predicated with a PTRUE.
     ;; The insn condition requires at least one of operands 2 and 3 to be a
     ;; register.  Four alternatives, in template order:
     ;;   1. subtrahend matches "vsA": FSUB with immediate #%3;
     ;;   2. subtrahend matches "vsN": FADD with immediate #%N3;
     ;;   3. minuend matches "vsA", subtrahend tied to the destination:
     ;;      FSUBR with immediate #%2;
     ;;   4. both in registers: three-operand FSUB that does not mention
     ;;      the predicate.
1813 (define_insn "*sub<mode>3"
1814   [(set (match_operand:SVE_F 0 "register_operand" "=w, w, w, w")
1815         (unspec:SVE_F
1816           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl, Upl, Upl")
1817            (minus:SVE_F
1818              (match_operand:SVE_F 2 "aarch64_sve_float_arith_operand" "0, 0, vsA, w")
1819              (match_operand:SVE_F 3 "aarch64_sve_float_arith_with_sub_operand" "vsA, vsN, 0, w"))]
1820           UNSPEC_MERGE_PTRUE))]
1821   "TARGET_SVE
1822    && (register_operand (operands[2], <MODE>mode)
1823        || register_operand (operands[3], <MODE>mode))"
1824   "@
1825    fsub\t%0.<Vetype>, %1/m, %0.<Vetype>, #%3
1826    fadd\t%0.<Vetype>, %1/m, %0.<Vetype>, #%N3
1827    fsubr\t%0.<Vetype>, %1/m, %0.<Vetype>, #%2
1828    fsub\t%0.<Vetype>, %2.<Vetype>, %3.<Vetype>"
1829 )
1830
1831 ;; Unpredicated floating-point multiplication.
     ;; Operand 2 may be anything accepted by aarch64_sve_float_mul_operand.
     ;; Operand 3 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement.
1832 (define_expand "mul<mode>3"
1833   [(set (match_operand:SVE_F 0 "register_operand")
1834         (unspec:SVE_F
1835           [(match_dup 3)
1836            (mult:SVE_F
1837              (match_operand:SVE_F 1 "register_operand")
1838              (match_operand:SVE_F 2 "aarch64_sve_float_mul_operand"))]
1839           UNSPEC_MERGE_PTRUE))]
1840   "TARGET_SVE"
1841   {
1842     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1843   }
1844 )
1845
1846 ;; Floating-point multiplication predicated with a PTRUE.
     ;; Two alternatives, in template order:
     ;;   1. operand 3 matches "vsM": predicated FMUL with immediate #%3,
     ;;      operand 2 tied to the destination;
     ;;   2. both inputs in registers: three-operand FMUL that does not
     ;;      mention the predicate.
1847 (define_insn "*mul<mode>3"
1848   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
1849         (unspec:SVE_F
1850           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1851            (mult:SVE_F
1852              (match_operand:SVE_F 2 "register_operand" "%0, w")
1853              (match_operand:SVE_F 3 "aarch64_sve_float_mul_operand" "vsM, w"))]
1854           UNSPEC_MERGE_PTRUE))]
1855   "TARGET_SVE"
1856   "@
1857    fmul\t%0.<Vetype>, %1/m, %0.<Vetype>, #%3
1858    fmul\t%0.<Vetype>, %2.<Vetype>, %3.<Vetype>"
1859 )
1860
1861 ;; Unpredicated fma (%0 = (%1 * %2) + %3).
     ;; Operand 4 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement and paired with the fma rtx inside
     ;; UNSPEC_MERGE_PTRUE.
1862 (define_expand "fma<mode>4"
1863   [(set (match_operand:SVE_F 0 "register_operand")
1864         (unspec:SVE_F
1865           [(match_dup 4)
1866            (fma:SVE_F (match_operand:SVE_F 1 "register_operand")
1867                       (match_operand:SVE_F 2 "register_operand")
1868                       (match_operand:SVE_F 3 "register_operand"))]
1869           UNSPEC_MERGE_PTRUE))]
1870   "TARGET_SVE"
1871   {
1872     operands[4] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1873   }
1874 )
1875
1876 ;; fma predicated with a PTRUE.
     ;; Operand numbering differs from the expander: operands 3 and 4 are
     ;; the multiplicands and operand 2 is the addend.  Alternative 1 ties
     ;; multiplicand 3 to the destination and emits FMAD; alternative 2 ties
     ;; the addend to the destination and emits FMLA.
1877 (define_insn "*fma<mode>4"
1878   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
1879         (unspec:SVE_F
1880           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1881            (fma:SVE_F (match_operand:SVE_F 3 "register_operand" "%0, w")
1882                       (match_operand:SVE_F 4 "register_operand" "w, w")
1883                       (match_operand:SVE_F 2 "register_operand" "w, 0"))]
1884           UNSPEC_MERGE_PTRUE))]
1885   "TARGET_SVE"
1886   "@
1887    fmad\t%0.<Vetype>, %1/m, %4.<Vetype>, %2.<Vetype>
1888    fmla\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>"
1889 )
1890
1891 ;; Unpredicated fnma (%0 = (-%1 * %2) + %3).
     ;; The negation is expressed as (neg ...) around the first multiplicand.
     ;; Operand 4 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement.
1892 (define_expand "fnma<mode>4"
1893   [(set (match_operand:SVE_F 0 "register_operand")
1894         (unspec:SVE_F
1895           [(match_dup 4)
1896            (fma:SVE_F (neg:SVE_F
1897                         (match_operand:SVE_F 1 "register_operand"))
1898                       (match_operand:SVE_F 2 "register_operand")
1899                       (match_operand:SVE_F 3 "register_operand"))]
1900           UNSPEC_MERGE_PTRUE))]
1901   "TARGET_SVE"
1902   {
1903     operands[4] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1904   }
1905 )
1906
1907 ;; fnma predicated with a PTRUE.
     ;; Operands 3 (negated) and 4 are the multiplicands; operand 2 is the
     ;; addend.  Alternative 1 ties multiplicand 3 to the destination and
     ;; emits FMSB; alternative 2 ties the addend and emits FMLS.
1908 (define_insn "*fnma<mode>4"
1909   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
1910         (unspec:SVE_F
1911           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1912            (fma:SVE_F (neg:SVE_F
1913                         (match_operand:SVE_F 3 "register_operand" "%0, w"))
1914                       (match_operand:SVE_F 4 "register_operand" "w, w")
1915                       (match_operand:SVE_F 2 "register_operand" "w, 0"))]
1916           UNSPEC_MERGE_PTRUE))]
1917   "TARGET_SVE"
1918   "@
1919    fmsb\t%0.<Vetype>, %1/m, %4.<Vetype>, %2.<Vetype>
1920    fmls\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>"
1921 )
1922
1923 ;; Unpredicated fms (%0 = (%1 * %2) - %3).
     ;; The subtraction is expressed as (neg ...) around the addend of an
     ;; fma rtx.  Operand 4 is an all-ones <VPRED> constant forced into a
     ;; register by the preparation statement.
1924 (define_expand "fms<mode>4"
1925   [(set (match_operand:SVE_F 0 "register_operand")
1926         (unspec:SVE_F
1927           [(match_dup 4)
1928            (fma:SVE_F (match_operand:SVE_F 1 "register_operand")
1929                       (match_operand:SVE_F 2 "register_operand")
1930                       (neg:SVE_F
1931                         (match_operand:SVE_F 3 "register_operand")))]
1932           UNSPEC_MERGE_PTRUE))]
1933   "TARGET_SVE"
1934   {
1935     operands[4] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1936   }
1937 )
1938
1939 ;; fms predicated with a PTRUE.
     ;; Operands 3 and 4 are the multiplicands; operand 2 is the negated
     ;; addend.  Alternative 1 ties multiplicand 3 to the destination and
     ;; emits FNMSB; alternative 2 ties operand 2 and emits FNMLS.
1940 (define_insn "*fms<mode>4"
1941   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
1942         (unspec:SVE_F
1943           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1944            (fma:SVE_F (match_operand:SVE_F 3 "register_operand" "%0, w")
1945                       (match_operand:SVE_F 4 "register_operand" "w, w")
1946                       (neg:SVE_F
1947                         (match_operand:SVE_F 2 "register_operand" "w, 0")))]
1948           UNSPEC_MERGE_PTRUE))]
1949   "TARGET_SVE"
1950   "@
1951    fnmsb\t%0.<Vetype>, %1/m, %4.<Vetype>, %2.<Vetype>
1952    fnmls\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>"
1953 )
1954
1955 ;; Unpredicated fnms (%0 = (-%1 * %2) - %3).
     ;; Both the first multiplicand and the addend are wrapped in (neg ...).
     ;; Operand 4 is an all-ones <VPRED> constant forced into a register by
     ;; the preparation statement.
1956 (define_expand "fnms<mode>4"
1957   [(set (match_operand:SVE_F 0 "register_operand")
1958         (unspec:SVE_F
1959           [(match_dup 4)
1960            (fma:SVE_F (neg:SVE_F
1961                         (match_operand:SVE_F 1 "register_operand"))
1962                       (match_operand:SVE_F 2 "register_operand")
1963                       (neg:SVE_F
1964                         (match_operand:SVE_F 3 "register_operand")))]
1965           UNSPEC_MERGE_PTRUE))]
1966   "TARGET_SVE"
1967   {
1968     operands[4] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
1969   }
1970 )
1971
1972 ;; fnms predicated with a PTRUE.
     ;; Operands 3 (negated) and 4 are the multiplicands; operand 2 is the
     ;; negated addend.  Alternative 1 ties multiplicand 3 to the destination
     ;; and emits FNMAD; alternative 2 ties operand 2 and emits FNMLA.
1973 (define_insn "*fnms<mode>4"
1974   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
1975         (unspec:SVE_F
1976           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
1977            (fma:SVE_F (neg:SVE_F
1978                         (match_operand:SVE_F 3 "register_operand" "%0, w"))
1979                       (match_operand:SVE_F 4 "register_operand" "w, w")
1980                       (neg:SVE_F
1981                         (match_operand:SVE_F 2 "register_operand" "w, 0")))]
1982           UNSPEC_MERGE_PTRUE))]
1983   "TARGET_SVE"
1984   "@
1985    fnmad\t%0.<Vetype>, %1/m, %4.<Vetype>, %2.<Vetype>
1986    fnmla\t%0.<Vetype>, %1/m, %3.<Vetype>, %4.<Vetype>"
1987 )
1988
1989 ;; Unpredicated floating-point division.
     ;; Both inputs must be registers.  Operand 3 is an all-ones <VPRED>
     ;; constant forced into a register by the preparation statement.
1990 (define_expand "div<mode>3"
1991   [(set (match_operand:SVE_F 0 "register_operand")
1992         (unspec:SVE_F
1993           [(match_dup 3)
1994            (div:SVE_F (match_operand:SVE_F 1 "register_operand")
1995                       (match_operand:SVE_F 2 "register_operand"))]
1996           UNSPEC_MERGE_PTRUE))]
1997   "TARGET_SVE"
1998   {
1999     operands[3] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
2000   }
2001 )
2002
2003 ;; Floating-point division predicated with a PTRUE.
     ;; Division is not commutative, so there is one alternative per tied
     ;; input: alternative 1 ties the dividend (operand 2) to the destination
     ;; and emits FDIV; alternative 2 ties the divisor (operand 3) and emits
     ;; FDIVR with the dividend as the second source.
2004 (define_insn "*div<mode>3"
2005   [(set (match_operand:SVE_F 0 "register_operand" "=w, w")
2006         (unspec:SVE_F
2007           [(match_operand:<VPRED> 1 "register_operand" "Upl, Upl")
2008            (div:SVE_F (match_operand:SVE_F 2 "register_operand" "0, w")
2009                       (match_operand:SVE_F 3 "register_operand" "w, 0"))]
2010           UNSPEC_MERGE_PTRUE))]
2011   "TARGET_SVE"
2012   "@
2013    fdiv\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>
2014    fdivr\t%0.<Vetype>, %1/m, %0.<Vetype>, %2.<Vetype>"
2015 )
2016
2017 ;; Unpredicated FNEG, FABS and FSQRT.
     ;; One expander per code in the SVE_FP_UNARY iterator.  Operand 2 is an
     ;; all-ones <VPRED> constant forced into a register by the preparation
     ;; statement.
2018 (define_expand "<optab><mode>2"
2019   [(set (match_operand:SVE_F 0 "register_operand")
2020         (unspec:SVE_F
2021           [(match_dup 2)
2022            (SVE_FP_UNARY:SVE_F (match_operand:SVE_F 1 "register_operand"))]
2023           UNSPEC_MERGE_PTRUE))]
2024   "TARGET_SVE"
2025   {
2026     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
2027   }
2028 )
2029
2030 ;; FNEG, FABS and FSQRT predicated with a PTRUE.
     ;; The mnemonic comes from <sve_fp_op>.  The input (operand 2) is not
     ;; tied to the destination; operand 1 is the governing predicate.
2031 (define_insn "*<optab><mode>2"
2032   [(set (match_operand:SVE_F 0 "register_operand" "=w")
2033         (unspec:SVE_F
2034           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2035            (SVE_FP_UNARY:SVE_F (match_operand:SVE_F 2 "register_operand" "w"))]
2036           UNSPEC_MERGE_PTRUE))]
2037   "TARGET_SVE"
2038   "<sve_fp_op>\t%0.<Vetype>, %1/m, %2.<Vetype>"
2039 )
2040
2041 ;; Unpredicated FRINTy.
     ;; One expander per member of the FRINT unspec iterator, named by
     ;; <frint_pattern>.  Operand 2 is an all-ones <VPRED> constant forced
     ;; into a register by the preparation statement.
2042 (define_expand "<frint_pattern><mode>2"
2043   [(set (match_operand:SVE_F 0 "register_operand")
2044         (unspec:SVE_F
2045           [(match_dup 2)
2046            (unspec:SVE_F [(match_operand:SVE_F 1 "register_operand")]
2047                          FRINT)]
2048           UNSPEC_MERGE_PTRUE))]
2049   "TARGET_SVE"
2050   {
2051     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
2052   }
2053 )
2054
2055 ;; FRINTy predicated with a PTRUE.
     ;; The "y" in the mnemonic is filled in from <frint_suffix>.  Operand 1
     ;; is the governing predicate and operand 2 the untied input.
2056 (define_insn "*<frint_pattern><mode>2"
2057   [(set (match_operand:SVE_F 0 "register_operand" "=w")
2058         (unspec:SVE_F
2059           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2060            (unspec:SVE_F [(match_operand:SVE_F 2 "register_operand" "w")]
2061                          FRINT)]
2062           UNSPEC_MERGE_PTRUE))]
2063   "TARGET_SVE"
2064   "frint<frint_suffix>\t%0.<Vetype>, %1/m, %2.<Vetype>"
2065 )
2066
2067 ;; Unpredicated conversion of floats to integers of the same size (HF to HI,
2068 ;; SF to SI or DF to DI).
     ;; FIXUORS covers both signednesses.  Operand 2 is an all-ones <VPRED>
     ;; constant forced into a register by the preparation statement; the
     ;; result mode is <V_INT_EQUIV> of the SVE_F input mode.
2069 (define_expand "<fix_trunc_optab><mode><v_int_equiv>2"
2070   [(set (match_operand:<V_INT_EQUIV> 0 "register_operand")
2071         (unspec:<V_INT_EQUIV>
2072           [(match_dup 2)
2073            (FIXUORS:<V_INT_EQUIV>
2074              (match_operand:SVE_F 1 "register_operand"))]
2075           UNSPEC_MERGE_PTRUE))]
2076   "TARGET_SVE"
2077   {
2078     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
2079   }
2080 )
2081
2082 ;; Conversion of HF to DI, SI or HI, predicated with a PTRUE.
     ;; The source is always a VNx8HF vector (printed as %2.h); the integer
     ;; destination mode ranges over SVE_HSDI and supplies both <VPRED> and
     ;; the destination element suffix.  The internal name uses "vnx8hf" to
     ;; match the source mode, like the vnx4sf and vnx2df patterns.
2083 (define_insn "*<fix_trunc_optab>vnx8hf<mode>2"
2084   [(set (match_operand:SVE_HSDI 0 "register_operand" "=w")
2085         (unspec:SVE_HSDI
2086           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2087            (FIXUORS:SVE_HSDI
2088              (match_operand:VNx8HF 2 "register_operand" "w"))]
2089           UNSPEC_MERGE_PTRUE))]
2090   "TARGET_SVE"
2091   "fcvtz<su>\t%0.<Vetype>, %1/m, %2.h"
2092 )
2093
2094 ;; Conversion of SF to DI or SI, predicated with a PTRUE.
     ;; The source is always a VNx4SF vector (printed as %2.s); the integer
     ;; destination mode ranges over SVE_SDI and supplies <VPRED>.
2095 (define_insn "*<fix_trunc_optab>vnx4sf<mode>2"
2096   [(set (match_operand:SVE_SDI 0 "register_operand" "=w")
2097         (unspec:SVE_SDI
2098           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2099            (FIXUORS:SVE_SDI
2100              (match_operand:VNx4SF 2 "register_operand" "w"))]
2101           UNSPEC_MERGE_PTRUE))]
2102   "TARGET_SVE"
2103   "fcvtz<su>\t%0.<Vetype>, %1/m, %2.s"
2104 )
2105
2106 ;; Conversion of DF to DI or SI, predicated with a PTRUE.
     ;; The source is always a VNx2DF vector (printed as %2.d).  Unlike the
     ;; HF and SF patterns, the predicate mode is fixed at VNx2BI instead of
     ;; being derived from the destination mode.
2107 (define_insn "*<fix_trunc_optab>vnx2df<mode>2"
2108   [(set (match_operand:SVE_SDI 0 "register_operand" "=w")
2109         (unspec:SVE_SDI
2110           [(match_operand:VNx2BI 1 "register_operand" "Upl")
2111            (FIXUORS:SVE_SDI
2112              (match_operand:VNx2DF 2 "register_operand" "w"))]
2113           UNSPEC_MERGE_PTRUE))]
2114   "TARGET_SVE"
2115   "fcvtz<su>\t%0.<Vetype>, %1/m, %2.d"
2116 )
2117
2118 ;; Unpredicated conversion of integers to floats of the same size
2119 ;; (HI to HF, SI to SF or DI to DF).
     ;; FLOATUORS covers both signednesses.  Operand 2 is an all-ones <VPRED>
     ;; constant forced into a register by the preparation statement; the
     ;; input mode is <V_INT_EQUIV> of the SVE_F result mode.
2120 (define_expand "<optab><v_int_equiv><mode>2"
2121   [(set (match_operand:SVE_F 0 "register_operand")
2122         (unspec:SVE_F
2123           [(match_dup 2)
2124            (FLOATUORS:SVE_F
2125              (match_operand:<V_INT_EQUIV> 1 "register_operand"))]
2126           UNSPEC_MERGE_PTRUE))]
2127   "TARGET_SVE"
2128   {
2129     operands[2] = force_reg (<VPRED>mode, CONSTM1_RTX (<VPRED>mode));
2130   }
2131 )
2132
2133 ;; Conversion of DI, SI or HI to the same number of HFs, predicated
2134 ;; with a PTRUE.
     ;; The destination is always VNx8HF (printed as %0.h); the integer
     ;; source mode ranges over SVE_HSDI and supplies <VPRED> and the source
     ;; element suffix.
2135 (define_insn "*<optab><mode>vnx8hf2"
2136   [(set (match_operand:VNx8HF 0 "register_operand" "=w")
2137         (unspec:VNx8HF
2138           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2139            (FLOATUORS:VNx8HF
2140              (match_operand:SVE_HSDI 2 "register_operand" "w"))]
2141           UNSPEC_MERGE_PTRUE))]
2142   "TARGET_SVE"
2143   "<su_optab>cvtf\t%0.h, %1/m, %2.<Vetype>"
2144 )
2145
2146 ;; Conversion of DI or SI to the same number of SFs, predicated with a PTRUE.
     ;; The destination is always VNx4SF (printed as %0.s); the integer
     ;; source mode ranges over SVE_SDI and supplies <VPRED>.
2147 (define_insn "*<optab><mode>vnx4sf2"
2148   [(set (match_operand:VNx4SF 0 "register_operand" "=w")
2149         (unspec:VNx4SF
2150           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2151            (FLOATUORS:VNx4SF
2152              (match_operand:SVE_SDI 2 "register_operand" "w"))]
2153           UNSPEC_MERGE_PTRUE))]
2154   "TARGET_SVE"
2155   "<su_optab>cvtf\t%0.s, %1/m, %2.<Vetype>"
2156 )
2157
2158 ;; Conversion of DI or SI to DF, predicated with a PTRUE.
     ;; The destination is always VNx2DF (printed as %0.d) and the predicate
     ;; mode is fixed at VNx2BI instead of being derived from the source
     ;; mode.
2159 (define_insn "*<optab><mode>vnx2df2"
2160   [(set (match_operand:VNx2DF 0 "register_operand" "=w")
2161         (unspec:VNx2DF
2162           [(match_operand:VNx2BI 1 "register_operand" "Upl")
2163            (FLOATUORS:VNx2DF
2164              (match_operand:SVE_SDI 2 "register_operand" "w"))]
2165           UNSPEC_MERGE_PTRUE))]
2166   "TARGET_SVE"
2167   "<su_optab>cvtf\t%0.d, %1/m, %2.<Vetype>"
2168 )
2169
2170 ;; Conversion of DFs to the same number of SFs, or SFs to the same number
2171 ;; of HFs.
     ;; The predicate has the mode associated with the wider source
     ;; (<VWIDE_PRED>).  FCVT prints the destination with the narrow element
     ;; suffix (<Vetype>) and the source with the wide one (<Vewtype>).
2172 (define_insn "*trunc<Vwide><mode>2"
2173   [(set (match_operand:SVE_HSF 0 "register_operand" "=w")
2174         (unspec:SVE_HSF
2175           [(match_operand:<VWIDE_PRED> 1 "register_operand" "Upl")
2176            (unspec:SVE_HSF
2177              [(match_operand:<VWIDE> 2 "register_operand" "w")]
2178              UNSPEC_FLOAT_CONVERT)]
2179           UNSPEC_MERGE_PTRUE))]
2180   "TARGET_SVE"
2181   "fcvt\t%0.<Vetype>, %1/m, %2.<Vewtype>"
2182 )
2183
2184 ;; Conversion of SFs to the same number of DFs, or HFs to the same number
2185 ;; of SFs.
     ;; Mirror image of the truncating pattern: the destination has mode
     ;; <VWIDE> and is printed with <Vewtype>, the source is the narrow
     ;; SVE_HSF mode, and the predicate again has mode <VWIDE_PRED>.
2186 (define_insn "*extend<mode><Vwide>2"
2187   [(set (match_operand:<VWIDE> 0 "register_operand" "=w")
2188         (unspec:<VWIDE>
2189           [(match_operand:<VWIDE_PRED> 1 "register_operand" "Upl")
2190            (unspec:<VWIDE>
2191              [(match_operand:SVE_HSF 2 "register_operand" "w")]
2192              UNSPEC_FLOAT_CONVERT)]
2193           UNSPEC_MERGE_PTRUE))]
2194   "TARGET_SVE"
2195   "fcvt\t%0.<Vewtype>, %1/m, %2.<Vetype>"
2196 )
2197
2198 ;; PUNPKHI and PUNPKLO.
     ;; Unpacks one half of a PRED_BHS predicate into the <VWIDE> predicate
     ;; mode.  The template always prints ".h" and ".b" suffixes regardless
     ;; of the mode, and both operands use the "Upa" predicate constraint.
2199 (define_insn "vec_unpack<su>_<perm_hilo>_<mode>"
2200   [(set (match_operand:<VWIDE> 0 "register_operand" "=Upa")
2201         (unspec:<VWIDE> [(match_operand:PRED_BHS 1 "register_operand" "Upa")]
2202                         UNPACK))]
2203   "TARGET_SVE"
2204   "punpk<perm_hilo>\t%0.h, %1.b"
2205 )
2206
2207 ;; SUNPKHI, UUNPKHI, SUNPKLO and UUNPKLO.
     ;; Unpacks one half of an SVE_BHSI data vector into <VWIDE>.  The <su>
     ;; and <perm_hilo> attributes of the UNPACK iterator select signedness
     ;; and half; the destination is printed with the wide element suffix.
2208 (define_insn "vec_unpack<su>_<perm_hilo>_<SVE_BHSI:mode>"
2209   [(set (match_operand:<VWIDE> 0 "register_operand" "=w")
2210         (unspec:<VWIDE> [(match_operand:SVE_BHSI 1 "register_operand" "w")]
2211                         UNPACK))]
2212   "TARGET_SVE"
2213   "<su>unpk<perm_hilo>\t%0.<Vewtype>, %1.<Vetype>"
2214 )
2215
2216 ;; Used by the vec_unpacks_<perm_hilo>_<mode> expander to unpack the bit
2217 ;; representation of a VNx4SF or VNx8HF without conversion.  The choice
2218 ;; between signed and unsigned isn't significant.
     ;; Source and destination have the same SVE_HSF mode in the RTL, but
     ;; the UUNPK template prints the destination with the wide element
     ;; suffix (<Vewtype>) and the source with the narrow one (<Vetype>).
2219 (define_insn "*vec_unpacku_<perm_hilo>_<mode>_no_convert"
2220   [(set (match_operand:SVE_HSF 0 "register_operand" "=w")
2221         (unspec:SVE_HSF [(match_operand:SVE_HSF 1 "register_operand" "w")]
2222                         UNPACK_UNSIGNED))]
2223   "TARGET_SVE"
2224   "uunpk<perm_hilo>\t%0.<Vewtype>, %1.<Vetype>"
2225 )
2226
2227 ;; Unpack one half of a VNx4SF to VNx2DF, or one half of a VNx8HF to VNx4SF.
2228 ;; First unpack the source without conversion, then float-convert the
2229 ;; unpacked source.
     ;; Operand 2 is a fresh <MODE> temporary that receives the unpacked
     ;; bits; operand 3 is an all-ones <VWIDE_PRED> constant forced into a
     ;; register and used to predicate the conversion.
2230 (define_expand "vec_unpacks_<perm_hilo>_<mode>"
2231   [(set (match_dup 2)
2232         (unspec:SVE_HSF [(match_operand:SVE_HSF 1 "register_operand")]
2233                         UNPACK_UNSIGNED))
2234    (set (match_operand:<VWIDE> 0 "register_operand")
2235         (unspec:<VWIDE> [(match_dup 3)
2236                          (unspec:<VWIDE> [(match_dup 2)] UNSPEC_FLOAT_CONVERT)]
2237                         UNSPEC_MERGE_PTRUE))]
2238   "TARGET_SVE"
2239   {
2240     operands[2] = gen_reg_rtx (<MODE>mode);
2241     operands[3] = force_reg (<VWIDE_PRED>mode, CONSTM1_RTX (<VWIDE_PRED>mode));
2242   }
2243 )
2244
2245 ;; Unpack one half of a VNx4SI to VNx2DF.  First unpack from VNx4SI
2246 ;; to VNx2DI, reinterpret the VNx2DI as a VNx4SI, then convert the
2247 ;; unpacked VNx4SI to VNx2DF.
     ;; Operand 2 is a fresh VNx2DI temporary for the unpacked value,
     ;; operand 3 an all-ones VNx2BI constant forced into a register, and
     ;; operand 4 a VNx4SI subreg of operand 2 at offset 0, which is what
     ;; the FLOATUORS conversion reads.
2248 (define_expand "vec_unpack<su_optab>_float_<perm_hilo>_vnx4si"
2249   [(set (match_dup 2)
2250         (unspec:VNx2DI [(match_operand:VNx4SI 1 "register_operand")]
2251                        UNPACK_UNSIGNED))
2252    (set (match_operand:VNx2DF 0 "register_operand")
2253         (unspec:VNx2DF [(match_dup 3)
2254                         (FLOATUORS:VNx2DF (match_dup 4))]
2255                        UNSPEC_MERGE_PTRUE))]
2256   "TARGET_SVE"
2257   {
2258     operands[2] = gen_reg_rtx (VNx2DImode);
2259     operands[3] = force_reg (VNx2BImode, CONSTM1_RTX (VNx2BImode));
2260     operands[4] = gen_rtx_SUBREG (VNx4SImode, operands[2], 0);
2261   }
2262 )
2263
2264 ;; Predicate pack.  Use UZP1 on the narrower type, which discards
2265 ;; the high part of each wide element.
     ;; Both inputs have the <VWIDE> predicate mode but are printed with the
     ;; narrow element suffix (<Vetype>) of the PRED_BHS result.
2266 (define_insn "vec_pack_trunc_<Vwide>"
2267   [(set (match_operand:PRED_BHS 0 "register_operand" "=Upa")
2268         (unspec:PRED_BHS
2269           [(match_operand:<VWIDE> 1 "register_operand" "Upa")
2270            (match_operand:<VWIDE> 2 "register_operand" "Upa")]
2271           UNSPEC_PACK))]
2272   "TARGET_SVE"
2273   "uzp1\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
2274 )
2275
2276 ;; Integer pack.  Use UZP1 on the narrower type, which discards
2277 ;; the high part of each wide element.
     ;; Both inputs have the <VWIDE> data mode but are printed with the
     ;; narrow element suffix (<Vetype>) of the SVE_BHSI result.
2278 (define_insn "vec_pack_trunc_<Vwide>"
2279   [(set (match_operand:SVE_BHSI 0 "register_operand" "=w")
2280         (unspec:SVE_BHSI
2281           [(match_operand:<VWIDE> 1 "register_operand" "w")
2282            (match_operand:<VWIDE> 2 "register_operand" "w")]
2283           UNSPEC_PACK))]
2284   "TARGET_SVE"
2285   "uzp1\t%0.<Vetype>, %1.<Vetype>, %2.<Vetype>"
2286 )
2287
2288 ;; Convert two vectors of DF to SF, or two vectors of SF to HF, and pack
2289 ;; the results into a single vector.
     ;; Three sets are emitted: each <VWIDE> input is float-converted into
     ;; its own fresh <MODE> temporary (operands 4 and 5) under a shared
     ;; all-ones <VWIDE_PRED> predicate (operand 3), and the two temporaries
     ;; are then combined with UNSPEC_UZP1.
2290 (define_expand "vec_pack_trunc_<Vwide>"
2291   [(set (match_dup 4)
2292         (unspec:SVE_HSF
2293           [(match_dup 3)
2294            (unspec:SVE_HSF [(match_operand:<VWIDE> 1 "register_operand")]
2295                            UNSPEC_FLOAT_CONVERT)]
2296           UNSPEC_MERGE_PTRUE))
2297    (set (match_dup 5)
2298         (unspec:SVE_HSF
2299           [(match_dup 3)
2300            (unspec:SVE_HSF [(match_operand:<VWIDE> 2 "register_operand")]
2301                            UNSPEC_FLOAT_CONVERT)]
2302           UNSPEC_MERGE_PTRUE))
2303    (set (match_operand:SVE_HSF 0 "register_operand")
2304         (unspec:SVE_HSF [(match_dup 4) (match_dup 5)] UNSPEC_UZP1))]
2305   "TARGET_SVE"
2306   {
2307     operands[3] = force_reg (<VWIDE_PRED>mode, CONSTM1_RTX (<VWIDE_PRED>mode));
2308     operands[4] = gen_reg_rtx (<MODE>mode);
2309     operands[5] = gen_reg_rtx (<MODE>mode);
2310   }
2311 )
2312
2313 ;; Convert two vectors of DF to SI and pack the results into a single vector.
     ;; Same three-step shape as the float pack: each VNx2DF input is
     ;; converted with FIXUORS into its own fresh VNx4SI temporary
     ;; (operands 4 and 5) under a shared all-ones VNx2BI predicate
     ;; (operand 3), and the temporaries are combined with UNSPEC_UZP1.
2314 (define_expand "vec_pack_<su>fix_trunc_vnx2df"
2315   [(set (match_dup 4)
2316         (unspec:VNx4SI
2317           [(match_dup 3)
2318            (FIXUORS:VNx4SI (match_operand:VNx2DF 1 "register_operand"))]
2319           UNSPEC_MERGE_PTRUE))
2320    (set (match_dup 5)
2321         (unspec:VNx4SI
2322           [(match_dup 3)
2323            (FIXUORS:VNx4SI (match_operand:VNx2DF 2 "register_operand"))]
2324           UNSPEC_MERGE_PTRUE))
2325    (set (match_operand:VNx4SI 0 "register_operand")
2326         (unspec:VNx4SI [(match_dup 4) (match_dup 5)] UNSPEC_UZP1))]
2327   "TARGET_SVE"
2328   {
2329     operands[3] = force_reg (VNx2BImode, CONSTM1_RTX (VNx2BImode));
2330     operands[4] = gen_reg_rtx (VNx4SImode);
2331     operands[5] = gen_reg_rtx (VNx4SImode);
2332   }
2333 )
2334
2335 ;; Predicated floating-point operations.
     ;; Operand 1 is a caller-supplied predicate, printed with "/m" in the
     ;; output template.  Operand 2 must be in the destination register
     ;; (constraint "0"); operand 3 is the other input.  The operation itself
     ;; is selected by the SVE_COND_FP_OP unspec iterator.
2336 (define_insn "cond_<optab><mode>"
2337   [(set (match_operand:SVE_F 0 "register_operand" "=w")
2338         (unspec:SVE_F
2339           [(match_operand:<VPRED> 1 "register_operand" "Upl")
2340            (match_operand:SVE_F 2 "register_operand" "0")
2341            (match_operand:SVE_F 3 "register_operand" "w")]
2342           SVE_COND_FP_OP))]
2343   "TARGET_SVE"
2344   "<sve_fp_op>\t%0.<Vetype>, %1/m, %0.<Vetype>, %3.<Vetype>"
2345 )
2346
2347 ;; Shift an SVE vector left and insert a scalar into element 0.
     ;; The vector input (operand 1) is tied to the destination.  The scalar
     ;; (operand 2) may come from a general register (alternative 1, printed
     ;; with the <vwcore> prefix) or an FP/SIMD register (alternative 2,
     ;; printed with the <Vetype> prefix); both emit INSR.
     ;; NOTE(review): the "Z" in "rZ" looks unreachable while the predicate
     ;; is register_operand -- confirm whether a reg-or-zero predicate was
     ;; intended here.
2348 (define_insn "vec_shl_insert_<mode>"
2349   [(set (match_operand:SVE_ALL 0 "register_operand" "=w, w")
2350         (unspec:SVE_ALL
2351           [(match_operand:SVE_ALL 1 "register_operand" "0, 0")
2352            (match_operand:<VEL> 2 "register_operand" "rZ, w")]
2353           UNSPEC_INSR))]
2354   "TARGET_SVE"
2355   "@
2356    insr\t%0.<Vetype>, %<vwcore>2
2357    insr\t%0.<Vetype>, %<Vetype>2"
2358 )