;; Copyright (C) 2009-2024 Free Software Foundation, Inc.
;; Contributed by Michael Meissner <meissner@linux.vnet.ibm.com>

;; This file is part of GCC.

;; GCC is free software; you can redistribute it and/or modify it
;; under the terms of the GNU General Public License as published
;; by the Free Software Foundation; either version 3, or (at your
;; option) any later version.

;; GCC is distributed in the hope that it will be useful, but WITHOUT
;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
;; or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
;; License for more details.

;; You should have received a copy of the GNU General Public License
;; along with GCC; see the file COPYING3.  If not see
;; <http://www.gnu.org/licenses/>.
;; Iterator for comparison types
(define_code_iterator CMP_TEST [eq lt gt unordered])

;; Mode attribute for vector floate and floato conversions
(define_mode_attr VF_sxddp [(V2DI "sxd") (V2DF "dp")])

;; Iterator for both scalar and vector floating point types supported by VSX
(define_mode_iterator VSX_B [DF V4SF V2DF])

;; Iterator for the 2 64-bit vector types
(define_mode_iterator VSX_D [V2DF V2DI])
;; Mode iterator to handle swapping words on little endian for the 128-bit
;; types that go in a single vector register.
(define_mode_iterator VSX_LE_128 [(KF "FLOAT128_VECTOR_P (KFmode)")
                                  (TF "FLOAT128_VECTOR_P (TFmode)")
;; Iterator for the 2 32-bit vector types
(define_mode_iterator VSX_W [V4SF V4SI])

;; Iterator for the DF types
(define_mode_iterator VSX_DF [V2DF DF])

;; Iterator for vector floating point types supported by VSX
(define_mode_iterator VSX_F [V4SF V2DF])

;; Iterator for logical types supported by VSX
(define_mode_iterator VSX_L [V16QI
                             (KF "FLOAT128_VECTOR_P (KFmode)")
                             (TF "FLOAT128_VECTOR_P (TFmode)")])
;; Iterator for memory moves.
(define_mode_iterator VSX_M [V16QI
                             (KF "FLOAT128_VECTOR_P (KFmode)")
                             (TF "FLOAT128_VECTOR_P (TFmode)")

(define_mode_attr VSX_XXBR [(V8HI "h")

;; Map into the appropriate load/store name based on the type
(define_mode_attr VSm [(V16QI "vw4")

;; Map the register class used
(define_mode_attr VSr [(V16QI "v")

;; What value we need in the "isa" field, to make the IEEE QP float work.
(define_mode_attr VSisa [(V16QI "*")
;; A mode attribute to disparage use of GPR registers, except for scalar
;; integer modes.
(define_mode_attr ??r [(V16QI "??r")
;; A mode attribute used for 128-bit constant values.
(define_mode_attr nW [(V16QI "W")

;; Same size integer type for floating point data
(define_mode_attr VSi [(V4SF "v4si")

(define_mode_attr VSI [(V4SF "V4SI")

;; Word size for same size conversion
(define_mode_attr VSc [(V4SF "w")
;; Map into either s or v, depending on whether this is a scalar or vector
;; operation
(define_mode_attr VSv [(V16QI "v")
;; Appropriate type for add ops (and other simple FP ops)
(define_mode_attr VStype_simple [(V2DF "vecdouble")

;; Appropriate type for multiply ops
(define_mode_attr VStype_mul [(V2DF "vecdouble")

;; Appropriate type for divide ops.
(define_mode_attr VStype_div [(V2DF "vecdiv")

;; Map to a double-sized vector mode
(define_mode_attr VS_double [(V4SI "V8SI")

;; Iterators for loading constants with xxspltib
(define_mode_iterator VSINT_84 [V4SI V2DI DI SI])
(define_mode_iterator VSINT_842 [V8HI V4SI V2DI])

;; Vector reverse byte modes
(define_mode_iterator VEC_REVB [V8HI V4SI V2DI V4SF V2DF V1TI])
;; Iterator for ISA 3.0 vector extract/insert of small integer vectors.
;; VSX_EXTRACT_I2 doesn't include V4SImode because SI extracts can be
;; done on ISA 2.07 and not just ISA 3.0.
(define_mode_iterator VSX_EXTRACT_I [V16QI V8HI V4SI])
(define_mode_iterator VSX_EXTRACT_I2 [V16QI V8HI])
(define_mode_iterator VSX_EXTRACT_I4 [V16QI V8HI V4SI V2DI])

(define_mode_attr VSX_EXTRACT_WIDTH [(V16QI "b")
;; Mode attribute to give the correct predicate for ISA 3.0 vector extract and
;; insert to validate the operand number.
(define_mode_attr VSX_EXTRACT_PREDICATE [(V16QI "const_0_to_15_operand")
                                         (V8HI "const_0_to_7_operand")
                                         (V4SI "const_0_to_3_operand")])
;; Mode attribute to give the constraint for vector extract and insert
(define_mode_attr VSX_EX [(V16QI "v")
;; Mode iterator for binary floating types other than double, to
;; optimize converting to those floating point types from an extract
;; of an integer type
(define_mode_iterator VSX_EXTRACT_FL [SF
                                      (IF "FLOAT128_2REG_P (IFmode)")
                                      (KF "TARGET_FLOAT128_HW")
                                      (TF "FLOAT128_2REG_P (TFmode)
                                           || (FLOAT128_IEEE_P (TFmode)
                                               && TARGET_FLOAT128_HW)")])
;; Mode iterator for binary floating types that have a direct conversion
;; from 64-bit integer to floating point
(define_mode_iterator FL_CONV [SF
                               (KF "TARGET_FLOAT128_HW")
                               (TF "TARGET_FLOAT128_HW
                                    && FLOAT128_IEEE_P (TFmode)")])

;; Iterator for the 2 short vector types to do a splat from an integer
(define_mode_iterator VSX_SPLAT_I [V16QI V8HI])

;; Mode attribute to give the count for the splat instruction to splat
;; the value in the 64-bit integer slot
(define_mode_attr VSX_SPLAT_COUNT [(V16QI "7") (V8HI "3")])

;; Mode attribute to give the suffix for the splat instruction
(define_mode_attr VSX_SPLAT_SUFFIX [(V16QI "b") (V8HI "h")])
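
;; For example, splatting the value sitting in the 64-bit integer slot across
;; a V8HI register uses count 3 and suffix "h" (a sketch of the emitted
;; assembly, register numbers arbitrary):
;;   vsplth 0,0,3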
;; Iterator for the move to mask instructions
(define_mode_iterator VSX_MM [V16QI V8HI V4SI V2DI V1TI])
(define_mode_iterator VSX_MM4 [V16QI V8HI V4SI V2DI])

;; Longer vec int modes for rotate/mask ops
;; and Vector Integer Multiply/Divide/Modulo Instructions
(define_mode_iterator VIlong [V2DI V4SI])
;; Constants for creating unspecs
(define_c_enum "unspec"
   UNSPEC_VSX_UNS_FLOAT2
   UNSPEC_VSX_UNS_FLOATE
   UNSPEC_VSX_UNS_FLOATO
   UNSPEC_VSX_SIGN_EXTEND
   UNSPEC_VSX_XVCVBF16SPN
   UNSPEC_VSX_XVCVSPBF16
   UNSPEC_VSX_XVCVSPSXDS
   UNSPEC_VSX_VEXTRACT_FP_FROM_SHORTH
   UNSPEC_VSX_VEXTRACT_FP_FROM_SHORTL
   UNSPEC_VSX_FIRST_MATCH_INDEX
   UNSPEC_VSX_FIRST_MATCH_EOS_INDEX
   UNSPEC_VSX_FIRST_MISMATCH_INDEX
   UNSPEC_VSX_FIRST_MISMATCH_EOS_INDEX
(define_int_iterator XVCVBF16 [UNSPEC_VSX_XVCVSPBF16
                               UNSPEC_VSX_XVCVBF16SPN])

(define_int_attr xvcvbf16 [(UNSPEC_VSX_XVCVSPBF16 "xvcvspbf16")
                           (UNSPEC_VSX_XVCVBF16SPN "xvcvbf16spn")])

;; Like VI, defined in vector.md, but add ISA 2.07 integer vector ops
(define_mode_iterator VI2 [V4SI V8HI V16QI V2DI])

;; Aligned and unaligned vector replace iterator/attr for 32-bit and
;; 64-bit elements
(define_mode_iterator REPLACE_ELT_V [V4SI V4SF V2DI V2DF])
(define_mode_iterator REPLACE_ELT [SI SF DI DF])
(define_mode_attr REPLACE_ELT_char [(V4SI "w") (V4SF "w")
                                    (V2DI "d") (V2DF "d")

(define_mode_attr REPLACE_ELT_sh [(V4SI "2") (V4SF "2")
                                  (V2DI "3") (V2DF "3")])
(define_mode_attr REPLACE_ELT_max [(V4SI "12") (V4SF "12")
                                   (V2DI "8") (V2DF "8")])

;; Like VM2 in altivec.md, just do char, short, int, long, float and double
(define_mode_iterator VM3 [V4SI

(define_mode_iterator V2DI_DI [V2DI DI])
(define_mode_attr DI_to_TI [(V2DI "V1TI")

(define_mode_attr VM3_char [(V2DI "d")

;; Iterator and attribute for vector count leading/trailing
;; zero least-significant bits byte
(define_int_iterator VCZLSBB [UNSPEC_VCLZLSBB
                              UNSPEC_VCTZLSBB])
(define_int_attr vczlsbb_char [(UNSPEC_VCLZLSBB "l")
                               (UNSPEC_VCTZLSBB "t")])
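
;; Usage sketch (C, ISA 3.0): these unspecs back the vec_cntlz_lsbb and
;; vec_cnttz_lsbb intrinsics, which count leading/trailing bytes whose
;; least-significant bit is clear:
;;
;;   #include <altivec.h>
;;   int lead (vector unsigned char v)
;;   {
;;     return vec_cntlz_lsbb (v);	/* vclzlsbb, or vctzlsbb on LE */
;;   }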
;; TImode memory to memory move optimization on LE with p8vector
(define_insn_and_split "*vsx_le_mem_to_mem_mov_ti"
  [(set (match_operand:TI 0 "indexed_or_indirect_operand" "=Z")
        (match_operand:TI 1 "indexed_or_indirect_operand" "Z"))]
   && can_create_pseudo_p ()"
  rtx tmp = gen_reg_rtx (V2DImode);
  rtx src = adjust_address (operands[1], V2DImode, 0);
  emit_insn (gen_vsx_ld_elemrev_v2di (tmp, src));
  rtx dest = adjust_address (operands[0], V2DImode, 0);
  emit_insn (gen_vsx_st_elemrev_v2di (dest, tmp));
  [(set_attr "length" "16")])
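
;; The point of the split above: loading and storing with the
;; element-reversing patterns makes the two little-endian reversals cancel,
;; so a TImode memory-to-memory copy needs no xxpermdi swaps at all, e.g.
;; (a sketch, register numbers arbitrary):
;;   lxvd2x 0,0,3
;;   stxvd2x 0,0,4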
;; The patterns for LE permuted loads and stores come before the general
;; VSX moves so they match first.
(define_insn_and_split "*vsx_le_perm_load_<mode>"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (match_operand:VSX_D 1 "indexed_or_indirect_operand" "Z"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
           (parallel [(const_int 1) (const_int 0)])))
           (parallel [(const_int 1) (const_int 0)])))]
  rtx mem = operands[1];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register destination is not in the altivec
     range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_NUM_P (reg_or_subregno (operands[0]))
          || ALTIVEC_REGNO_P (reg_or_subregno (operands[0]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);

      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          /* Replace the source memory address with masked address.  */
          rtx lvx_set_expr = rs6000_gen_lvx (mode, operands[0], mem);
          emit_insn (lvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches lvx
             instruction, so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping load.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[0])
  [(set_attr "type" "vecload")
   (set_attr "length" "8")])
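
;; When the lvx transformation does not apply, the swapping load above
;; typically becomes an element-reversing load plus a doubleword swap
;; (a sketch):
;;   lxvd2x 0,0,3
;;   xxpermdi 0,0,0,2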
(define_insn_and_split "*vsx_le_perm_load_<mode>"
  [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
        (match_operand:VSX_W 1 "indexed_or_indirect_operand" "Z"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))]
  rtx mem = operands[1];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register destination is not in the altivec
     range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_P (operands[0])
          || ALTIVEC_REGNO_P (REGNO (operands[0]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);

      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          /* Replace the source memory address with masked address.  */
          rtx lvx_set_expr = rs6000_gen_lvx (mode, operands[0], mem);
          emit_insn (lvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches lvx
             instruction, so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping load.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[0])
  [(set_attr "type" "vecload")
   (set_attr "length" "8")])
(define_insn_and_split "*vsx_le_perm_load_v8hi"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
        (match_operand:V8HI 1 "indexed_or_indirect_operand" "Z"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))]
  rtx mem = operands[1];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register destination is not in the altivec
     range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_P (operands[0])
          || ALTIVEC_REGNO_P (REGNO (operands[0]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);

      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          /* Replace the source memory address with masked address.  */
          rtx lvx_set_expr = rs6000_gen_lvx (mode, operands[0], mem);
          emit_insn (lvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches lvx
             instruction, so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping load.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[0])
  [(set_attr "type" "vecload")
   (set_attr "length" "8")])
(define_insn_and_split "*vsx_le_perm_load_v16qi"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (match_operand:V16QI 1 "indexed_or_indirect_operand" "Z"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))]
  rtx mem = operands[1];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register destination is not in the altivec
     range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_P (operands[0])
          || ALTIVEC_REGNO_P (REGNO (operands[0]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);

      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          /* Replace the source memory address with masked address.  */
          rtx lvx_set_expr = rs6000_gen_lvx (mode, operands[0], mem);
          emit_insn (lvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches lvx
             instruction, so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping load.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[0])
  [(set_attr "type" "vecload")
   (set_attr "length" "8")])
(define_insn "*vsx_le_perm_store_<mode>"
  [(set (match_operand:VSX_D 0 "indexed_or_indirect_operand" "=Z")
        (match_operand:VSX_D 1 "vsx_register_operand" "+wa"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")
   (set_attr "length" "12")])

  [(set (match_operand:VSX_D 0 "indexed_or_indirect_operand")
        (match_operand:VSX_D 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && !reload_completed"
           (parallel [(const_int 1) (const_int 0)])))
           (parallel [(const_int 1) (const_int 0)])))]
  rtx mem = operands[0];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register source is not in the altivec range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_NUM_P (reg_or_subregno (operands[1]))
          || ALTIVEC_REGNO_P (reg_or_subregno (operands[1]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);
      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          rtx stvx_set_expr = rs6000_gen_stvx (mode, mem, operands[1]);
          emit_insn (stvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches stvx instruction,
             so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping store.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[1])
;; The post-reload split requires that we re-permute the source
;; register in case it is still live.
  [(set (match_operand:VSX_D 0 "indexed_or_indirect_operand")
        (match_operand:VSX_D 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && reload_completed"
           (parallel [(const_int 1) (const_int 0)])))
           (parallel [(const_int 1) (const_int 0)])))
           (parallel [(const_int 1) (const_int 0)])))]
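
;; That is, the post-reload store becomes three instructions (a sketch):
;;   xxpermdi 0,0,0,2	; swap the source doublewords
;;   stxvd2x 0,0,3	; element-reversing store
;;   xxpermdi 0,0,0,2	; undo the swap in case the source is still live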
(define_insn "*vsx_le_perm_store_<mode>"
  [(set (match_operand:VSX_W 0 "indexed_or_indirect_operand" "=Z")
        (match_operand:VSX_W 1 "vsx_register_operand" "+wa"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")
   (set_attr "length" "12")])

  [(set (match_operand:VSX_W 0 "indexed_or_indirect_operand")
        (match_operand:VSX_W 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && !reload_completed"
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))]
  rtx mem = operands[0];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register source is not in the altivec range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_NUM_P (reg_or_subregno (operands[1]))
          || ALTIVEC_REGNO_P (reg_or_subregno (operands[1]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);
      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          rtx stvx_set_expr = rs6000_gen_stvx (mode, mem, operands[1]);
          emit_insn (stvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches stvx instruction,
             so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping store.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[1])

;; The post-reload split requires that we re-permute the source
;; register in case it is still live.
  [(set (match_operand:VSX_W 0 "indexed_or_indirect_operand")
        (match_operand:VSX_W 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && reload_completed"
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))
           (parallel [(const_int 2) (const_int 3)
                      (const_int 0) (const_int 1)])))]
(define_insn "*vsx_le_perm_store_v8hi"
  [(set (match_operand:V8HI 0 "indexed_or_indirect_operand" "=Z")
        (match_operand:V8HI 1 "vsx_register_operand" "+wa"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")
   (set_attr "length" "12")])

  [(set (match_operand:V8HI 0 "indexed_or_indirect_operand")
        (match_operand:V8HI 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && !reload_completed"
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))]
  rtx mem = operands[0];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register source is not in the altivec range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_NUM_P (reg_or_subregno (operands[1]))
          || ALTIVEC_REGNO_P (reg_or_subregno (operands[1]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);
      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          rtx stvx_set_expr = rs6000_gen_stvx (mode, mem, operands[1]);
          emit_insn (stvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches stvx instruction,
             so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping store.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[1])

;; The post-reload split requires that we re-permute the source
;; register in case it is still live.
  [(set (match_operand:V8HI 0 "indexed_or_indirect_operand")
        (match_operand:V8HI 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && reload_completed"
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))
           (parallel [(const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)])))]
(define_insn "*vsx_le_perm_store_v16qi"
  [(set (match_operand:V16QI 0 "indexed_or_indirect_operand" "=Z")
        (match_operand:V16QI 1 "vsx_register_operand" "+wa"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")
   (set_attr "length" "12")])

  [(set (match_operand:V16QI 0 "indexed_or_indirect_operand")
        (match_operand:V16QI 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && !reload_completed"
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))]
  rtx mem = operands[0];

  /* Don't apply the swap optimization if we've already performed register
     allocation and the hard register source is not in the altivec range.  */
  if ((MEM_ALIGN (mem) >= 128)
      && (!HARD_REGISTER_NUM_P (reg_or_subregno (operands[1]))
          || ALTIVEC_REGNO_P (reg_or_subregno (operands[1]))))
      rtx mem_address = XEXP (mem, 0);
      enum machine_mode mode = GET_MODE (mem);
      if (REG_P (mem_address) || rs6000_sum_of_two_registers_p (mem_address))
          rtx stvx_set_expr = rs6000_gen_stvx (mode, mem, operands[1]);
          emit_insn (stvx_set_expr);
      else if (rs6000_quadword_masked_address_p (mem_address))
          /* This rtl is already in the form that matches stvx instruction,
             so leave it alone.  */
  /* Otherwise, fall through to transform into a swapping store.  */
  operands[2] = can_create_pseudo_p () ? gen_reg_rtx_and_attrs (operands[1])

;; The post-reload split requires that we re-permute the source
;; register in case it is still live.
  [(set (match_operand:V16QI 0 "indexed_or_indirect_operand")
        (match_operand:V16QI 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR && reload_completed"
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))
           (parallel [(const_int 8) (const_int 9)
                      (const_int 10) (const_int 11)
                      (const_int 12) (const_int 13)
                      (const_int 14) (const_int 15)
                      (const_int 0) (const_int 1)
                      (const_int 2) (const_int 3)
                      (const_int 4) (const_int 5)
                      (const_int 6) (const_int 7)])))]
;; Little endian word swapping for 128-bit types that are either scalars or
;; the special V1TI container class, for which it is not appropriate to use
;; vec_select
(define_insn "*vsx_le_permute_<mode>"
  [(set (match_operand:VEC_TI 0 "nonimmediate_operand" "=wa,wa,Z,&r,&r,Q")
        (match_operand:VEC_TI 1 "input_operand" "wa,Z,wa,r,Q,r")
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR"
   xxpermdi %x0,%x1,%x1,2
   mr %0,%L1\;mr %L0,%1
   ld%U1%X1 %0,%L1\;ld%U1%X1 %L0,%1
   std%U0%X0 %L1,%0\;std%U0%X0 %1,%L0"
  [(set_attr "length" "*,*,*,8,8,8")
   (set_attr "type" "vecperm,vecload,vecstore,*,load,store")])
(define_insn_and_split "*vsx_le_undo_permute_<mode>"
  [(set (match_operand:VEC_TI 0 "vsx_register_operand" "=wa,wa")
        (match_operand:VEC_TI 1 "vsx_register_operand" "0,wa")
  "!BYTES_BIG_ENDIAN && TARGET_VSX"
  [(set (match_dup 0) (match_dup 1))]
  if (reload_completed && REGNO (operands[0]) == REGNO (operands[1]))
    emit_note (NOTE_INSN_DELETED);
  [(set_attr "length" "0,4")
   (set_attr "type" "veclogical")])
(define_insn_and_split "*vsx_le_perm_load_<mode>"
  [(set (match_operand:VSX_LE_128 0 "vsx_register_operand" "=wa,r")
        (match_operand:VSX_LE_128 1 "memory_operand" "Z,Q"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && !altivec_indexed_or_indirect_operand (operands[1], <MODE>mode)"
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && !altivec_indexed_or_indirect_operand (operands[1], <MODE>mode)"
  rtx tmp = (can_create_pseudo_p ()
             ? gen_reg_rtx_and_attrs (operands[0])
  rs6000_emit_le_vsx_permute (tmp, operands[1], <MODE>mode);
  rs6000_emit_le_vsx_permute (operands[0], tmp, <MODE>mode);
  [(set_attr "type" "vecload,load")
   (set_attr "length" "8,8")
   (set_attr "isa" "<VSisa>,*")])
(define_insn "*vsx_le_perm_store_<mode>"
  [(set (match_operand:VSX_LE_128 0 "memory_operand" "=Z,Q")
        (match_operand:VSX_LE_128 1 "vsx_register_operand" "+wa,r"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && !altivec_indexed_or_indirect_operand (operands[0], <MODE>mode)"
  [(set_attr "type" "vecstore,store")
   (set_attr "length" "12,8")
   (set_attr "isa" "<VSisa>,*")])

  [(set (match_operand:VSX_LE_128 0 "memory_operand")
        (match_operand:VSX_LE_128 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !reload_completed && !TARGET_P9_VECTOR
   && !altivec_indexed_or_indirect_operand (operands[0], <MODE>mode)"
  rtx tmp = (can_create_pseudo_p ()
             ? gen_reg_rtx_and_attrs (operands[0])
  rs6000_emit_le_vsx_permute (tmp, operands[1], <MODE>mode);
  rs6000_emit_le_vsx_permute (operands[0], tmp, <MODE>mode);
;; Peepholes to catch loads and stores for TImode if TImode landed in
;; GPR registers on a little endian system.
  [(set (match_operand:VEC_TI 0 "int_reg_operand")
        (rotate:VEC_TI (match_operand:VEC_TI 1 "memory_operand")
   (set (match_operand:VEC_TI 2 "int_reg_operand")
        (rotate:VEC_TI (match_dup 0)
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && (rtx_equal_p (operands[0], operands[2])
       || peep2_reg_dead_p (2, operands[0]))"
  [(set (match_dup 2) (match_dup 1))])

  [(set (match_operand:VEC_TI 0 "int_reg_operand")
        (rotate:VEC_TI (match_operand:VEC_TI 1 "int_reg_operand")
   (set (match_operand:VEC_TI 2 "memory_operand")
        (rotate:VEC_TI (match_dup 0)
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && peep2_reg_dead_p (2, operands[0])"
  [(set (match_dup 2) (match_dup 1))])
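
;; Roughly speaking, these let a GPR __int128 access that was expanded as a
;; rotate-load (or rotate-store) plus the undoing rotate collapse back into a
;; plain move once the intermediate register is known dead, e.g. (C sketch):
;;   __int128 get (__int128 *p) { return *p; }	/* just a pair of ld insns */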
;; Peephole to catch memory to memory transfers for TImode if TImode landed in
;; VSX registers on a little endian system.  The vector types and IEEE 128-bit
;; floating point are handled by the more generic swap elimination pass.
  [(set (match_operand:TI 0 "vsx_register_operand")
        (rotate:TI (match_operand:TI 1 "vsx_register_operand")
   (set (match_operand:TI 2 "vsx_register_operand")
        (rotate:TI (match_dup 0)
  "!BYTES_BIG_ENDIAN && TARGET_VSX && !TARGET_P9_VECTOR
   && (rtx_equal_p (operands[0], operands[2])
       || peep2_reg_dead_p (2, operands[0]))"
  [(set (match_dup 2) (match_dup 1))])
;; The post-reload split requires that we re-permute the source
;; register in case it is still live.
  [(set (match_operand:VSX_LE_128 0 "memory_operand")
        (match_operand:VSX_LE_128 1 "vsx_register_operand"))]
  "!BYTES_BIG_ENDIAN && TARGET_VSX && reload_completed && !TARGET_P9_VECTOR
   && !altivec_indexed_or_indirect_operand (operands[0], <MODE>mode)"
  rs6000_emit_le_vsx_permute (operands[1], operands[1], <MODE>mode);
  rs6000_emit_le_vsx_permute (operands[0], operands[1], <MODE>mode);
  rs6000_emit_le_vsx_permute (operands[1], operands[1], <MODE>mode);
;; Vector constants that can be generated with XXSPLTIB, which was added in
;; ISA 3.0.  Both (const_vector [..]) and (vec_duplicate ...) forms are
;; recognized.
(define_insn "xxspltib_v16qi"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (vec_duplicate:V16QI (match_operand:SI 1 "s8bit_cint_operand" "n")))]
  operands[2] = GEN_INT (INTVAL (operands[1]) & 0xff);
  return "xxspltib %x0,%2";
  [(set_attr "type" "vecperm")])
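
;; Usage sketch (C, ISA 3.0): splatting a small constant into every byte
;; lane takes a single instruction:
;;
;;   #include <altivec.h>
;;   vector signed char all_m5 (void)
;;   {
;;     return vec_splats ((signed char) -5);	/* xxspltib 34,251 */
;;   }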
(define_insn "xxspltib_<mode>_nosplit"
  [(set (match_operand:VSINT_842 0 "vsx_register_operand" "=wa,wa")
        (match_operand:VSINT_842 1 "xxspltib_constant_nosplit" "jwM,wE"))]
  rtx op1 = operands[1];

  if (!xxspltib_constant_p (op1, <MODE>mode, &num_insns, &value)
  operands[2] = GEN_INT (value & 0xff);
  return "xxspltib %x0,%2";
  [(set_attr "type" "vecperm")])

(define_insn_and_split "*xxspltib_<mode>_split"
  [(set (match_operand:VSINT_842 0 "altivec_register_operand" "=v")
        (match_operand:VSINT_842 1 "xxspltib_constant_split" "wS"))]
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx tmp = ((can_create_pseudo_p ())
             ? gen_reg_rtx (V16QImode)
             : gen_lowpart (V16QImode, op0));

  if (!xxspltib_constant_p (op1, <MODE>mode, &num_insns, &value)
  emit_insn (gen_xxspltib_v16qi (tmp, GEN_INT (value)));

  if (<MODE>mode == V2DImode)
    emit_insn (gen_vsx_sign_extend_v16qi_v2di (op0, tmp));

  else if (<MODE>mode == V4SImode)
    emit_insn (gen_vsx_sign_extend_v16qi_v4si (op0, tmp));

  else if (<MODE>mode == V8HImode)
    emit_insn (gen_altivec_vupkhsb (op0, tmp));

  [(set_attr "type" "vecperm")
   (set_attr "length" "8")])
(define_insn_and_split "*vspltisw_v2di_split"
  [(set (match_operand:V2DI 0 "altivec_register_operand" "=v")
        (match_operand:V2DI 1 "vspltisw_vupkhsw_constant_split" "W"))]
  "TARGET_P8_VECTOR && vspltisw_vupkhsw_constant_split (operands[1], V2DImode)"
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx tmp = can_create_pseudo_p ()
            ? gen_reg_rtx (V4SImode)
            : gen_lowpart (V4SImode, op0);

  vspltisw_vupkhsw_constant_p (op1, V2DImode, &value);
  emit_insn (gen_altivec_vspltisw (tmp, GEN_INT (value)));
  emit_insn (gen_altivec_vupkhsw_direct (op0, tmp));

  [(set_attr "type" "vecperm")
   (set_attr "length" "8")])
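
;; A sketch of the split above: a V2DI constant such as { 12, 12 } can be
;; built without a memory load on Power8 as
;;   vspltisw 0,12	; V4SI { 12, 12, 12, 12 }
;;   vupkhsw 0,0	; sign-extend the high words to V2DI { 12, 12 }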
;; Prefer using vector registers over GPRs.  Prefer using ISA 3.0's XXSPLTISB
;; or Altivec VSPLTISW 0/-1 over XXLXOR/XXLORC to set a register to all 0's or
;; all 1's, since the machine does not have to wait for the previous
;; instruction using the register being set (such as a store waiting on a slow
;; instruction).  But generate XXLXOR/XXLORC if it will avoid a register move.

;;              VSX store  VSX load   VSX move  VSX->GPR   GPR->VSX    LQ (GPR)
;;              STQ (GPR)  GPR load   GPR store GPR move   XXSPLTIB    VSPLTISW
;;              VSX 0/-1   VMX const  GPR const LVX (VMX)  STVX (VMX)
(define_insn "vsx_mov<mode>_64bit"
  [(set (match_operand:VSX_M 0 "nonimmediate_operand"
               "=ZwO,      wa,        wa,       r,         we,        ?wQ,
                ?&r,       ??r,       ??Y,      <??r>,     wa,        v,
                ?wa,       v,         <??r>,    wZ,        v")
        (match_operand:VSX_M 1 "input_operand"
               "wa,        ZwO,       wa,       we,        r,         r,
                wQ,        Y,         r,        r,         wE,        jwM,
                ?jwM,      W,         <nW>,     v,         wZ"))]
  "TARGET_POWERPC64 && VECTOR_MEM_VSX_P (<MODE>mode)
   && (register_operand (operands[0], <MODE>mode)
       || register_operand (operands[1], <MODE>mode))"
  return rs6000_output_move_128bit (operands);
    "vecstore,  vecload,   vecsimple, mtvsr,    mfvsr,     load,
     store,     load,      store,     *,        vecsimple, vecsimple,
     vecsimple, *,         *,         vecstore, vecload")
  (set_attr "num_insns"
  (set_attr "max_prefixed_insns"
    "<VSisa>,   <VSisa>,   <VSisa>,   *,        *,         *,
     <VSisa>,   *,         *,         *,        *")
  (set_attr "prefixed"
;;              VSX store  VSX load   VSX move  GPR load   GPR store  GPR move
;;              XXSPLTIB   VSPLTISW   VSX 0/-1  VMX const  GPR const
;;              LVX (VMX)  STVX (VMX)
(define_insn "*vsx_mov<mode>_32bit"
  [(set (match_operand:VSX_M 0 "nonimmediate_operand"
               "=ZwO,      wa,        wa,       ??r,       ??Y,       <??r>,
                wa,        v,         ?wa,      v,         <??r>,
        (match_operand:VSX_M 1 "input_operand"
               "wa,        ZwO,       wa,       Y,         r,         r,
                wE,        jwM,       ?jwM,     W,         <nW>,
  "!TARGET_POWERPC64 && VECTOR_MEM_VSX_P (<MODE>mode)
   && (register_operand (operands[0], <MODE>mode)
       || register_operand (operands[1], <MODE>mode))"
  return rs6000_output_move_128bit (operands);
    "vecstore,  vecload,   vecsimple, load,     store,     *,
     vecsimple, vecsimple, vecsimple, *,        *,
    "*,         *,         *,         16,       16,        16,
    "<VSisa>,   <VSisa>,   <VSisa>,   *,        *,         *,
     p9v,       *,         <VSisa>,   *,        *,
  (set_attr "prefixed"
;; Explicit load/store expanders for the builtin functions
(define_expand "vsx_load_<mode>"
  [(set (match_operand:VSX_M 0 "vsx_register_operand")
        (match_operand:VSX_M 1 "memory_operand"))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
  /* Expand to swaps if needed, prior to swap optimization.  */
  if (!BYTES_BIG_ENDIAN && !TARGET_P9_VECTOR
      && !altivec_indexed_or_indirect_operand (operands[1], <MODE>mode))
      rs6000_emit_le_vsx_move (operands[0], operands[1], <MODE>mode);

(define_expand "vsx_store_<mode>"
  [(set (match_operand:VSX_M 0 "memory_operand")
        (match_operand:VSX_M 1 "vsx_register_operand"))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
  /* Expand to swaps if needed, prior to swap optimization.  */
  if (!BYTES_BIG_ENDIAN && !TARGET_P9_VECTOR
      && !altivec_indexed_or_indirect_operand (operands[0], <MODE>mode))
      rs6000_emit_le_vsx_move (operands[0], operands[1], <MODE>mode);
;; Load rightmost element from load_data
;; using lxvrbx, lxvrhx, lxvrwx, lxvrdx.
(define_insn "vsx_lxvr<wd>x"
  [(set (match_operand:TI 0 "vsx_register_operand" "=wa")
        (zero_extend:TI (match_operand:INT_ISA3 1 "memory_operand" "Z")))]
  [(set_attr "type" "vecload")])

;; Store rightmost element into store_data
;; using stxvrbx, stxvrhx, stxvrwx, stxvrdx.
(define_insn "vsx_stxvr<wd>x"
  [(set (match_operand:INT_ISA3 0 "memory_operand" "=Z")
        (truncate:INT_ISA3 (match_operand:TI 1 "vsx_register_operand" "wa")))]
  "stxvr<wd>x %x1,%y0"
  [(set_attr "type" "vecstore")])
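
;; For instance, the byte form truncates the 128-bit register value and
;; stores only its rightmost byte (an ISA 3.1 sketch, register numbers
;; arbitrary):
;;   stxvrbx 32,0,3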
;; Explicit load/store expanders for the builtin functions for lxvd2x, etc.,
;; when you really want their element-reversing behavior.
(define_insn "vsx_ld_elemrev_v2di"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
        (match_operand:V2DI 1 "memory_operand" "Z")
        (parallel [(const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V2DImode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecload")])

(define_insn "vsx_ld_elemrev_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=wa")
        (match_operand:V1TI 1 "memory_operand" "Z")
        (parallel [(const_int 0)])))]
  "VECTOR_MEM_VSX_P (V1TImode) && !BYTES_BIG_ENDIAN"
  return "lxvd2x %x0,%y1\;xxpermdi %x0,%x0,%x0,2";
  [(set_attr "type" "vecload")])
(define_insn "vsx_ld_elemrev_v2df"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa")
        (match_operand:V2DF 1 "memory_operand" "Z")
        (parallel [(const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V2DFmode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecload")])

(define_insn "vsx_ld_elemrev_v4si"
  [(set (match_operand:V4SI 0 "vsx_register_operand" "=wa")
        (match_operand:V4SI 1 "memory_operand" "Z")
        (parallel [(const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V4SImode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecload")])

(define_insn "vsx_ld_elemrev_v4sf"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (match_operand:V4SF 1 "memory_operand" "Z")
        (parallel [(const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V4SFmode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecload")])
(define_expand "vsx_ld_elemrev_v8hi"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
        (match_operand:V8HI 1 "memory_operand" "Z")
        (parallel [(const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V8HImode) && !BYTES_BIG_ENDIAN"
  if (!TARGET_P9_VECTOR)
      rtx tmp = gen_reg_rtx (V4SImode);
      rtx subreg, subreg2, perm[16], pcv;
      /* 2 is leftmost element in register */
      unsigned int reorder[16] = {13,12,15,14,9,8,11,10,5,4,7,6,1,0,3,2};

      subreg = simplify_gen_subreg (V4SImode, operands[1], V8HImode, 0);
      emit_insn (gen_vsx_ld_elemrev_v4si (tmp, subreg));
      subreg2 = simplify_gen_subreg (V8HImode, tmp, V4SImode, 0);

      for (i = 0; i < 16; ++i)
        perm[i] = GEN_INT (reorder[i]);

      pcv = force_reg (V16QImode,
                       gen_rtx_CONST_VECTOR (V16QImode,
                                             gen_rtvec_v (16, perm)));
      emit_insn (gen_altivec_vperm_v8hi_direct (operands[0], subreg2,
(define_insn "*vsx_ld_elemrev_v8hi_internal"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
        (match_operand:V8HI 1 "memory_operand" "Z")
        (parallel [(const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V8HImode) && !BYTES_BIG_ENDIAN && TARGET_P9_VECTOR"
  [(set_attr "type" "vecload")])
(define_expand "vsx_ld_elemrev_v16qi"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (match_operand:V16QI 1 "memory_operand" "Z")
        (parallel [(const_int 15) (const_int 14)
                   (const_int 13) (const_int 12)
                   (const_int 11) (const_int 10)
                   (const_int 9) (const_int 8)
                   (const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V16QImode) && !BYTES_BIG_ENDIAN"
  if (!TARGET_P9_VECTOR)
      rtx tmp = gen_reg_rtx (V4SImode);
      rtx subreg, subreg2, perm[16], pcv;
      /* 3 is leftmost element in register */
      unsigned int reorder[16] = {12,13,14,15,8,9,10,11,4,5,6,7,0,1,2,3};

      subreg = simplify_gen_subreg (V4SImode, operands[1], V16QImode, 0);
      emit_insn (gen_vsx_ld_elemrev_v4si (tmp, subreg));
      subreg2 = simplify_gen_subreg (V16QImode, tmp, V4SImode, 0);

      for (i = 0; i < 16; ++i)
        perm[i] = GEN_INT (reorder[i]);

      pcv = force_reg (V16QImode,
                       gen_rtx_CONST_VECTOR (V16QImode,
                                             gen_rtvec_v (16, perm)));
      emit_insn (gen_altivec_vperm_v16qi_direct (operands[0], subreg2,
(define_insn "vsx_ld_elemrev_v16qi_internal"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (match_operand:V16QI 1 "memory_operand" "Z")
        (parallel [(const_int 15) (const_int 14)
                   (const_int 13) (const_int 12)
                   (const_int 11) (const_int 10)
                   (const_int 9) (const_int 8)
                   (const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V16QImode) && !BYTES_BIG_ENDIAN && TARGET_P9_VECTOR"
  [(set_attr "type" "vecload")])
(define_insn "vsx_st_elemrev_v1ti"
  [(set (match_operand:V1TI 0 "memory_operand" "=Z")
        (match_operand:V1TI 1 "vsx_register_operand" "+wa")
        (parallel [(const_int 0)])))
   (clobber (match_dup 1))]
  "VECTOR_MEM_VSX_P (V2DImode) && !BYTES_BIG_ENDIAN"
  return "xxpermdi %x1,%x1,%x1,2\;stxvd2x %x1,%y0";
  [(set_attr "type" "vecstore")])

(define_insn "vsx_st_elemrev_v2df"
  [(set (match_operand:V2DF 0 "memory_operand" "=Z")
        (match_operand:V2DF 1 "vsx_register_operand" "wa")
        (parallel [(const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V2DFmode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecstore")])

(define_insn "vsx_st_elemrev_v2di"
  [(set (match_operand:V2DI 0 "memory_operand" "=Z")
        (match_operand:V2DI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V2DImode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecstore")])

(define_insn "vsx_st_elemrev_v4sf"
  [(set (match_operand:V4SF 0 "memory_operand" "=Z")
        (match_operand:V4SF 1 "vsx_register_operand" "wa")
        (parallel [(const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V4SFmode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecstore")])

(define_insn "vsx_st_elemrev_v4si"
  [(set (match_operand:V4SI 0 "memory_operand" "=Z")
        (match_operand:V4SI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V4SImode) && !BYTES_BIG_ENDIAN"
  [(set_attr "type" "vecstore")])
(define_expand "vsx_st_elemrev_v8hi"
  [(set (match_operand:V8HI 0 "memory_operand" "=Z")
        (match_operand:V8HI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V8HImode) && !BYTES_BIG_ENDIAN"
  if (!TARGET_P9_VECTOR)
      rtx mem_subreg, subreg, perm[16], pcv;
      rtx tmp = gen_reg_rtx (V8HImode);
      /* 2 is leftmost element in register */
      unsigned int reorder[16] = {13,12,15,14,9,8,11,10,5,4,7,6,1,0,3,2};

      for (i = 0; i < 16; ++i)
        perm[i] = GEN_INT (reorder[i]);

      pcv = force_reg (V16QImode,
                       gen_rtx_CONST_VECTOR (V16QImode,
                                             gen_rtvec_v (16, perm)));
      emit_insn (gen_altivec_vperm_v8hi_direct (tmp, operands[1],
      subreg = simplify_gen_subreg (V4SImode, tmp, V8HImode, 0);
      mem_subreg = simplify_gen_subreg (V4SImode, operands[0], V8HImode, 0);
      emit_insn (gen_vsx_st_elemrev_v4si (mem_subreg, subreg));
(define_insn "*vsx_st_elemrev_v2di_internal"
  [(set (match_operand:V2DI 0 "memory_operand" "=Z")
        (match_operand:V2DI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V2DImode) && !BYTES_BIG_ENDIAN && TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")])

(define_insn "*vsx_st_elemrev_v8hi_internal"
  [(set (match_operand:V8HI 0 "memory_operand" "=Z")
        (match_operand:V8HI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V8HImode) && !BYTES_BIG_ENDIAN && TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")])
(define_expand "vsx_st_elemrev_v16qi"
  [(set (match_operand:V16QI 0 "memory_operand" "=Z")
        (match_operand:V16QI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 15) (const_int 14)
                   (const_int 13) (const_int 12)
                   (const_int 11) (const_int 10)
                   (const_int 9) (const_int 8)
                   (const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V16QImode) && !BYTES_BIG_ENDIAN"
  if (!TARGET_P9_VECTOR)
      rtx mem_subreg, subreg, perm[16], pcv;
      rtx tmp = gen_reg_rtx (V16QImode);
      /* 3 is leftmost element in register */
      unsigned int reorder[16] = {12,13,14,15,8,9,10,11,4,5,6,7,0,1,2,3};

      for (i = 0; i < 16; ++i)
        perm[i] = GEN_INT (reorder[i]);

      pcv = force_reg (V16QImode,
                       gen_rtx_CONST_VECTOR (V16QImode,
                                             gen_rtvec_v (16, perm)));
      emit_insn (gen_altivec_vperm_v16qi_direct (tmp, operands[1],
      subreg = simplify_gen_subreg (V4SImode, tmp, V16QImode, 0);
      mem_subreg = simplify_gen_subreg (V4SImode, operands[0], V16QImode, 0);
      emit_insn (gen_vsx_st_elemrev_v4si (mem_subreg, subreg));
(define_insn "*vsx_st_elemrev_v16qi_internal"
  [(set (match_operand:V16QI 0 "memory_operand" "=Z")
        (match_operand:V16QI 1 "vsx_register_operand" "wa")
        (parallel [(const_int 15) (const_int 14)
                   (const_int 13) (const_int 12)
                   (const_int 11) (const_int 10)
                   (const_int 9) (const_int 8)
                   (const_int 7) (const_int 6)
                   (const_int 5) (const_int 4)
                   (const_int 3) (const_int 2)
                   (const_int 1) (const_int 0)])))]
  "VECTOR_MEM_VSX_P (V16QImode) && !BYTES_BIG_ENDIAN && TARGET_P9_VECTOR"
  [(set_attr "type" "vecstore")])
;; VSX vector floating point arithmetic instructions.  The VSX scalar
;; instructions are now combined with the insn for the traditional floating
;; point unit.
(define_insn "*vsx_add<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (plus:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                    (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvadd<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])
(define_insn "*vsx_sub<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (minus:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                     (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvsub<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])
(define_insn "*vsx_mul<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (mult:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                    (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvmul<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

;; Emulate vector with scalar for vec_mul in V2DImode
(define_insn_and_split "vsx_mul_v2di"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
        (unspec:V2DI [(match_operand:V2DI 1 "vsx_register_operand" "wa")
                      (match_operand:V2DI 2 "vsx_register_operand" "wa")]
  "VECTOR_MEM_VSX_P (V2DImode)"
  "VECTOR_MEM_VSX_P (V2DImode) && !reload_completed"
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx op2 = operands[2];

      emit_insn (gen_mulv2di3 (op0, op1, op2));

  rtx op3 = gen_reg_rtx (DImode);
  rtx op4 = gen_reg_rtx (DImode);
  rtx op5 = gen_reg_rtx (DImode);
  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (0)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (0)));
  if (TARGET_POWERPC64)
    emit_insn (gen_muldi3 (op5, op3, op4));
      rtx ret = expand_mult (DImode, op3, op4, NULL, 0, false);
      emit_move_insn (op5, ret);
  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (1)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (1)));
  if (TARGET_POWERPC64)
    emit_insn (gen_muldi3 (op3, op3, op4));
      rtx ret = expand_mult (DImode, op3, op4, NULL, 0, false);
      emit_move_insn (op3, ret);
  emit_insn (gen_vsx_concat_v2di (op0, op5, op3));
  [(set_attr "type" "mul")])
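
;; Usage sketch (C): vec_mul on vector long long reaches the pattern above;
;; before Power10's vector doubleword multiply it splits into two scalar
;; 64-bit multiplies as shown:
;;
;;   #include <altivec.h>
;;   vector long long mul2 (vector long long a, vector long long b)
;;   {
;;     return vec_mul (a, b);
;;   }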
(define_insn "*vsx_div<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (div:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                   (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvdiv<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_div>")])

;; Emulate vector with scalar for vec_div in V2DImode
(define_insn_and_split "vsx_div_v2di"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
        (unspec:V2DI [(match_operand:V2DI 1 "vsx_register_operand" "wa")
                      (match_operand:V2DI 2 "vsx_register_operand" "wa")]
  "VECTOR_MEM_VSX_P (V2DImode)"
  "VECTOR_MEM_VSX_P (V2DImode) && !reload_completed"
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx op2 = operands[2];
  rtx op3 = gen_reg_rtx (DImode);
  rtx op4 = gen_reg_rtx (DImode);
  rtx op5 = gen_reg_rtx (DImode);
  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (0)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (0)));
  if (TARGET_POWERPC64)
    emit_insn (gen_divdi3 (op5, op3, op4));
      rtx libfunc = optab_libfunc (sdiv_optab, DImode);
      rtx target = emit_library_call_value (libfunc,
                                            op5, LCT_NORMAL, DImode,
      emit_move_insn (op5, target);
  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (1)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (1)));
  if (TARGET_POWERPC64)
    emit_insn (gen_divdi3 (op3, op3, op4));
      rtx libfunc = optab_libfunc (sdiv_optab, DImode);
      rtx target = emit_library_call_value (libfunc,
                                            op3, LCT_NORMAL, DImode,
      emit_move_insn (op3, target);
  emit_insn (gen_vsx_concat_v2di (op0, op5, op3));
  [(set_attr "type" "div")])
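
;; Usage sketch (C): likewise vec_div on vector long long splits into two
;; scalar divides (or __divdi3 libcalls when !TARGET_POWERPC64):
;;
;;   #include <altivec.h>
;;   vector long long div2 (vector long long a, vector long long b)
;;   {
;;     return vec_div (a, b);
;;   }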
(define_insn_and_split "vsx_udiv_v2di"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
        (unspec:V2DI [(match_operand:V2DI 1 "vsx_register_operand" "wa")
                      (match_operand:V2DI 2 "vsx_register_operand" "wa")]
  "VECTOR_MEM_VSX_P (V2DImode)"
  "VECTOR_MEM_VSX_P (V2DImode) && !reload_completed"
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx op2 = operands[2];

      emit_insn (gen_udivv2di3 (op0, op1, op2));

  rtx op3 = gen_reg_rtx (DImode);
  rtx op4 = gen_reg_rtx (DImode);
  rtx op5 = gen_reg_rtx (DImode);

  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (0)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (0)));

  if (TARGET_POWERPC64)
    emit_insn (gen_udivdi3 (op5, op3, op4));
      rtx libfunc = optab_libfunc (udiv_optab, DImode);
      rtx target = emit_library_call_value (libfunc,
                                            op5, LCT_NORMAL, DImode,
      emit_move_insn (op5, target);

  emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (1)));
  emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (1)));

  if (TARGET_POWERPC64)
    emit_insn (gen_udivdi3 (op3, op3, op4));
      rtx libfunc = optab_libfunc (udiv_optab, DImode);
      rtx target = emit_library_call_value (libfunc,
                                            op3, LCT_NORMAL, DImode,
      emit_move_insn (op3, target);

  emit_insn (gen_vsx_concat_v2di (op0, op5, op3));
  [(set_attr "type" "div")])
;; Vector integer signed/unsigned divide
(define_insn "vsx_div_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
  [(set_attr "type" "div")])

(define_insn "vsx_udiv_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
  [(set_attr "type" "div")])

(define_insn "vsx_dives_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
                     UNSPEC_VSX_DIVESQ))]
  [(set_attr "type" "div")])

(define_insn "vsx_diveu_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
                     UNSPEC_VSX_DIVEUQ))]
  [(set_attr "type" "div")])

(define_insn "vsx_mods_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
  [(set_attr "type" "div")])

(define_insn "vsx_modu_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (unspec:V1TI [(match_operand:V1TI 1 "vsx_register_operand" "v")
                      (match_operand:V1TI 2 "vsx_register_operand" "v")]
  [(set_attr "type" "div")])
;; *tdiv* instruction returning the FG flag
(define_expand "vsx_tdiv<mode>3_fg"
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand")
                      (match_operand:VSX_B 2 "vsx_register_operand")]
   (set (match_operand:SI 0 "gpc_reg_operand")
        (gt:SI (match_dup 3)
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  operands[3] = gen_reg_rtx (CCFPmode);

;; *tdiv* instruction returning the FE flag
(define_expand "vsx_tdiv<mode>3_fe"
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand")
                      (match_operand:VSX_B 2 "vsx_register_operand")]
   (set (match_operand:SI 0 "gpc_reg_operand")
        (eq:SI (match_dup 3)
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  operands[3] = gen_reg_rtx (CCFPmode);

(define_insn "*vsx_tdiv<mode>3_internal"
  [(set (match_operand:CCFP 0 "cc_reg_operand" "=x")
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand" "wa")
                      (match_operand:VSX_B 2 "vsx_register_operand" "wa")]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>tdiv<sd>p %0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])
(define_insn "vsx_fre<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (unspec:VSX_F [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_neg<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (neg:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvneg<sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_abs<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (abs:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvabs<sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_nabs<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
          (match_operand:VSX_F 1 "vsx_register_operand" "wa"))))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvnabs<sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_smax<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (smax:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                    (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvmax<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_smin<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (smin:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                    (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvmin<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_sqrt<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (sqrt:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvsqrt<sd>p %x0,%x1"
  [(set_attr "type" "<sd>sqrt")])

(define_insn "*vsx_rsqrte<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (unspec:VSX_F [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvrsqrte<sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])
;; *tsqrt* returning the FG flag
(define_expand "vsx_tsqrt<mode>2_fg"
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand")]
   (set (match_operand:SI 0 "gpc_reg_operand")
        (gt:SI (match_dup 2)
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  operands[2] = gen_reg_rtx (CCFPmode);

;; *tsqrt* returning the FE flag
(define_expand "vsx_tsqrt<mode>2_fe"
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand")]
   (set (match_operand:SI 0 "gpc_reg_operand")
        (eq:SI (match_dup 2)
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  operands[2] = gen_reg_rtx (CCFPmode);

(define_insn "*vsx_tsqrt<mode>2_internal"
  [(set (match_operand:CCFP 0 "cc_reg_operand" "=x")
        (unspec:CCFP [(match_operand:VSX_B 1 "vsx_register_operand" "wa")]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>tsqrt<sd>p %0,%x1"
  [(set_attr "type" "<VStype_simple>")])
;; Fused vector multiply/add instructions.  Do not generate the AltiVec
;; versions of fma (vmaddfp and vnmsubfp).  These instructions allow the
;; target to be a separate register from the 3 inputs, which can possibly
;; save an extra move being generated (assuming all registers are AltiVec
;; registers).  However, vmaddfp and vnmsubfp can have different behaviors
;; than the VSX instructions in some corner cases due to VSCR[NJ] being set
;; or if the addend is +0.0.
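
;; For example (C sketch, with FP contraction enabled), both alternatives of
;; the patterns below come from code like:
;;
;;   vector float f (vector float a, vector float b, vector float c)
;;   {
;;     return a * b + c;	/* xvmaddasp or xvmaddmsp, not vmaddfp */
;;   }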

(define_insn "*vsx_fmav4sf4"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa,wa")
        (fma:V4SF
          (match_operand:V4SF 1 "vsx_register_operand" "%wa,wa")
          (match_operand:V4SF 2 "vsx_register_operand" "wa,0")
          (match_operand:V4SF 3 "vsx_register_operand" "0,wa")))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "@
   xvmaddasp %x0,%x1,%x2
   xvmaddmsp %x0,%x1,%x3"
  [(set_attr "type" "vecfloat")])

(define_insn "*vsx_fmav2df4"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa,wa")
        (fma:V2DF
          (match_operand:V2DF 1 "vsx_register_operand" "%wa,wa")
          (match_operand:V2DF 2 "vsx_register_operand" "wa,0")
          (match_operand:V2DF 3 "vsx_register_operand" "0,wa")))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "@
   xvmaddadp %x0,%x1,%x2
   xvmaddmdp %x0,%x1,%x3"
  [(set_attr "type" "vecdouble")])
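
;; Added commentary (not in the original file; names and flags are
;; illustrative): a hedged C sketch of source that normally maps onto the
;; fma patterns above when compiled with VSX enabled (e.g. -O2 -mvsx):
;;
;;   #include <altivec.h>
;;   vector float
;;   fma_v4sf (vector float a, vector float b, vector float c)
;;   {
;;     return vec_madd (a, b, c);   /* typically xvmaddasp/xvmaddmsp  */
;;   }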

(define_insn "*vsx_fms<mode>4"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa,wa")
        (fma:VSX_F
          (match_operand:VSX_F 1 "vsx_register_operand" "%wa,wa")
          (match_operand:VSX_F 2 "vsx_register_operand" "wa,0")
          (neg:VSX_F
            (match_operand:VSX_F 3 "vsx_register_operand" "0,wa"))))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "@
   xvmsuba<sd>p %x0,%x1,%x2
   xvmsubm<sd>p %x0,%x1,%x3"
  [(set_attr "type" "<VStype_mul>")])

(define_insn "*vsx_nfma<mode>4"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa,wa")
        (neg:VSX_F
         (fma:VSX_F
          (match_operand:VSX_F 1 "vsx_register_operand" "wa,wa")
          (match_operand:VSX_F 2 "vsx_register_operand" "wa,0")
          (match_operand:VSX_F 3 "vsx_register_operand" "0,wa"))))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "@
   xvnmadda<sd>p %x0,%x1,%x2
   xvnmaddm<sd>p %x0,%x1,%x3"
  [(set_attr "type" "<VStype_mul>")])

(define_insn "*vsx_nfmsv4sf4"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa,wa")
        (neg:V4SF
         (fma:V4SF
           (match_operand:V4SF 1 "vsx_register_operand" "%wa,wa")
           (match_operand:V4SF 2 "vsx_register_operand" "wa,0")
           (neg:V4SF
             (match_operand:V4SF 3 "vsx_register_operand" "0,wa")))))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "@
   xvnmsubasp %x0,%x1,%x2
   xvnmsubmsp %x0,%x1,%x3"
  [(set_attr "type" "vecfloat")])

(define_insn "*vsx_nfmsv2df4"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa,wa")
        (neg:V2DF
         (fma:V2DF
           (match_operand:V2DF 1 "vsx_register_operand" "%wa,wa")
           (match_operand:V2DF 2 "vsx_register_operand" "wa,0")
           (neg:V2DF
             (match_operand:V2DF 3 "vsx_register_operand" "0,wa")))))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "@
   xvnmsubadp %x0,%x1,%x2
   xvnmsubmdp %x0,%x1,%x3"
  [(set_attr "type" "vecdouble")])

;; Vector conditional expressions (no scalar version for these instructions)
(define_insn "vsx_eq<mode>"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (eq:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                  (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpeq<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_gt<mode>"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (gt:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                  (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpgt<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_ge<mode>"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (ge:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                  (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpge<sd>p %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])
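
;; Added commentary (illustrative, not from the original): each compare
;; yields a per-element all-ones/all-zeros mask, e.g. in C:
;;
;;   #include <altivec.h>
;;   vector bool long long
;;   gt_v2df (vector double a, vector double b)
;;   {
;;     return vec_cmpgt (a, b);   /* typically xvcmpgtdp  */
;;   }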

;; Compare vectors producing a vector result and a predicate, setting CR6 to
;; indicate a combined status
(define_insn "*vsx_eq_<mode>_p"
  [(set (reg:CC CR6_REGNO)
        (unspec:CC
         [(eq:CC (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                 (match_operand:VSX_F 2 "vsx_register_operand" "wa"))]
         UNSPEC_PREDICATE))
   (set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (eq:VSX_F (match_dup 1)
                  (match_dup 2)))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpeq<sd>p. %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_gt_<mode>_p"
  [(set (reg:CC CR6_REGNO)
        (unspec:CC
         [(gt:CC (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                 (match_operand:VSX_F 2 "vsx_register_operand" "wa"))]
         UNSPEC_PREDICATE))
   (set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (gt:VSX_F (match_dup 1)
                  (match_dup 2)))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpgt<sd>p. %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])
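
;; Added commentary (illustrative): the "." forms also set CR6, which is what
;; the vec_all_*/vec_any_* predicates read, e.g. in C:
;;
;;   #include <altivec.h>
;;   int all_gt (vector double a, vector double b)
;;   {
;;     return vec_all_gt (a, b);   /* typically xvcmpgtdp. plus a CR6 test  */
;;   }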

;; Set the CR field BF to indicate if the lowest bit (bit 7) of every byte
;; element in VSR[XB] is equal to 1 (ALL_TRUE) or equal to 0 (ALL_FALSE).
(define_insn "*xvtlsbb_internal"
  [(set (match_operand:CC 0 "cc_reg_operand" "=y")
        (unspec:CC [(match_operand:V16QI 1 "vsx_register_operand" "wa")]
                   UNSPEC_XVTLSBB))]
  "TARGET_POWER10"
  "xvtlsbb %0,%x1"
  [(set_attr "type" "logical")])

;; Vector Test Least Significant Bit by Byte
;; for the implementation of the builtins
;; __builtin_vec_test_lsbb_all_ones
;; int vec_test_lsbb_all_ones (vector unsigned char);
;; and
;; __builtin_vec_test_lsbb_all_zeros
;; int vec_test_lsbb_all_zeros (vector unsigned char);
(define_expand "xvtlsbbo"
  [(set (match_dup 2)
        (unspec:CC [(match_operand:V16QI 1 "vsx_register_operand" "v")]
                   UNSPEC_XVTLSBB))
   (set (match_operand:SI 0 "gpc_reg_operand" "=r")
        (lt:SI (match_dup 2) (const_int 0)))]
  "TARGET_POWER10"
{
  operands[2] = gen_reg_rtx (CCmode);
})

(define_expand "xvtlsbbz"
  [(set (match_dup 2)
        (unspec:CC [(match_operand:V16QI 1 "vsx_register_operand" "v")]
                   UNSPEC_XVTLSBB))
   (set (match_operand:SI 0 "gpc_reg_operand" "=r")
        (eq:SI (match_dup 2) (const_int 0)))]
  "TARGET_POWER10"
{
  operands[2] = gen_reg_rtx (CCmode);
})
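
;; Added commentary (illustrative; assumes a Power10 target, -mcpu=power10):
;;
;;   #include <altivec.h>
;;   int lsbb_ones (vector unsigned char v)
;;   {
;;     return vec_test_lsbb_all_ones (v);   /* xvtlsbb + CR field test  */
;;   }
;;   int lsbb_zeros (vector unsigned char v)
;;   {
;;     return vec_test_lsbb_all_zeros (v);
;;   }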

(define_insn "*vsx_ge_<mode>_p"
  [(set (reg:CC CR6_REGNO)
        (unspec:CC
         [(ge:CC (match_operand:VSX_F 1 "vsx_register_operand" "wa")
                 (match_operand:VSX_F 2 "vsx_register_operand" "wa"))]
         UNSPEC_PREDICATE))
   (set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (ge:VSX_F (match_dup 1)
                  (match_dup 2)))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcmpge<sd>p. %x0,%x1,%x2"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_copysign<mode>3"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (copysign:VSX_F
         (match_operand:VSX_F 1 "vsx_register_operand" "wa")
         (match_operand:VSX_F 2 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcpsgn<sd>p %x0,%x2,%x1"
  [(set_attr "type" "<VStype_simple>")])
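
;; Added commentary (illustrative): per-element semantics of the copysign
;; pattern, written as a scalar C loop; the result takes its magnitude from
;; operand 1 and its sign from operand 2, hence the swapped %x2,%x1 above:
;;
;;   #include <math.h>
;;   void copysign_v2df (double r[2], const double mag[2], const double sgn[2])
;;   {
;;     for (int i = 0; i < 2; i++)
;;       r[i] = copysign (mag[i], sgn[i]);
;;   }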

;; For the conversions, limit the register class for the integer value to be
;; the fprs because we don't want to add the altivec registers to movdi/movsi.
;; For the unsigned tests, there isn't a generic double -> unsigned conversion
;; in rs6000.md, so don't test VECTOR_UNIT_VSX_P, just test against VSX.
;; Don't use vsx_register_operand here, use gpc_reg_operand to match rs6000.md
;; in allowing virtual registers.
(define_insn "vsx_float<VSi><mode>2"
  [(set (match_operand:VSX_F 0 "gpc_reg_operand" "=wa")
        (float:VSX_F (match_operand:<VSI> 1 "gpc_reg_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcvsx<VSc><sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_floatuns<VSi><mode>2"
  [(set (match_operand:VSX_F 0 "gpc_reg_operand" "=wa")
        (unsigned_float:VSX_F (match_operand:<VSI> 1 "gpc_reg_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvcvux<VSc><sd>p %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_fix_trunc<mode><VSi>2"
  [(set (match_operand:<VSI> 0 "gpc_reg_operand" "=wa")
        (fix:<VSI> (match_operand:VSX_F 1 "gpc_reg_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>cv<sd>psx<VSc>s %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_fixuns_trunc<mode><VSi>2"
  [(set (match_operand:<VSI> 0 "gpc_reg_operand" "=wa")
        (unsigned_fix:<VSI> (match_operand:VSX_F 1 "gpc_reg_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>cv<sd>pux<VSc>s %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])
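
;; Added commentary (illustrative): C intrinsics that normally map onto the
;; V4SF/V4SI forms of the conversions above:
;;
;;   #include <altivec.h>
;;   vector float to_f (vector signed int v) { return vec_float (v); }
;;   vector signed int to_i (vector float v) { return vec_signed (v); }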

;; Math rounding functions
(define_insn "vsx_x<VSv>r<sd>pi"
  [(set (match_operand:VSX_B 0 "vsx_register_operand" "=wa")
        (unspec:VSX_B [(match_operand:VSX_B 1 "vsx_register_operand" "wa")]
                      UNSPEC_VSX_ROUND_I))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>r<sd>pi %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_x<VSv>r<sd>pic"
  [(set (match_operand:VSX_B 0 "vsx_register_operand" "=wa")
        (unspec:VSX_B [(match_operand:VSX_B 1 "vsx_register_operand" "wa")]
                      UNSPEC_VSX_ROUND_IC))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>r<sd>pic %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_btrunc<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (fix:VSX_F (match_operand:VSX_F 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvr<sd>piz %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "*vsx_b2trunc<mode>2"
  [(set (match_operand:VSX_B 0 "vsx_register_operand" "=wa")
        (unspec:VSX_B [(match_operand:VSX_B 1 "vsx_register_operand" "wa")]
                      UNSPEC_FRIZ))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "x<VSv>r<sd>piz %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_floor<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (unspec:VSX_F [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
                      UNSPEC_FRIM))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvr<sd>pim %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])

(define_insn "vsx_ceil<mode>2"
  [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
        (unspec:VSX_F [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
                      UNSPEC_FRIP))]
  "VECTOR_UNIT_VSX_P (<MODE>mode)"
  "xvr<sd>pip %x0,%x1"
  [(set_attr "type" "<VStype_simple>")])
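
;; Added commentary (illustrative): the rounding intrinsics these patterns
;; implement for V2DF:
;;
;;   #include <altivec.h>
;;   vector double tz (vector double v) { return vec_trunc (v); }  /* xvrdpiz */
;;   vector double fl (vector double v) { return vec_floor (v); }  /* xvrdpim */
;;   vector double cl (vector double v) { return vec_ceil (v); }   /* xvrdpip */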

;; VSX convert to/from double vector

;; Convert between single and double precision
;; Don't use xscvspdp and xscvdpsp for scalar conversions, since the normal
;; scalar single precision instructions internally use the double format.
;; Prefer the altivec registers, since we likely will need to do a vperm
(define_insn "vsx_xscvdpsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=f,?wa")
        (unspec:V4SF [(match_operand:DF 1 "vsx_register_operand" "f,wa")]
                     UNSPEC_VSX_CVSPDP))]
  "VECTOR_UNIT_VSX_P (DFmode)"
  "xscvdpsp %x0,%x1"
  [(set_attr "type" "fp")])

(define_insn "vsx_xvcvspdp_be"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=v,?wa")
        (float_extend:V2DF
         (vec_select:V2SF (match_operand:V4SF 1 "vsx_register_operand" "wa,wa")
                          (parallel [(const_int 0) (const_int 2)]))))]
  "VECTOR_UNIT_VSX_P (V4SFmode) && BYTES_BIG_ENDIAN"
  "xvcvspdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvspdp_le"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=v,?wa")
        (float_extend:V2DF
         (vec_select:V2SF (match_operand:V4SF 1 "vsx_register_operand" "wa,wa")
                          (parallel [(const_int 1) (const_int 3)]))))]
  "VECTOR_UNIT_VSX_P (V4SFmode) && !BYTES_BIG_ENDIAN"
  "xvcvspdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_expand "vsx_xvcvspdp"
  [(match_operand:V2DF 0 "vsx_register_operand")
   (match_operand:V4SF 1 "vsx_register_operand")]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_vsx_xvcvspdp_be (operands[0], operands[1]));
  else
    emit_insn (gen_vsx_xvcvspdp_le (operands[0], operands[1]));
  DONE;
})

(define_insn "vsx_xvcvdpsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa,?wa")
        (unspec:V4SF [(match_operand:V2DF 1 "vsx_register_operand" "v,wa")]
                     UNSPEC_VSX_CVSPDP))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvdpsp %x0,%x1"
  [(set_attr "type" "vecdouble")])

;; xscvspdp, represent the scalar SF type as V4SF
(define_insn "vsx_xscvspdp"
  [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
        (unspec:DF [(match_operand:V4SF 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVSPDP))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "xscvspdp %x0,%x1"
  [(set_attr "type" "fp")])

;; Same as vsx_xscvspdp, but use SF as the type
(define_insn "vsx_xscvspdp_scalar2"
  [(set (match_operand:SF 0 "vsx_register_operand" "=wa")
        (unspec:SF [(match_operand:V4SF 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVSPDP))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "xscvspdp %x0,%x1"
  [(set_attr "type" "fp")])

;; Generate xvcvhpsp instruction
(define_insn "vsx_xvcvhpsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:V16QI 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVHPSP))]
  "TARGET_P9_VECTOR"
  "xvcvhpsp %x0,%x1"
  [(set_attr "type" "vecfloat")])

;; Generate xvcvsphp
(define_insn "vsx_xvcvsphp"
  [(set (match_operand:V4SI 0 "register_operand" "=wa")
        (unspec:V4SI [(match_operand:V4SF 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_XVCVSPHP))]
  "TARGET_P9_VECTOR"
  "xvcvsphp %x0,%x1"
  [(set_attr "type" "vecfloat")])

;; xscvdpsp used for splat'ing a scalar to V4SF, knowing that the internal SF
;; format of scalars is actually DF.
(define_insn "vsx_xscvdpsp_scalar"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:SF 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVSPDP))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "xscvdpsp %x0,%x1"
  [(set_attr "type" "fp")])

;; ISA 2.07 xscvdpspn/xscvspdpn that does not raise an error on signalling NaNs
(define_insn "vsx_xscvdpspn"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:DF 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVDPSPN))]
  "TARGET_XSCVDPSPN"
  "xscvdpspn %x0,%x1"
  [(set_attr "type" "fp")])

(define_insn "vsx_xscvspdpn"
  [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
        (unspec:DF [(match_operand:V4SF 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVSPDPN))]
  "TARGET_XSCVSPDPN"
  "xscvspdpn %x0,%x1"
  [(set_attr "type" "fp")])

(define_insn "vsx_xscvdpspn_scalar"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:SF 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVDPSPN))]
  "TARGET_XSCVDPSPN"
  "xscvdpspn %x0,%x1"
  [(set_attr "type" "fp")])

;; Used by direct move to move a SFmode value from GPR to VSX register
(define_insn "vsx_xscvspdpn_directmove"
  [(set (match_operand:SF 0 "vsx_register_operand" "=wa")
        (unspec:SF [(match_operand:SF 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVSPDPN))]
  "TARGET_XSCVSPDPN"
  "xscvspdpn %x0,%x1"
  [(set_attr "type" "fp")])

;; Convert and scale (used by vec_ctf, vec_cts, vec_ctu for double/long long)

(define_insn "vsx_xvcv<su>xwsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (any_float:V4SF (match_operand:V4SI 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "xvcv<su>xwsp %x0,%x1"
  [(set_attr "type" "vecfloat")])

(define_insn "vsx_xvcv<su>xddp"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa")
        (any_float:V2DF (match_operand:V2DI 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcv<su>xddp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvsp<su>xws"
  [(set (match_operand:V4SI 0 "vsx_register_operand" "=wa")
        (any_fix:V4SI (match_operand:V4SF 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "xvcvsp<su>xws %x0,%x1"
  [(set_attr "type" "vecfloat")])

(define_insn "vsx_xvcvdp<su>xds"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
        (any_fix:V2DI (match_operand:V2DF 1 "vsx_register_operand" "wa")))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvdp<su>xds %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_expand "vsx_xvcvsxddp_scale"
  [(match_operand:V2DF 0 "vsx_register_operand")
   (match_operand:V2DI 1 "vsx_register_operand")
   (match_operand:QI 2 "immediate_operand")]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  int scale = INTVAL (operands[2]);
  emit_insn (gen_vsx_xvcvsxddp (op0, op1));
  if (scale != 0)
    rs6000_scale_v2df (op0, op0, -scale);
  DONE;
})

(define_expand "vsx_xvcvuxddp_scale"
  [(match_operand:V2DF 0 "vsx_register_operand")
   (match_operand:V2DI 1 "vsx_register_operand")
   (match_operand:QI 2 "immediate_operand")]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  int scale = INTVAL (operands[2]);
  emit_insn (gen_vsx_xvcvuxddp (op0, op1));
  if (scale != 0)
    rs6000_scale_v2df (op0, op0, -scale);
  DONE;
})

(define_expand "vsx_xvcvdpsxds_scale"
  [(match_operand:V2DI 0 "vsx_register_operand")
   (match_operand:V2DF 1 "vsx_register_operand")
   (match_operand:QI 2 "immediate_operand")]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx tmp;
  int scale = INTVAL (operands[2]);
  if (scale == 0)
    tmp = op1;
  else
    {
      tmp = gen_reg_rtx (V2DFmode);
      rs6000_scale_v2df (tmp, op1, scale);
    }
  emit_insn (gen_vsx_xvcvdpsxds (op0, tmp));
  DONE;
})

;; convert vector of 64-bit floating point numbers to vector of
;; 64-bit unsigned integer
(define_expand "vsx_xvcvdpuxds_scale"
  [(match_operand:V2DI 0 "vsx_register_operand")
   (match_operand:V2DF 1 "vsx_register_operand")
   (match_operand:QI 2 "immediate_operand")]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx tmp;
  int scale = INTVAL (operands[2]);
  if (scale == 0)
    tmp = op1;
  else
    {
      tmp = gen_reg_rtx (V2DFmode);
      rs6000_scale_v2df (tmp, op1, scale);
    }
  emit_insn (gen_vsx_xvcvdpuxds (op0, tmp));
  DONE;
})
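
;; Added commentary (illustrative): vec_ctf/vec_cts with a nonzero scale use
;; the *_scale expanders above; the scale is a power of two applied around
;; the conversion:
;;
;;   #include <altivec.h>
;;   vector double ctf (vector signed long long v)
;;   {
;;     return vec_ctf (v, 3);   /* (double) v[i] * 2^-3  */
;;   }
;;   vector signed long long cts (vector double v)
;;   {
;;     return vec_cts (v, 3);   /* (long long) (v[i] * 2^3)  */
;;   }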

;; Convert from 64-bit to 32-bit types
;; Note, favor the Altivec registers since the usual use of these instructions
;; is in vector converts and we need to use the Altivec vperm instruction.

(define_insn "vsx_xvcvdpsxws"
  [(set (match_operand:V4SI 0 "vsx_register_operand" "=v,?wa")
        (unspec:V4SI [(match_operand:V2DF 1 "vsx_register_operand" "wa,wa")]
                     UNSPEC_VSX_CVDPSXWS))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvdpsxws %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvdpuxws"
  [(set (match_operand:V4SI 0 "vsx_register_operand" "=v,?wa")
        (unspec:V4SI [(match_operand:V2DF 1 "vsx_register_operand" "wa,wa")]
                     UNSPEC_VSX_CVDPUXWS))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvdpuxws %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvsxdsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:V2DI 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVSXDSP))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvsxdsp %x0,%x1"
  [(set_attr "type" "vecfloat")])

(define_insn "vsx_xvcvuxdsp"
  [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa")
        (unspec:V4SF [(match_operand:V2DI 1 "vsx_register_operand" "wa")]
                     UNSPEC_VSX_CVUXDSP))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
  "xvcvuxdsp %x0,%x1"
  [(set_attr "type" "vecdouble")])

;; Convert vector of 32-bit signed/unsigned integers to vector of
;; 64-bit floating point numbers.
(define_insn "vsx_xvcv<su>xwdp_be"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa")
        (any_float:V2DF
         (vec_select:V2SI (match_operand:V4SI 1 "vsx_register_operand" "wa")
                          (parallel [(const_int 0) (const_int 2)]))))]
  "VECTOR_UNIT_VSX_P (V2DFmode) && BYTES_BIG_ENDIAN"
  "xvcv<su>xwdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcv<su>xwdp_le"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa")
        (any_float:V2DF
         (vec_select:V2SI (match_operand:V4SI 1 "vsx_register_operand" "wa")
                          (parallel [(const_int 1) (const_int 3)]))))]
  "VECTOR_UNIT_VSX_P (V2DFmode) && !BYTES_BIG_ENDIAN"
  "xvcv<su>xwdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_expand "vsx_xvcv<su>xwdp"
  [(match_operand:V2DF 0 "vsx_register_operand")
   (match_operand:V4SI 1 "vsx_register_operand")
   (any_float:V2DF (pc))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_vsx_xvcv<su>xwdp_be (operands[0], operands[1]));
  else
    emit_insn (gen_vsx_xvcv<su>xwdp_le (operands[0], operands[1]));
  DONE;
})

(define_insn "vsx_xvcvsxwdp_df"
  [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
        (unspec:DF [(match_operand:V4SI 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVSXWDP))]
  "TARGET_VSX"
  "xvcvsxwdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvuxwdp_df"
  [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
        (unspec:DF [(match_operand:V4SI 1 "vsx_register_operand" "wa")]
                   UNSPEC_VSX_CVUXWDP))]
  "TARGET_VSX"
  "xvcvuxwdp %x0,%x1"
  [(set_attr "type" "vecdouble")])

;; Convert vector of 32-bit floating point numbers to vector of
;; 64-bit signed/unsigned integers.
(define_insn "vsx_xvcvsp<su>xds_be"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=v,?wa")
        (any_fix:V2DI
         (vec_select:V2SF (match_operand:V4SF 1 "vsx_register_operand" "wa,wa")
                          (parallel [(const_int 0) (const_int 2)]))))]
  "VECTOR_UNIT_VSX_P (V2DFmode) && BYTES_BIG_ENDIAN"
  "xvcvsp<su>xds %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_insn "vsx_xvcvsp<su>xds_le"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=v,?wa")
        (any_fix:V2DI
         (vec_select:V2SF (match_operand:V4SF 1 "vsx_register_operand" "wa,wa")
                          (parallel [(const_int 1) (const_int 3)]))))]
  "VECTOR_UNIT_VSX_P (V2DFmode) && !BYTES_BIG_ENDIAN"
  "xvcvsp<su>xds %x0,%x1"
  [(set_attr "type" "vecdouble")])

(define_expand "vsx_xvcvsp<su>xds"
  [(match_operand:V2DI 0 "vsx_register_operand")
   (match_operand:V4SF 1 "vsx_register_operand")
   (any_fix:V2DI (pc))]
  "VECTOR_UNIT_VSX_P (V2DFmode)"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_vsx_xvcvsp<su>xds_be (operands[0], operands[1]));
  else
    emit_insn (gen_vsx_xvcvsp<su>xds_le (operands[0], operands[1]));
  DONE;
})

;; Generate float2 double
;; convert two double to float
(define_expand "float2_v2df"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:V2DF 1 "register_operand" "wa"))
   (use (match_operand:V2DF 2 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  rtx rtx_src1, rtx_src2, rtx_dst;

  rtx_dst = operands[0];
  rtx_src1 = operands[1];
  rtx_src2 = operands[2];

  rs6000_generate_float2_double_code (rtx_dst, rtx_src1, rtx_src2);
  DONE;
})

;; Generate float2
;; convert two long long signed ints to float
(define_expand "float2_v2di"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:V2DI 1 "register_operand" "wa"))
   (use (match_operand:V2DI 2 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  rtx rtx_src1, rtx_src2, rtx_dst;

  rtx_dst = operands[0];
  rtx_src1 = operands[1];
  rtx_src2 = operands[2];

  rs6000_generate_float2_code (true, rtx_dst, rtx_src1, rtx_src2);
  DONE;
})

;; Generate uns_float2
;; convert two long long unsigned ints to float
(define_expand "uns_float2_v2di"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:V2DI 1 "register_operand" "wa"))
   (use (match_operand:V2DI 2 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  rtx rtx_src1, rtx_src2, rtx_dst;

  rtx_dst = operands[0];
  rtx_src1 = operands[1];
  rtx_src2 = operands[2];

  /* Pass false here: this is the unsigned variant; passing true would
     generate the signed conversion.  */
  rs6000_generate_float2_code (false, rtx_dst, rtx_src1, rtx_src2);
  DONE;
})
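
;; Added commentary (illustrative): the float2 expanders back the vec_float2
;; intrinsic, which packs two V2DF (or V2DI) inputs into one V4SF:
;;
;;   #include <altivec.h>
;;   vector float pack2 (vector double a, vector double b)
;;   {
;;     return vec_float2 (a, b);
;;   }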

;; Generate floate
;; convert double or long long signed to float
;; (Only even words are valid, BE numbering)
(define_expand "floate<mode>"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:VSX_D 1 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  if (BYTES_BIG_ENDIAN)
    {
      /* Shift left one word to put the even words in the correct
         location.  */
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (4);

      rtx_tmp = gen_reg_rtx (V4SFmode);
      emit_insn (gen_vsx_xvcv<VF_sxddp>sp (rtx_tmp, operands[1]));
      emit_insn (gen_altivec_vsldoi_v4sf (operands[0],
                                          rtx_tmp, rtx_tmp, rtx_val));
    }
  else
    emit_insn (gen_vsx_xvcv<VF_sxddp>sp (operands[0], operands[1]));

  DONE;
})

;; Generate uns_floate
;; convert long long unsigned to float
;; (Only even words are valid, BE numbering)
(define_expand "unsfloatev2di"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:V2DI 1 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  if (BYTES_BIG_ENDIAN)
    {
      /* Shift left one word to put the even words in the correct
         location.  */
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (4);

      rtx_tmp = gen_reg_rtx (V4SFmode);
      emit_insn (gen_vsx_xvcvuxdsp (rtx_tmp, operands[1]));
      emit_insn (gen_altivec_vsldoi_v4sf (operands[0],
                                          rtx_tmp, rtx_tmp, rtx_val));
    }
  else
    emit_insn (gen_vsx_xvcvuxdsp (operands[0], operands[1]));

  DONE;
})

;; Generate floato
;; convert double or long long signed to float
;; (Only odd words are valid, BE numbering)
(define_expand "floato<mode>"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:VSX_D 1 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_vsx_xvcv<VF_sxddp>sp (operands[0], operands[1]));
  else
    {
      /* Shift left one word to put the odd words in the correct
         location.  */
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (4);

      rtx_tmp = gen_reg_rtx (V4SFmode);
      emit_insn (gen_vsx_xvcv<VF_sxddp>sp (rtx_tmp, operands[1]));
      emit_insn (gen_altivec_vsldoi_v4sf (operands[0],
                                          rtx_tmp, rtx_tmp, rtx_val));
    }

  DONE;
})

;; Generate uns_floato
;; convert long long unsigned to float
;; (Only odd words are valid, BE numbering)
(define_expand "unsfloatov2di"
  [(use (match_operand:V4SF 0 "register_operand" "=wa"))
   (use (match_operand:V2DI 1 "register_operand" "wa"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_vsx_xvcvuxdsp (operands[0], operands[1]));
  else
    {
      /* Shift left one word to put the odd words in the correct
         location.  */
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (4);

      rtx_tmp = gen_reg_rtx (V4SFmode);
      emit_insn (gen_vsx_xvcvuxdsp (rtx_tmp, operands[1]));
      emit_insn (gen_altivec_vsldoi_v4sf (operands[0],
                                          rtx_tmp, rtx_tmp, rtx_val));
    }

  DONE;
})
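
;; Added commentary (illustrative; hedged): floate/floato back the
;; vec_floate/vec_floato intrinsics, which place the two converted values in
;; the even or odd word positions (BE numbering) of the V4SF result:
;;
;;   #include <altivec.h>
;;   vector float fe (vector double v) { return vec_floate (v); }
;;   vector float fo (vector double v) { return vec_floato (v); }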

;; Generate vsigned2
;; convert two double float vectors to a vector of single precision ints
(define_expand "vsigned2_v2df"
  [(match_operand:V4SI 0 "register_operand" "=wa")
   (unspec:V4SI [(match_operand:V2DF 1 "register_operand" "wa")
                 (match_operand:V2DF 2 "register_operand" "wa")]
                UNSPEC_VSX_VSIGNED2)]
  "TARGET_VSX"
{
  rtx rtx_src1, rtx_src2, rtx_dst;
  bool signed_convert = true;

  rtx_dst = operands[0];
  rtx_src1 = operands[1];
  rtx_src2 = operands[2];

  rs6000_generate_vsigned2_code (signed_convert, rtx_dst, rtx_src1, rtx_src2);
  DONE;
})

;; Generate vsignedo_v2df
;; signed double float to int convert odd word
(define_expand "vsignedo_v2df"
  [(set (match_operand:V4SI 0 "register_operand" "=wa")
        (match_operand:V2DF 1 "register_operand" "wa"))]
  "TARGET_VSX"
{
  if (BYTES_BIG_ENDIAN)
    {
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (12);
      rtx_tmp = gen_reg_rtx (V4SImode);

      emit_insn (gen_vsx_xvcvdpsxws (rtx_tmp, operands[1]));

      /* Big endian word numbering for words in operand is 0 1 2 3.
         Take (operand[1] operand[1]) and shift left one word:
         0 1 2 3    0 1 2 3  =>  1 2 3 0
         Words 1 and 3 are now where they need to be for the result.  */

      emit_insn (gen_altivec_vsldoi_v4si (operands[0], rtx_tmp,
                                          rtx_tmp, rtx_val));
    }
  else
    /* Little endian word numbering for operand is 3 2 1 0.
       Result words 3 and 1 are where they need to be.  */
    emit_insn (gen_vsx_xvcvdpsxws (operands[0], operands[1]));

  DONE;
}
  [(set_attr "type" "veccomplex")])

;; Generate vsignede_v2df
;; signed double float to int even word
(define_expand "vsignede_v2df"
  [(set (match_operand:V4SI 0 "register_operand" "=v")
        (match_operand:V2DF 1 "register_operand" "v"))]
  "TARGET_VSX"
{
  if (BYTES_BIG_ENDIAN)
    /* Big endian word numbering for words in operand is 0 1 2 3.
       Result words 0 and 2 are where they need to be.  */
    emit_insn (gen_vsx_xvcvdpsxws (operands[0], operands[1]));
  else
    {
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (12);
      rtx_tmp = gen_reg_rtx (V4SImode);

      emit_insn (gen_vsx_xvcvdpsxws (rtx_tmp, operands[1]));

      /* Little endian word numbering for operand is 3 2 1 0.
         Take (operand[1] operand[1]) and shift left three words:
         0 1 2 3    0 1 2 3  =>  3 0 1 2
         Words 0 and 2 are now where they need to be for the result.  */
      emit_insn (gen_altivec_vsldoi_v4si (operands[0], rtx_tmp,
                                          rtx_tmp, rtx_val));
    }
  DONE;
}
  [(set_attr "type" "veccomplex")])

;; Generate vunsigned2
;; convert two double float vectors to a vector of single precision
;; unsigned ints
(define_expand "vunsigned2_v2df"
  [(match_operand:V4SI 0 "register_operand" "=v")
   (unspec:V4SI [(match_operand:V2DF 1 "register_operand" "v")
                 (match_operand:V2DF 2 "register_operand" "v")]
                UNSPEC_VSX_VSIGNED2)]
  "TARGET_VSX"
{
  rtx rtx_src1, rtx_src2, rtx_dst;
  bool signed_convert = false;

  rtx_dst = operands[0];
  rtx_src1 = operands[1];
  rtx_src2 = operands[2];

  rs6000_generate_vsigned2_code (signed_convert, rtx_dst, rtx_src1, rtx_src2);
  DONE;
})

;; Generate vunsignedo_v2df
;; unsigned double float to int convert odd word
(define_expand "vunsignedo_v2df"
  [(set (match_operand:V4SI 0 "register_operand" "=v")
        (match_operand:V2DF 1 "register_operand" "v"))]
  "TARGET_VSX"
{
  if (BYTES_BIG_ENDIAN)
    {
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (12);
      rtx_tmp = gen_reg_rtx (V4SImode);

      emit_insn (gen_vsx_xvcvdpuxws (rtx_tmp, operands[1]));

      /* Big endian word numbering for words in operand is 0 1 2 3.
         Take (operand[1] operand[1]) and shift left one word:
         0 1 2 3    0 1 2 3  =>  1 2 3 0
         Words 1 and 3 are now where they need to be for the result.  */

      emit_insn (gen_altivec_vsldoi_v4si (operands[0], rtx_tmp,
                                          rtx_tmp, rtx_val));
    }
  else
    /* Little endian word numbering for operand is 3 2 1 0.
       Result words 3 and 1 are where they need to be.  */
    emit_insn (gen_vsx_xvcvdpuxws (operands[0], operands[1]));

  DONE;
}
  [(set_attr "type" "veccomplex")])

;; Generate vunsignede_v2df
;; unsigned double float to int even word
(define_expand "vunsignede_v2df"
  [(set (match_operand:V4SI 0 "register_operand" "=v")
        (match_operand:V2DF 1 "register_operand" "v"))]
  "TARGET_VSX"
{
  if (BYTES_BIG_ENDIAN)
    /* Big endian word numbering for words in operand is 0 1 2 3.
       Result words 0 and 2 are where they need to be.  */
    emit_insn (gen_vsx_xvcvdpuxws (operands[0], operands[1]));
  else
    {
      rtx rtx_tmp;
      rtx rtx_val = GEN_INT (12);
      rtx_tmp = gen_reg_rtx (V4SImode);

      emit_insn (gen_vsx_xvcvdpuxws (rtx_tmp, operands[1]));

      /* Little endian word numbering for operand is 3 2 1 0.
         Take (operand[1] operand[1]) and shift left three words:
         0 1 2 3    0 1 2 3  =>  3 0 1 2
         Words 0 and 2 are now where they need to be for the result.  */
      emit_insn (gen_altivec_vsldoi_v4si (operands[0], rtx_tmp,
                                          rtx_tmp, rtx_val));
    }
  DONE;
}
  [(set_attr "type" "veccomplex")])
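
;; Added commentary (illustrative): the vsigned2/vunsigned2 expanders back
;; the vec_signed2/vec_unsigned2 intrinsics, which combine two V2DF inputs
;; into one V4SI result:
;;
;;   #include <altivec.h>
;;   vector signed int s2 (vector double a, vector double b)
;;   {
;;     return vec_signed2 (a, b);
;;   }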

;; Only optimize (float (fix x)) -> frz if we are in fast-math mode, since
;; the xvrdpiz instruction does not truncate the value if the floating
;; point value is < LONG_MIN or > LONG_MAX.
(define_insn "*vsx_float_fix_v2df2"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa,?wa")
        (float:V2DF
         (fix:V2DI
          (match_operand:V2DF 1 "vsx_register_operand" "wa,?wa"))))]
  "TARGET_HARD_FLOAT
   && VECTOR_UNIT_VSX_P (V2DFmode) && flag_unsafe_math_optimizations
   && !flag_trapping_math && TARGET_FRIZ"
  "xvrdpiz %x0,%x1"
  [(set_attr "type" "vecdouble")])

;; Permute operations

;; Build a V2DF/V2DI vector from two scalars
(define_insn "vsx_concat_<mode>"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa,we")
        (vec_concat:VSX_D
         (match_operand:<VEC_base> 1 "gpc_reg_operand" "wa,b")
         (match_operand:<VEC_base> 2 "gpc_reg_operand" "wa,b")))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  if (which_alternative == 0)
    return (BYTES_BIG_ENDIAN
            ? "xxpermdi %x0,%x1,%x2,0"
            : "xxpermdi %x0,%x2,%x1,0");

  else if (which_alternative == 1)
    return (BYTES_BIG_ENDIAN
            ? "mtvsrdd %x0,%1,%2"
            : "mtvsrdd %x0,%2,%1");

  else
    gcc_unreachable ();
}
  [(set_attr "type" "vecperm,vecmove")])
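
;; Added commentary (illustrative): a V2DF built from two scalars, which is
;; what vsx_concat_<mode> implements:
;;
;;   vector double mk2 (double a, double b)
;;   {
;;     return (vector double) { a, b };   /* xxpermdi or mtvsrdd  */
;;   }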

;; Combiner patterns to allow creating XXPERMDI's to access either double
;; word element in a vector register.
(define_insn "*vsx_concat_<mode>_1"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_concat:VSX_D
         (vec_select:<VEC_base>
          (match_operand:VSX_D 1 "gpc_reg_operand" "wa")
          (parallel [(match_operand:QI 2 "const_0_to_1_operand" "n")]))
         (match_operand:<VEC_base> 3 "gpc_reg_operand" "wa")))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  HOST_WIDE_INT dword = INTVAL (operands[2]);
  if (BYTES_BIG_ENDIAN)
    {
      operands[4] = GEN_INT (2 * dword);
      return "xxpermdi %x0,%x1,%x3,%4";
    }
  else
    {
      operands[4] = GEN_INT (!dword);
      return "xxpermdi %x0,%x3,%x1,%4";
    }
}
  [(set_attr "type" "vecperm")])

(define_insn "*vsx_concat_<mode>_2"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_concat:VSX_D
         (match_operand:<VEC_base> 1 "gpc_reg_operand" "wa")
         (vec_select:<VEC_base>
          (match_operand:VSX_D 2 "gpc_reg_operand" "wa")
          (parallel [(match_operand:QI 3 "const_0_to_1_operand" "n")]))))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  HOST_WIDE_INT dword = INTVAL (operands[3]);
  if (BYTES_BIG_ENDIAN)
    {
      operands[4] = GEN_INT (dword);
      return "xxpermdi %x0,%x1,%x2,%4";
    }
  else
    {
      operands[4] = GEN_INT (2 * !dword);
      return "xxpermdi %x0,%x2,%x1,%4";
    }
}
  [(set_attr "type" "vecperm")])

(define_insn "*vsx_concat_<mode>_3"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_concat:VSX_D
         (vec_select:<VEC_base>
          (match_operand:VSX_D 1 "gpc_reg_operand" "wa")
          (parallel [(match_operand:QI 2 "const_0_to_1_operand" "n")]))
         (vec_select:<VEC_base>
          (match_operand:VSX_D 3 "gpc_reg_operand" "wa")
          (parallel [(match_operand:QI 4 "const_0_to_1_operand" "n")]))))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  HOST_WIDE_INT dword1 = INTVAL (operands[2]);
  HOST_WIDE_INT dword2 = INTVAL (operands[4]);
  if (BYTES_BIG_ENDIAN)
    {
      operands[5] = GEN_INT ((2 * dword1) + dword2);
      return "xxpermdi %x0,%x1,%x3,%5";
    }
  else
    {
      operands[5] = GEN_INT ((2 * !dword2) + !dword1);
      return "xxpermdi %x0,%x3,%x1,%5";
    }
}
  [(set_attr "type" "vecperm")])

;; Special purpose concat using xxpermdi to glue two single precision values
;; together, relying on the fact that internally scalar floats are represented
;; as doubles.  This is used to initialize a V4SF vector with 4 floats
(define_insn "vsx_concat_v2sf"
  [(set (match_operand:V2DF 0 "vsx_register_operand" "=wa")
        (unspec:V2DF
         [(match_operand:SF 1 "vsx_register_operand" "wa")
          (match_operand:SF 2 "vsx_register_operand" "wa")]
         UNSPEC_VSX_CONCAT))]
  "VECTOR_MEM_VSX_P (V2DFmode)"
{
  if (BYTES_BIG_ENDIAN)
    return "xxpermdi %x0,%x1,%x2,0";
  else
    return "xxpermdi %x0,%x2,%x1,0";
}
  [(set_attr "type" "vecperm")])

;; Concatenate 4 SImode elements into a V4SImode reg.
(define_expand "vsx_init_v4si"
  [(use (match_operand:V4SI 0 "gpc_reg_operand"))
   (use (match_operand:SI 1 "gpc_reg_operand"))
   (use (match_operand:SI 2 "gpc_reg_operand"))
   (use (match_operand:SI 3 "gpc_reg_operand"))
   (use (match_operand:SI 4 "gpc_reg_operand"))]
  "VECTOR_MEM_VSX_P (V4SImode) && TARGET_DIRECT_MOVE_64BIT"
{
  rtx a = gen_lowpart_SUBREG (DImode, operands[1]);
  rtx b = gen_lowpart_SUBREG (DImode, operands[2]);
  rtx c = gen_lowpart_SUBREG (DImode, operands[3]);
  rtx d = gen_lowpart_SUBREG (DImode, operands[4]);
  if (!BYTES_BIG_ENDIAN)
    {
      std::swap (a, b);
      std::swap (c, d);
    }

  rtx ab = gen_reg_rtx (DImode);
  rtx cd = gen_reg_rtx (DImode);
  emit_insn (gen_rotldi3_insert_3 (ab, a, GEN_INT (32), b,
                                   GEN_INT (0xffffffff)));
  emit_insn (gen_rotldi3_insert_3 (cd, c, GEN_INT (32), d,
                                   GEN_INT (0xffffffff)));

  rtx abcd = gen_reg_rtx (V2DImode);
  emit_insn (gen_vsx_concat_v2di (abcd, ab, cd));
  emit_move_insn (operands[0], gen_lowpart (V4SImode, abcd));
  DONE;
})
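
;; Added commentary (illustrative): a V4SI built from four GPR values, which
;; vsx_init_v4si expands with two rotate-and-insert ops plus a concat:
;;
;;   vector int mk4 (int a, int b, int c, int d)
;;   {
;;     return (vector int) { a, b, c, d };
;;   }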

;; xxpermdi for little endian loads and stores.  We need several of
;; these since the form of the PARALLEL differs by mode.
(define_insn "*vsx_xxpermdi2_le_<mode>"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_D
         (match_operand:VSX_D 1 "vsx_register_operand" "wa")
         (parallel [(const_int 1) (const_int 0)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (<MODE>mode)"
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

(define_insn "xxswapd_v16qi"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (vec_select:V16QI
         (match_operand:V16QI 1 "vsx_register_operand" "wa")
         (parallel [(const_int 8) (const_int 9)
                    (const_int 10) (const_int 11)
                    (const_int 12) (const_int 13)
                    (const_int 14) (const_int 15)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)
                    (const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)])))]
  "TARGET_VSX"
;; AIX does not support the extended mnemonic xxswapd.  Use the basic
;; mnemonic xxpermdi instead.
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

(define_insn "xxswapd_v8hi"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
        (vec_select:V8HI
         (match_operand:V8HI 1 "vsx_register_operand" "wa")
         (parallel [(const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)])))]
  "TARGET_VSX"
;; AIX does not support the extended mnemonic xxswapd.  Use the basic
;; mnemonic xxpermdi instead.
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

(define_insn "xxswapd_<mode>"
  [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_W
         (match_operand:VSX_W 1 "vsx_register_operand" "wa")
         (parallel [(const_int 2) (const_int 3)
                    (const_int 0) (const_int 1)])))]
  "TARGET_VSX"
;; AIX does not support the extended mnemonic xxswapd.  Use the basic
;; mnemonic xxpermdi instead.
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

(define_insn "xxswapd_<mode>"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_D
         (match_operand:VSX_D 1 "vsx_register_operand" "wa")
         (parallel [(const_int 1) (const_int 0)])))]
  "TARGET_VSX"
;; AIX does not support the extended mnemonic xxswapd.  Use the basic
;; mnemonic xxpermdi instead.
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

;; Swap upper/lower 64-bit values in a 128-bit vector
(define_insn "xxswapd_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
        (subreg:V1TI
         (vec_select:V2DI
          (subreg:V2DI
           (match_operand:V1TI 1 "vsx_register_operand" "v") 0)
          (parallel [(const_int 1) (const_int 0)]))
         0))]
  "TARGET_POWER10"
;; AIX does not support the extended mnemonic xxswapd.  Use the basic
;; mnemonic xxpermdi instead.
  "xxpermdi %x0,%x1,%x1,2"
  [(set_attr "type" "vecperm")])

(define_insn "xxgenpcvm_<mode>_internal"
  [(set (match_operand:VSX_EXTRACT_I4 0 "altivec_register_operand" "=wa")
        (unspec:VSX_EXTRACT_I4
         [(match_operand:VSX_EXTRACT_I4 1 "altivec_register_operand" "v")
          (match_operand:QI 2 "const_0_to_3_operand" "n")]
         UNSPEC_XXGENPCV))]
  "TARGET_POWER10"
  "xxgenpcv<wd>m %x0,%1,%2"
  [(set_attr "type" "vecsimple")])

(define_expand "xxgenpcvm_<mode>"
  [(use (match_operand:VSX_EXTRACT_I4 0 "register_operand"))
   (use (match_operand:VSX_EXTRACT_I4 1 "register_operand"))
   (use (match_operand:QI 2 "immediate_operand"))]
  "TARGET_POWER10"
{
  if (!BYTES_BIG_ENDIAN)
    {
      /* gen_xxgenpcvm assumes big endian element order.  For little
         endian, swap the upper and lower doublewords first.  */
      rtx tmp = gen_reg_rtx (<MODE>mode);

      emit_insn (gen_xxswapd_<mode> (tmp, operands[1]));
      operands[1] = tmp;
    }
  emit_insn (gen_xxgenpcvm_<mode>_internal (operands[0], operands[1],
                                            operands[2]));
  DONE;
})

;; lxvd2x for little endian loads.  We need several of
;; these since the form of the PARALLEL differs by mode.
(define_insn "*vsx_lxvd2x2_le_<mode>"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_D
         (match_operand:VSX_D 1 "memory_operand" "Z")
         (parallel [(const_int 1) (const_int 0)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (<MODE>mode) && !TARGET_P9_VECTOR"
  "lxvd2x %x0,%y1"
  [(set_attr "type" "vecload")])

(define_insn "*vsx_lxvd2x4_le_<mode>"
  [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_W
         (match_operand:VSX_W 1 "memory_operand" "Z")
         (parallel [(const_int 2) (const_int 3)
                    (const_int 0) (const_int 1)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (<MODE>mode) && !TARGET_P9_VECTOR"
  "lxvd2x %x0,%y1"
  [(set_attr "type" "vecload")])

(define_insn "*vsx_lxvd2x8_le_V8HI"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
        (vec_select:V8HI
         (match_operand:V8HI 1 "memory_operand" "Z")
         (parallel [(const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (V8HImode) && !TARGET_P9_VECTOR"
  "lxvd2x %x0,%y1"
  [(set_attr "type" "vecload")])

(define_insn "*vsx_lxvd2x16_le_V16QI"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
        (vec_select:V16QI
         (match_operand:V16QI 1 "memory_operand" "Z")
         (parallel [(const_int 8) (const_int 9)
                    (const_int 10) (const_int 11)
                    (const_int 12) (const_int 13)
                    (const_int 14) (const_int 15)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)
                    (const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (V16QImode) && !TARGET_P9_VECTOR"
  "lxvd2x %x0,%y1"
  [(set_attr "type" "vecload")])

;; stxvd2x for little endian stores.  We need several of
;; these since the form of the PARALLEL differs by mode.
(define_insn "*vsx_stxvd2x2_le_<mode>"
  [(set (match_operand:VSX_D 0 "memory_operand" "=Z")
        (vec_select:VSX_D
         (match_operand:VSX_D 1 "vsx_register_operand" "wa")
         (parallel [(const_int 1) (const_int 0)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (<MODE>mode) && !TARGET_P9_VECTOR"
  "stxvd2x %x1,%y0"
  [(set_attr "type" "vecstore")])

(define_insn "*vsx_stxvd2x4_le_<mode>"
  [(set (match_operand:VSX_W 0 "memory_operand" "=Z")
        (vec_select:VSX_W
         (match_operand:VSX_W 1 "vsx_register_operand" "wa")
         (parallel [(const_int 2) (const_int 3)
                    (const_int 0) (const_int 1)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (<MODE>mode) && !TARGET_P9_VECTOR"
  "stxvd2x %x1,%y0"
  [(set_attr "type" "vecstore")])

(define_insn_and_split "vsx_stxvd2x4_le_const_<mode>"
  [(set (match_operand:VSX_W 0 "memory_operand" "=Z")
        (match_operand:VSX_W 1 "immediate_operand" "W"))]
  "!BYTES_BIG_ENDIAN
   && VECTOR_MEM_VSX_P (<MODE>mode)
   && !TARGET_P9_VECTOR
   && const_vec_duplicate_p (operands[1])
   && can_create_pseudo_p ()"
  "#"
  "&& 1"
  [(set (match_dup 2)
        (match_dup 1))
   (set (match_dup 0)
        (vec_select:VSX_W
         (match_dup 2)
         (parallel [(const_int 2) (const_int 3)
                    (const_int 0) (const_int 1)])))]
{
  /* Here all the constants must be loaded without memory.  */
  gcc_assert (easy_altivec_constant (operands[1], <MODE>mode));
  operands[2] = gen_reg_rtx (<MODE>mode);
}
  [(set_attr "type" "vecstore")
   (set_attr "length" "8")])

(define_insn "*vsx_stxvd2x8_le_V8HI"
  [(set (match_operand:V8HI 0 "memory_operand" "=Z")
        (vec_select:V8HI
         (match_operand:V8HI 1 "vsx_register_operand" "wa")
         (parallel [(const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (V8HImode) && !TARGET_P9_VECTOR"
  "stxvd2x %x1,%y0"
  [(set_attr "type" "vecstore")])

(define_insn "*vsx_stxvd2x16_le_V16QI"
  [(set (match_operand:V16QI 0 "memory_operand" "=Z")
        (vec_select:V16QI
         (match_operand:V16QI 1 "vsx_register_operand" "wa")
         (parallel [(const_int 8) (const_int 9)
                    (const_int 10) (const_int 11)
                    (const_int 12) (const_int 13)
                    (const_int 14) (const_int 15)
                    (const_int 0) (const_int 1)
                    (const_int 2) (const_int 3)
                    (const_int 4) (const_int 5)
                    (const_int 6) (const_int 7)])))]
  "!BYTES_BIG_ENDIAN && VECTOR_MEM_VSX_P (V16QImode) && !TARGET_P9_VECTOR"
  "stxvd2x %x1,%y0"
  [(set_attr "type" "vecstore")])

;; Convert a TImode value into V1TImode
(define_expand "vsx_set_v1ti"
  [(match_operand:V1TI 0 "nonimmediate_operand")
   (match_operand:V1TI 1 "nonimmediate_operand")
   (match_operand:TI 2 "input_operand")
   (match_operand:QI 3 "u5bit_cint_operand")]
  "VECTOR_MEM_VSX_P (V1TImode)"
{
  if (operands[3] != const0_rtx)
    gcc_unreachable ();

  /* The new TI value is operand 2; a V1TI has only one element, so the
     result is just that value viewed as V1TI.  */
  emit_move_insn (operands[0], gen_lowpart (V1TImode, operands[2]));
  DONE;
})

;; Rewrite V2DF/V2DI set in terms of VEC_CONCAT
(define_expand "vsx_set_<mode>"
  [(use (match_operand:VSX_D 0 "vsx_register_operand"))
   (use (match_operand:VSX_D 1 "vsx_register_operand"))
   (use (match_operand:<VEC_base> 2 "gpc_reg_operand"))
   (use (match_operand:QI 3 "const_0_to_1_operand"))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  rtx dest = operands[0];
  rtx vec_reg = operands[1];
  rtx value = operands[2];
  rtx ele = operands[3];
  rtx tmp = gen_reg_rtx (<VEC_base>mode);

  if (ele == const0_rtx)
    {
      emit_insn (gen_vsx_extract_<mode> (tmp, vec_reg, const1_rtx));
      emit_insn (gen_vsx_concat_<mode> (dest, value, tmp));
      DONE;
    }
  else if (ele == const1_rtx)
    {
      emit_insn (gen_vsx_extract_<mode> (tmp, vec_reg, const0_rtx));
      emit_insn (gen_vsx_concat_<mode> (dest, tmp, value));
      DONE;
    }
  else
    gcc_unreachable ();
})

;; Extract a DF/DI element from V2DF/V2DI
;; Optimize cases where we can do a simple or direct move.
;; Or see if we can avoid doing the move at all

(define_expand "vsx_extract_<mode>"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand")
        (vec_select:<VEC_base>
         (match_operand:VSX_D 1 "gpc_reg_operand")
         (parallel
          [(match_operand:QI 2 "const_0_to_1_operand")])))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
  "")

(define_insn "*vsx_extract_<mode>_0"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=wa,wa,wr")
        (vec_select:<VEC_base>
         (match_operand:VSX_D 1 "gpc_reg_operand" "0,wa,wa")
         (parallel
          [(match_operand:QI 2 "const_0_to_1_operand" "n,n,n")])))]
  "VECTOR_MEM_VSX_P (<MODE>mode)
   && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 0 : 1)"
{
  if (which_alternative == 0)
    return ASM_COMMENT_START " vec_extract to same register";

  if (which_alternative == 2)
    return "mfvsrd %0,%x1";

  return "xxlor %x0,%x1,%x1";
}
  [(set_attr "type" "*,veclogical,mfvsr")
   (set_attr "isa" "*,*,p8v")
   (set_attr "length" "0,*,*")])

(define_insn "*vsx_extract_<mode>_1"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=wa,wr")
        (vec_select:<VEC_base>
         (match_operand:VSX_D 1 "gpc_reg_operand" "wa,wa")
         (parallel
          [(match_operand:QI 2 "const_0_to_1_operand" "n,n")])))]
  "VECTOR_MEM_VSX_P (<MODE>mode)
   && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 1 : 0)"
{
  if (which_alternative == 1)
    return "mfvsrld %0,%x1";

  operands[3] = GEN_INT (BYTES_BIG_ENDIAN ? 2 : 3);
  return "xxpermdi %x0,%x1,%x1,%3";
}
  [(set_attr "type" "mfvsr,vecperm")
   (set_attr "isa" "*,p9v")])
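
;; Added commentary (illustrative): extracting a doubleword element, handled
;; by the patterns above:
;;
;;   #include <altivec.h>
;;   double get0 (vector double v)
;;   {
;;     return vec_extract (v, 0);   /* often no code, or a single mfvsrd  */
;;   }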

;; Optimize extracting a single scalar element from memory.
(define_insn_and_split "*vsx_extract_<P:mode>_<VSX_D:mode>_load"
  [(set (match_operand:<VSX_D:VEC_base> 0 "register_operand" "=wa,wr")
        (vec_select:<VSX_D:VEC_base>
         (match_operand:VSX_D 1 "memory_operand" "m,m")
         (parallel [(match_operand:QI 2 "const_0_to_1_operand" "n,n")])))
   (clobber (match_scratch:P 3 "=&b,&b"))]
  "TARGET_POWERPC64 && VECTOR_MEM_VSX_P (<VSX_D:MODE>mode)"
  "#"
  "&& reload_completed"
  [(set (match_dup 0) (match_dup 4))]
{
  operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
                                           operands[3], <VSX_D:VEC_base>mode);
}
  [(set_attr "type" "fpload,load")
   (set_attr "length" "8")])

;; Optimize storing a single scalar element that is in the right location
;; to store.
(define_insn "*vsx_extract_<mode>_store"
  [(set (match_operand:<VEC_base> 0 "memory_operand" "=m,Z,wY")
        (vec_select:<VEC_base>
         (match_operand:VSX_D 1 "register_operand" "d,v,v")
         (parallel [(match_operand:QI 2 "vsx_scalar_64bit" "n,n,n")])))]
  "VECTOR_MEM_VSX_P (<MODE>mode)
   && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 0 : 1)"
  "@
   stfd%U0%X0 %1,%0
   stxsdx %x1,%y0
   stxsd %1,%0"
  [(set_attr "type" "fpstore")
   (set_attr "isa" "*,p7v,p9v")])

;; Variable V2DI/V2DF extract shift
(define_insn "vsx_vslo_<mode>"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=v")
        (unspec:<VEC_base> [(match_operand:VSX_D 1 "gpc_reg_operand" "v")
                            (match_operand:V2DI 2 "gpc_reg_operand" "v")]
                           UNSPEC_VSX_VSLO))]
  "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
  "vslo %0,%1,%2"
  [(set_attr "type" "vecperm")])

;; Variable V2DI/V2DF extract from a register
(define_insn_and_split "vsx_extract_<mode>_var"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=v")
        (unspec:<VEC_base> [(match_operand:VSX_D 1 "gpc_reg_operand" "v")
                            (match_operand:DI 2 "gpc_reg_operand" "r")]
                           UNSPEC_VSX_EXTRACT))
   (clobber (match_scratch:DI 3 "=r"))
   (clobber (match_scratch:V2DI 4 "=&v"))]
  "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
  "#"
  "&& reload_completed"
  [(const_int 0)]
{
  rs6000_split_vec_extract_var (operands[0], operands[1], operands[2],
                                operands[3], operands[4]);
  DONE;
})

;; Variable V2DI/V2DF extract from memory
(define_insn_and_split "*vsx_extract_<mode>_var_load"
  [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=wa,r")
        (unspec:<VEC_base> [(match_operand:VSX_D 1 "memory_operand" "Q,Q")
                            (match_operand:DI 2 "gpc_reg_operand" "r,r")]
                           UNSPEC_VSX_EXTRACT))
   (clobber (match_scratch:DI 3 "=&b,&b"))]
  "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
  "#"
  "&& reload_completed"
  [(set (match_dup 0) (match_dup 4))]
{
  operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
                                           operands[3], <VEC_base>mode);
}
  [(set_attr "type" "fpload,load")])

;; Extract a SF element from V4SF
(define_insn_and_split "vsx_extract_v4sf"
  [(set (match_operand:SF 0 "vsx_register_operand" "=wa")
        (vec_select:SF
         (match_operand:V4SF 1 "vsx_register_operand" "wa")
         (parallel [(match_operand:QI 2 "u5bit_cint_operand" "n")])))
   (clobber (match_scratch:V4SF 3 "=0"))]
  "VECTOR_UNIT_VSX_P (V4SFmode)"
  "#"
  "&& 1"
  [(const_int 0)]
{
  rtx op0 = operands[0];
  rtx op1 = operands[1];
  rtx op2 = operands[2];
  rtx op3 = operands[3];
  rtx tmp;
  HOST_WIDE_INT ele = BYTES_BIG_ENDIAN ? INTVAL (op2) : 3 - INTVAL (op2);

  if (ele == 0)
    tmp = op1;
  else
    {
      if (GET_CODE (op3) == SCRATCH)
        op3 = gen_reg_rtx (V4SFmode);
      emit_insn (gen_vsx_xxsldwi_v4sf (op3, op1, op1, GEN_INT (ele)));
      tmp = op3;
    }
  emit_insn (gen_vsx_xscvspdp_scalar2 (op0, tmp));
  DONE;
}
  [(set_attr "length" "8")
   (set_attr "type" "fp")])

(define_insn_and_split "*vsx_extract_v4sf_<mode>_load"
  [(set (match_operand:SF 0 "register_operand" "=f,v,v,?r")
        (vec_select:SF
         (match_operand:V4SF 1 "memory_operand" "m,Z,m,m")
         (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n,n,n,n")])))
   (clobber (match_scratch:P 3 "=&b,&b,&b,&b"))]
  "VECTOR_MEM_VSX_P (V4SFmode)"
  "#"
  "&& reload_completed"
  [(set (match_dup 0) (match_dup 4))]
{
  operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
                                           operands[3], SFmode);
}
  [(set_attr "type" "fpload,fpload,fpload,load")
   (set_attr "length" "8")
   (set_attr "isa" "*,p7v,p9v,*")])

;; Variable V4SF extract from a register
(define_insn_and_split "vsx_extract_v4sf_var"
  [(set (match_operand:SF 0 "gpc_reg_operand" "=wa")
        (unspec:SF [(match_operand:V4SF 1 "gpc_reg_operand" "v")
                    (match_operand:DI 2 "gpc_reg_operand" "r")]
                   UNSPEC_VSX_EXTRACT))
   (clobber (match_scratch:DI 3 "=r"))
   (clobber (match_scratch:V2DI 4 "=&v"))]
  "VECTOR_MEM_VSX_P (V4SFmode) && TARGET_DIRECT_MOVE_64BIT"
  "#"
  "&& reload_completed"
  [(const_int 0)]
{
  rs6000_split_vec_extract_var (operands[0], operands[1], operands[2],
                                operands[3], operands[4]);
  DONE;
})

;; Variable V4SF extract from memory
(define_insn_and_split "*vsx_extract_v4sf_var_load"
  [(set (match_operand:SF 0 "gpc_reg_operand" "=wa,?r")
        (unspec:SF [(match_operand:V4SF 1 "memory_operand" "Q,Q")
                    (match_operand:DI 2 "gpc_reg_operand" "r,r")]
                   UNSPEC_VSX_EXTRACT))
   (clobber (match_scratch:DI 3 "=&b,&b"))]
  "VECTOR_MEM_VSX_P (V4SFmode) && TARGET_DIRECT_MOVE_64BIT"
  "#"
  "&& reload_completed"
  [(set (match_dup 0) (match_dup 4))]
{
  operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
                                           operands[3], SFmode);
}
  [(set_attr "type" "fpload,load")])

;; Expand the builtin form of xxpermdi to canonical rtl.
(define_expand "vsx_xxpermdi_<mode>"
  [(match_operand:VSX_L 0 "vsx_register_operand")
   (match_operand:VSX_L 1 "vsx_register_operand")
   (match_operand:VSX_L 2 "vsx_register_operand")
   (match_operand:QI 3 "u5bit_cint_operand")]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  rtx target = operands[0];
  rtx op0 = operands[1];
  rtx op1 = operands[2];
  int mask = INTVAL (operands[3]);
  rtx perm0 = GEN_INT ((mask >> 1) & 1);
  rtx perm1 = GEN_INT ((mask & 1) + 2);
  rtx (*gen) (rtx, rtx, rtx, rtx, rtx);

  if (<MODE>mode == V2DFmode)
    gen = gen_vsx_xxpermdi2_v2df_1;
  else
    {
      gen = gen_vsx_xxpermdi2_v2di_1;
      if (<MODE>mode != V2DImode)
        {
          target = gen_lowpart (V2DImode, target);
          op0 = gen_lowpart (V2DImode, op0);
          op1 = gen_lowpart (V2DImode, op1);
        }
    }
  emit_insn (gen (target, op0, op1, perm0, perm1));
  DONE;
})

;; Special version of xxpermdi that retains big-endian semantics.
(define_expand "vsx_xxpermdi_<mode>_be"
  [(match_operand:VSX_L 0 "vsx_register_operand")
   (match_operand:VSX_L 1 "vsx_register_operand")
   (match_operand:VSX_L 2 "vsx_register_operand")
   (match_operand:QI 3 "u5bit_cint_operand")]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  rtx target = operands[0];
  rtx op0 = operands[1];
  rtx op1 = operands[2];
  int mask = INTVAL (operands[3]);
  rtx perm0 = GEN_INT ((mask >> 1) & 1);
  rtx perm1 = GEN_INT ((mask & 1) + 2);
  rtx (*gen) (rtx, rtx, rtx, rtx, rtx);

  if (<MODE>mode == V2DFmode)
    gen = gen_vsx_xxpermdi2_v2df_1;
  else
    {
      gen = gen_vsx_xxpermdi2_v2di_1;
      if (<MODE>mode != V2DImode)
        {
          target = gen_lowpart (V2DImode, target);
          op0 = gen_lowpart (V2DImode, op0);
          op1 = gen_lowpart (V2DImode, op1);
        }
    }

  /* In little endian mode, vsx_xxpermdi2_<mode>_1 will perform a
     transformation we don't want; it is necessary for
     rs6000_expand_vec_perm_const_1 but not for this use.  So we
     prepare for that by reversing the transformation here.  */
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen (target, op0, op1, perm0, perm1));
  else
    {
      rtx p0 = GEN_INT (3 - INTVAL (perm1));
      rtx p1 = GEN_INT (3 - INTVAL (perm0));
      emit_insn (gen (target, op1, op0, p0, p1));
    }
  DONE;
})

(define_insn "vsx_xxpermdi2_<mode>_1"
  [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
        (vec_select:VSX_D
         (vec_concat:<VS_double>
          (match_operand:VSX_D 1 "vsx_register_operand" "wa")
          (match_operand:VSX_D 2 "vsx_register_operand" "wa"))
         (parallel [(match_operand 3 "const_0_to_1_operand" "")
                    (match_operand 4 "const_2_to_3_operand" "")])))]
  "VECTOR_MEM_VSX_P (<MODE>mode)"
{
  int op3, op4, mask;

  /* For little endian, swap operands and invert/swap selectors
     to get the correct xxpermdi.  The operand swap sets up the
     inputs as a little endian array.  The selectors are swapped
     because they are defined to use big endian ordering.  The
     selectors are inverted to get the correct doublewords for
     little endian ordering.  */
  if (BYTES_BIG_ENDIAN)
    {
      op3 = INTVAL (operands[3]);
      op4 = INTVAL (operands[4]);
    }
  else
    {
      op3 = 3 - INTVAL (operands[4]);
      op4 = 3 - INTVAL (operands[3]);
    }

  mask = (op3 << 1) | (op4 - 2);
  operands[3] = GEN_INT (mask);

  if (BYTES_BIG_ENDIAN)
    return "xxpermdi %x0,%x1,%x2,%3";
  else
    return "xxpermdi %x0,%x2,%x1,%3";
}
  [(set_attr "type" "vecperm")])
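
;; Added commentary (worked example, not from the original): for selectors
;; op3 = 1 and op4 = 2 on a big endian target, mask = (1 << 1) | (2 - 2) = 2,
;; giving "xxpermdi %x0,%x1,%x2,2": doubleword 1 of the first input becomes
;; doubleword 0 of the result, and doubleword 0 of the second input becomes
;; doubleword 1.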
3801 ;; Extraction of a single element in a small integer vector. Until ISA 3.0,
3802 ;; none of the small types were allowed in a vector register, so we had to
3803 ;; extract to a DImode and either do a direct move or store.
3804 (define_expand "vsx_extract_<mode>"
3805 [(parallel [(set (match_operand:<VEC_base> 0 "gpc_reg_operand")
3806 (vec_select:<VEC_base>
3807 (match_operand:VSX_EXTRACT_I2 1 "gpc_reg_operand")
3808 (parallel [(match_operand:QI 2 "const_int_operand")])))
3809 (clobber (match_scratch:VSX_EXTRACT_I2 3))])]
3810 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
3812 /* If we have ISA 3.0, we can do a xxextractuw/vextractu{b,h}. */
3813 if (TARGET_P9_VECTOR)
3815 emit_insn (gen_vsx_extract_<mode>_p9 (operands[0], operands[1],
3821 (define_expand "vsx_extract_v4si"
3822 [(parallel [(set (match_operand:SI 0 "gpc_reg_operand")
3824 (match_operand:V4SI 1 "gpc_reg_operand")
3825 (parallel [(match_operand:QI 2 "const_0_to_3_operand")])))
3826 (clobber (match_scratch:V4SI 3))])]
3827 "TARGET_DIRECT_MOVE_64BIT"
3829 /* The word 1 (BE order) can be extracted by mfvsrwz/stxsiwx. So just
3830 fall through to vsx_extract_v4si_w1. */
3831 if (TARGET_P9_VECTOR
3832 && INTVAL (operands[2]) != (BYTES_BIG_ENDIAN ? 1 : 2))
3834 emit_insn (gen_vsx_extract_v4si_p9 (operands[0], operands[1],
3840 ;; Extract from word 1 (BE order).
3841 (define_insn "vsx_extract_v4si_w1"
3842 [(set (match_operand:SI 0 "nonimmediate_operand" "=r,wa,Z,wa")
3844 (match_operand:V4SI 1 "gpc_reg_operand" "v,v,v,0")
3845 (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n,n,n,n")])))
3846 (clobber (match_scratch:V4SI 3 "=v,v,v,v"))]
3847 "TARGET_DIRECT_MOVE_64BIT
3848 && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 1 : 2)"
3850 if (which_alternative == 0)
3851 return "mfvsrwz %0,%x1";
3853 if (which_alternative == 1)
3854 return "xxlor %x0,%x1,%x1";
3856 if (which_alternative == 2)
3857 return "stxsiwx %x1,%y0";
3859 return ASM_COMMENT_START " vec_extract to same register";
3861 [(set_attr "type" "mfvsr,veclogical,fpstore,*")
3862 (set_attr "length" "4,4,4,0")
3863 (set_attr "isa" "p8v,*,p8v,*")])
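;; Hedged example for the word-1 fast path (hypothetical source): on little
;; endian,
;;
;;   int get_w2 (vector int v) { return vec_extract (v, 2); }
;;
;; selects BE word 1, so a single mfvsrwz (or stxsiwx if the result is
;; immediately stored) is expected, with no preceding permute.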
3865 (define_insn "*mfvsrwz"
3866 [(set (match_operand:DI 0 "register_operand" "=r")
3867 (zero_extend:DI
3868 (vec_select:SI
3869 (match_operand:V4SI 1 "vsx_register_operand" "wa")
3870 (parallel [(match_operand:QI 2 "const_int_operand" "n")]))))
3871 (clobber (match_scratch:V4SI 3 "=v"))]
3872 "TARGET_DIRECT_MOVE_64BIT
3873 && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 1 : 2)"
3874 "mfvsrwz %0,%x1"
3875 [(set_attr "type" "mfvsr")
3876 (set_attr "isa" "p8v")])
3878 (define_insn "vsx_extract_<mode>_p9"
3879 [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=r,<VSX_EX>")
3880 (vec_select:<VEC_base>
3881 (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v,<VSX_EX>")
3882 (parallel [(match_operand:QI 2 "<VSX_EXTRACT_PREDICATE>" "n,n")])))
3883 (clobber (match_scratch:SI 3 "=r,X"))]
3884 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_VEXTRACTUB"
3886 if (which_alternative == 0)
3891 HOST_WIDE_INT elt = INTVAL (operands[2]);
3892 HOST_WIDE_INT elt_adj = (!BYTES_BIG_ENDIAN
3893 ? GET_MODE_NUNITS (<MODE>mode) - 1 - elt
3896 HOST_WIDE_INT unit_size = GET_MODE_UNIT_SIZE (<MODE>mode);
3897 HOST_WIDE_INT offset = unit_size * elt_adj;
3899 operands[2] = GEN_INT (offset);
3901 return "xxextractuw %x0,%x1,%2";
3903 return "vextractu<wd> %0,%1,%2";
3906 [(set_attr "type" "vecsimple")
3907 (set_attr "isa" "p9v,*")])
3910 [(set (match_operand:<VEC_base> 0 "int_reg_operand")
3911 (vec_select:<VEC_base>
3912 (match_operand:VSX_EXTRACT_I 1 "altivec_register_operand")
3913 (parallel [(match_operand:QI 2 "const_int_operand")])))
3914 (clobber (match_operand:SI 3 "int_reg_operand"))]
3915 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_VEXTRACTUB && reload_completed"
3918 rtx op0_si = gen_rtx_REG (SImode, REGNO (operands[0]));
3919 rtx op1 = operands[1];
3920 rtx op2 = operands[2];
3921 rtx op3 = operands[3];
3922 HOST_WIDE_INT offset = INTVAL (op2) * GET_MODE_UNIT_SIZE (<MODE>mode);
3924 emit_move_insn (op3, GEN_INT (offset));
3925 if (BYTES_BIG_ENDIAN)
3926 emit_insn (gen_vextu<wd>lx (op0_si, op3, op1));
3927 else
3928 emit_insn (gen_vextu<wd>rx (op0_si, op3, op1));
3929 DONE;
3930 })
3932 ;; Optimize zero extracts to eliminate the AND after the extract.
3933 (define_insn_and_split "*vsx_extract_<mode>_di_p9"
3934 [(set (match_operand:DI 0 "gpc_reg_operand" "=r,<VSX_EX>")
3936 (vec_select:<VEC_base>
3937 (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v,<VSX_EX>")
3938 (parallel [(match_operand:QI 2 "const_int_operand" "n,n")]))))
3939 (clobber (match_scratch:SI 3 "=r,X"))]
3940 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_VEXTRACTUB"
3942 "&& reload_completed"
3943 [(parallel [(set (match_dup 4)
3944 (vec_select:<VEC_base>
3945 (match_dup 1)
3946 (parallel [(match_dup 2)])))
3947 (clobber (match_dup 3))])]
3949 gcc_assert (<MODE>mode != V4SImode
3950 || INTVAL (operands[2]) != (BYTES_BIG_ENDIAN ? 1 : 2));
3952 operands[4] = gen_rtx_REG (<VEC_base>mode, REGNO (operands[0]));
3954 [(set_attr "isa" "p9v,*")])
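;; A sketch of the zero-extend case this split covers (assumptions: ISA 3.0,
;; 64-bit):
;;
;;   unsigned long long get_ub5 (vector unsigned char v)
;;   {
;;     return vec_extract (v, 5);
;;   }
;;
;; The ISA 3.0 extract already delivers the byte zero extended in a GPR, so
;; the explicit AND masking that would otherwise follow the extract is
;; eliminated.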
3956 ;; Optimize stores to use the ISA 3.0 scalar store instructions
3957 (define_insn_and_split "*vsx_extract_<mode>_store_p9"
3958 [(set (match_operand:<VEC_base> 0 "memory_operand" "=Z,m")
3959 (vec_select:<VEC_base>
3960 (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "<VSX_EX>,v")
3961 (parallel [(match_operand:QI 2 "const_int_operand" "n,n")])))
3962 (clobber (match_scratch:<VEC_base> 3 "=<VSX_EX>,&*r"))
3963 (clobber (match_scratch:SI 4 "=X,&r"))]
3964 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_VEXTRACTUB"
3966 "&& reload_completed"
3967 [(parallel [(set (match_dup 3)
3968 (vec_select:<VEC_base>
3969 (match_dup 1)
3970 (parallel [(match_dup 2)])))
3971 (clobber (match_dup 4))])
3975 if (which_alternative == 0
3976 && ((<MODE>mode == V16QImode
3977 && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 7 : 8))
3978 || (<MODE>mode == V8HImode
3979 && INTVAL (operands[2]) == (BYTES_BIG_ENDIAN ? 3 : 4))))
3980 {
3981 enum machine_mode dest_mode = GET_MODE (operands[0]);
3982 emit_move_insn (operands[0],
3983 gen_rtx_REG (dest_mode, REGNO (operands[3])));
3984 DONE;
3985 }
3986 })
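;; Hedged example of the store form (hypothetical source, ISA 3.0):
;;
;;   void store_h1 (short *p, vector short v)
;;   {
;;     *p = vec_extract (v, 1);
;;   }
;;
;; The element is moved within the vector register and stored with a scalar
;; store such as stxsihx, never passing through a GPR.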
3989 ;; Extract from word 0, 2, 3 (BE order).
3990 (define_insn_and_split "*vsx_extract_v4si_w023"
3991 [(set (match_operand:SI 0 "nonimmediate_operand" "=r,wa,Z")
3992 (vec_select:SI
3993 (match_operand:V4SI 1 "gpc_reg_operand" "v,v,v")
3994 (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n,n,n")])))
3995 (clobber (match_scratch:V4SI 3 "=v,v,v"))]
3996 "TARGET_DIRECT_MOVE_64BIT"
3998 "&& INTVAL (operands[2]) != (BYTES_BIG_ENDIAN ? 1 : 2)"
4001 gcc_assert (!TARGET_P9_VECTOR);
4003 rtx dest = operands[0];
4004 rtx src = operands[1];
4005 rtx element = operands[2];
4008 if (GET_CODE (operands[3]) == SCRATCH)
4009 vec_tmp = gen_reg_rtx (V4SImode);
4010 else
4011 vec_tmp = operands[3];
4013 /* Adjust the index for LE element ordering; the minuend 3 below is
4014 GET_MODE_NUNITS (V4SImode) - 1. */
4015 if (!BYTES_BIG_ENDIAN)
4016 element = GEN_INT (3 - INTVAL (element));
4018 emit_insn (gen_altivec_vspltw_direct (vec_tmp, src, element));
4020 int value = BYTES_BIG_ENDIAN ? 1 : 2;
4021 emit_insn (gen_vsx_extract_v4si_w1 (dest, vec_tmp, GEN_INT (value)));
4022 DONE;
4023 })
4026 (define_insn_and_split "*vsx_extract_<mode>_p8"
4027 [(set (match_operand:<VEC_base> 0 "nonimmediate_operand" "=r")
4028 (vec_select:<VEC_base>
4029 (match_operand:VSX_EXTRACT_I2 1 "gpc_reg_operand" "v")
4030 (parallel [(match_operand:QI 2 "<VSX_EXTRACT_PREDICATE>" "n")])))
4031 (clobber (match_scratch:VSX_EXTRACT_I2 3 "=v"))]
4032 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT
4033 && !TARGET_P9_VECTOR"
4035 "&& reload_completed"
4038 rtx dest = operands[0];
4039 rtx src = operands[1];
4040 rtx element = operands[2];
4041 rtx vec_tmp = operands[3];
4044 if (!BYTES_BIG_ENDIAN)
4045 element = GEN_INT (GET_MODE_NUNITS (<MODE>mode) - 1 - INTVAL (element));
4047 /* If the value is in the correct position, we can avoid doing the VSPLT<x>
4048 instruction. */
4049 value = INTVAL (element);
4050 if (<MODE>mode == V16QImode)
4051 {
4052 if (value != 7)
4053 emit_insn (gen_altivec_vspltb_direct (vec_tmp, src, element));
4054 else
4055 vec_tmp = src;
4056 }
4057 else if (<MODE>mode == V8HImode)
4058 {
4059 if (value != 3)
4060 emit_insn (gen_altivec_vsplth_direct (vec_tmp, src, element));
4061 else
4062 vec_tmp = src;
4063 }
4064 else
4065 gcc_unreachable ();
4067 emit_move_insn (gen_rtx_REG (DImode, REGNO (dest)),
4068 gen_rtx_REG (DImode, REGNO (vec_tmp)));
4069 DONE;
4070 }
4071 [(set_attr "type" "mfvsr")])
4073 ;; Optimize extracting a single scalar element from memory.
4074 (define_insn_and_split "*vsx_extract_<mode>_load"
4075 [(set (match_operand:<VEC_base> 0 "register_operand" "=r")
4076 (vec_select:<VEC_base>
4077 (match_operand:VSX_EXTRACT_I 1 "memory_operand" "m")
4078 (parallel [(match_operand:QI 2 "<VSX_EXTRACT_PREDICATE>" "n")])))
4079 (clobber (match_scratch:DI 3 "=&b"))]
4080 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
4082 "&& reload_completed"
4083 [(set (match_dup 0) (match_dup 4))]
4085 operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
4086 operands[3], <VEC_base>mode);
4088 [(set_attr "type" "load")
4089 (set_attr "length" "8")])
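;; A sketch of the in-memory case (hypothetical source): when the whole
;; vector lives in memory, as in
;;
;;   short get_m2 (vector short *p) { return vec_extract (*p, 2); }
;;
;; there is no need to load all 16 bytes; rs6000_adjust_vec_address folds
;; the element offset into the address and a single scalar load is emitted.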
4091 ;; Variable V16QI/V8HI/V4SI extract from a register
4092 (define_insn_and_split "vsx_extract_<mode>_var"
4093 [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=r,r")
4095 [(match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v,v")
4096 (match_operand:DI 2 "gpc_reg_operand" "r,r")]
4097 UNSPEC_VSX_EXTRACT))
4098 (clobber (match_scratch:DI 3 "=r,r"))
4099 (clobber (match_scratch:V2DI 4 "=X,&v"))]
4100 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
4102 "&& reload_completed"
4105 rs6000_split_vec_extract_var (operands[0], operands[1], operands[2],
4106 operands[3], operands[4]);
4107 DONE;
4108 }
4109 [(set_attr "isa" "p9v,*")])
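;; Usage sketch for the variable-index form (assumed -mcpu=power8 or newer):
;;
;;   unsigned char get_dyn (vector unsigned char v, unsigned long i)
;;   {
;;     return vec_extract (v, i);
;;   }
;;
;; rs6000_split_vec_extract_var shifts the selected element into an
;; extractable position (or uses the ISA 3.0 vextu*lx/rx instructions when
;; they are available).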
4111 ;; Variable V16QI/V8HI/V4SI extract from memory
4112 (define_insn_and_split "*vsx_extract_<mode>_var_load"
4113 [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=r")
4115 [(match_operand:VSX_EXTRACT_I 1 "memory_operand" "Q")
4116 (match_operand:DI 2 "gpc_reg_operand" "r")]
4117 UNSPEC_VSX_EXTRACT))
4118 (clobber (match_scratch:DI 3 "=&b"))]
4119 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
4121 "&& reload_completed"
4122 [(set (match_dup 0) (match_dup 4))]
4124 operands[4] = rs6000_adjust_vec_address (operands[0], operands[1], operands[2],
4125 operands[3], <VEC_base>mode);
4127 [(set_attr "type" "load")])
4130 (define_expand "vextractl<mode>"
4131 [(set (match_operand:V2DI 0 "altivec_register_operand")
4132 (unspec:V2DI [(match_operand:VI2 1 "altivec_register_operand")
4133 (match_operand:VI2 2 "altivec_register_operand")
4134 (match_operand:SI 3 "register_operand")]
4137 {
4138 if (BYTES_BIG_ENDIAN)
4139 {
4140 emit_insn (gen_vextractl<mode>_internal (operands[0], operands[1],
4141 operands[2], operands[3]));
4142 emit_insn (gen_xxswapd_v2di (operands[0], operands[0]));
4143 }
4144 else
4145 emit_insn (gen_vextractr<mode>_internal (operands[0], operands[2],
4146 operands[1], operands[3]));
4147 DONE;
4148 })
4150 (define_insn "vextractl<mode>_internal"
4151 [(set (match_operand:V2DI 0 "altivec_register_operand" "=v")
4152 (unspec:V2DI [(match_operand:VEC_I 1 "altivec_register_operand" "v")
4153 (match_operand:VEC_I 2 "altivec_register_operand" "v")
4154 (match_operand:SI 3 "register_operand" "r")]
4157 "vext<du_or_d><wd>vlx %0,%1,%2,%3"
4158 [(set_attr "type" "vecsimple")])
4160 (define_expand "vextractr<mode>"
4161 [(set (match_operand:V2DI 0 "altivec_register_operand")
4162 (unspec:V2DI [(match_operand:VI2 1 "altivec_register_operand")
4163 (match_operand:VI2 2 "altivec_register_operand")
4164 (match_operand:SI 3 "register_operand")]
4167 {
4168 if (BYTES_BIG_ENDIAN)
4169 {
4170 emit_insn (gen_vextractr<mode>_internal (operands[0], operands[1],
4171 operands[2], operands[3]));
4172 emit_insn (gen_xxswapd_v2di (operands[0], operands[0]));
4173 }
4174 else
4175 emit_insn (gen_vextractl<mode>_internal (operands[0], operands[2],
4176 operands[1], operands[3]));
4177 DONE;
4178 })
4180 (define_insn "vextractr<mode>_internal"
4181 [(set (match_operand:V2DI 0 "altivec_register_operand" "=v")
4182 (unspec:V2DI [(match_operand:VEC_I 1 "altivec_register_operand" "v")
4183 (match_operand:VEC_I 2 "altivec_register_operand" "v")
4184 (match_operand:SI 3 "register_operand" "r")]
4187 "vext<du_or_d><wd>vrx %0,%1,%2,%3"
4188 [(set_attr "type" "vecsimple")])
4190 (define_expand "vinsertvl_<mode>"
4191 [(set (match_operand:VI2 0 "altivec_register_operand")
4192 (unspec:VI2 [(match_operand:VI2 1 "altivec_register_operand")
4193 (match_operand:VI2 2 "altivec_register_operand")
4194 (match_operand:SI 3 "register_operand" "r")]
4198 if (BYTES_BIG_ENDIAN)
4199 emit_insn (gen_vinsertvl_internal_<mode> (operands[0], operands[3],
4200 operands[1], operands[2]));
4201 else
4202 emit_insn (gen_vinsertvr_internal_<mode> (operands[0], operands[3],
4203 operands[1], operands[2]));
4204 DONE;
4205 })
4207 (define_insn "vinsertvl_internal_<mode>"
4208 [(set (match_operand:VEC_I 0 "altivec_register_operand" "=v")
4209 (unspec:VEC_I [(match_operand:SI 1 "register_operand" "r")
4210 (match_operand:VEC_I 2 "altivec_register_operand" "v")
4211 (match_operand:VEC_I 3 "altivec_register_operand" "0")]
4214 "vins<wd>vlx %0,%1,%2"
4215 [(set_attr "type" "vecsimple")])
4217 (define_expand "vinsertvr_<mode>"
4218 [(set (match_operand:VI2 0 "altivec_register_operand")
4219 (unspec:VI2 [(match_operand:VI2 1 "altivec_register_operand")
4220 (match_operand:VI2 2 "altivec_register_operand")
4221 (match_operand:SI 3 "register_operand" "r")]
4225 if (BYTES_BIG_ENDIAN)
4226 emit_insn (gen_vinsertvr_internal_<mode> (operands[0], operands[3],
4227 operands[1], operands[2]));
4228 else
4229 emit_insn (gen_vinsertvl_internal_<mode> (operands[0], operands[3],
4230 operands[1], operands[2]));
4231 DONE;
4232 })
4234 (define_insn "vinsertvr_internal_<mode>"
4235 [(set (match_operand:VEC_I 0 "altivec_register_operand" "=v")
4236 (unspec:VEC_I [(match_operand:SI 1 "register_operand" "r")
4237 (match_operand:VEC_I 2 "altivec_register_operand" "v")
4238 (match_operand:VEC_I 3 "altivec_register_operand" "0")]
4241 "vins<wd>vrx %0,%1,%2"
4242 [(set_attr "type" "vecsimple")])
4244 (define_expand "vinsertgl_<mode>"
4245 [(set (match_operand:VI2 0 "altivec_register_operand")
4246 (unspec:VI2 [(match_operand:SI 1 "register_operand")
4247 (match_operand:VI2 2 "altivec_register_operand")
4248 (match_operand:SI 3 "register_operand")]
4252 if (BYTES_BIG_ENDIAN)
4253 emit_insn (gen_vinsertgl_internal_<mode> (operands[0], operands[3],
4254 operands[1], operands[2]));
4255 else
4256 emit_insn (gen_vinsertgr_internal_<mode> (operands[0], operands[3],
4257 operands[1], operands[2]));
4258 DONE;
4259 })
4261 (define_insn "vinsertgl_internal_<mode>"
4262 [(set (match_operand:VEC_I 0 "altivec_register_operand" "=v")
4263 (unspec:VEC_I [(match_operand:SI 1 "register_operand" "r")
4264 (match_operand:SI 2 "register_operand" "r")
4265 (match_operand:VEC_I 3 "altivec_register_operand" "0")]
4268 "vins<wd>lx %0,%1,%2"
4269 [(set_attr "type" "vecsimple")])
4271 (define_expand "vinsertgr_<mode>"
4272 [(set (match_operand:VI2 0 "altivec_register_operand")
4273 (unspec:VI2 [(match_operand:SI 1 "register_operand")
4274 (match_operand:VI2 2 "altivec_register_operand")
4275 (match_operand:SI 3 "register_operand")]
4279 if (BYTES_BIG_ENDIAN)
4280 emit_insn (gen_vinsertgr_internal_<mode> (operands[0], operands[3],
4281 operands[1], operands[2]));
4282 else
4283 emit_insn (gen_vinsertgl_internal_<mode> (operands[0], operands[3],
4284 operands[1], operands[2]));
4285 DONE;
4286 })
4288 (define_insn "vinsertgr_internal_<mode>"
4289 [(set (match_operand:VEC_I 0 "altivec_register_operand" "=v")
4290 (unspec:VEC_I [(match_operand:SI 1 "register_operand" "r")
4291 (match_operand:SI 2 "register_operand" "r")
4292 (match_operand:VEC_I 3 "altivec_register_operand" "0")]
4295 "vins<wd>rx %0,%1,%2"
4296 [(set_attr "type" "vecsimple")])
4298 (define_expand "vreplace_elt_<mode>"
4299 [(set (match_operand:REPLACE_ELT_V 0 "register_operand")
4300 (unspec:REPLACE_ELT_V [(match_operand:REPLACE_ELT_V 1 "register_operand")
4301 (match_operand:<VEC_base> 2 "register_operand")
4302 (match_operand:QI 3 "const_0_to_3_operand")]
4303 UNSPEC_REPLACE_ELT))]
4307 /* Immediate value is the word index, convert to byte index and adjust for
4308 Endianness if needed. */
4309 if (BYTES_BIG_ENDIAN)
4310 index = INTVAL (operands[3]) << <REPLACE_ELT_sh>;
4312 else
4313 index = <REPLACE_ELT_max> - (INTVAL (operands[3]) << <REPLACE_ELT_sh>);
4315 emit_insn (gen_vreplace_elt_<mode>_inst (operands[0], operands[1],
4316 operands[2], GEN_INT (index)));
4317 DONE;
4318 }
4320 [(set_attr "type" "vecsimple")])
4322 (define_insn "vreplace_elt_<mode>_inst"
4323 [(set (match_operand:REPLACE_ELT_V 0 "register_operand" "=v")
4324 (unspec:REPLACE_ELT_V [(match_operand:REPLACE_ELT_V 1 "register_operand" "0")
4325 (match_operand:<VEC_base> 2 "register_operand" "r")
4326 (match_operand:QI 3 "const_0_to_12_operand" "n")]
4327 UNSPEC_REPLACE_ELT))]
4329 "vins<REPLACE_ELT_char> %0,%2,%3"
4330 [(set_attr "type" "vecsimple")])
4332 (define_insn "vreplace_un_<mode>"
4333 [(set (match_operand:V16QI 0 "register_operand" "=v")
4334 (unspec:V16QI [(match_operand:V16QI 1 "register_operand" "0")
4335 (match_operand:REPLACE_ELT 2 "register_operand" "r")
4336 (match_operand:QI 3 "const_0_to_12_operand" "n")]
4337 UNSPEC_REPLACE_UN))]
4339 "vins<REPLACE_ELT_char> %0,%2,%3"
4340 [(set_attr "type" "vecsimple")])
4342 ;; VSX_EXTRACT optimizations
4343 ;; Optimize double d = (double) vec_extract (vi, <n>)
4344 ;; Get the element into the top position and use XVCVSWDP/XVCVUWDP
4345 (define_insn_and_split "*vsx_extract_si_<uns>float_df"
4346 [(set (match_operand:DF 0 "gpc_reg_operand" "=wa")
4347 (any_float:DF
4348 (vec_select:SI
4349 (match_operand:V4SI 1 "gpc_reg_operand" "v")
4350 (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n")]))))
4351 (clobber (match_scratch:V4SI 3 "=v"))]
4352 "VECTOR_MEM_VSX_P (V4SImode) && TARGET_DIRECT_MOVE_64BIT"
4357 rtx dest = operands[0];
4358 rtx src = operands[1];
4359 rtx element = operands[2];
4360 rtx v4si_tmp = operands[3];
4363 /* Adjust the index for LE element ordering; the minuend 3 below is
4364 GET_MODE_NUNITS (V4SImode) - 1. */
4365 if (!BYTES_BIG_ENDIAN)
4366 element = GEN_INT (3 - INTVAL (element));
4368 /* If the value is in the correct position, we can avoid doing the VSPLT<x>
4369 instruction. */
4370 value = INTVAL (element);
4371 if (value != 0)
4372 {
4373 if (GET_CODE (v4si_tmp) == SCRATCH)
4374 v4si_tmp = gen_reg_rtx (V4SImode);
4375 emit_insn (gen_altivec_vspltw_direct (v4si_tmp, src, element));
4376 }
4377 else
4378 v4si_tmp = src;
4380 emit_insn (gen_vsx_xvcv<su>xwdp_df (dest, v4si_tmp));
4381 DONE;
4382 }
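;; A sketch of the source this combine pattern targets (not from the
;; original file):
;;
;;   double int_elt_to_df (vector int v)
;;   {
;;     return (double) vec_extract (v, 0);
;;   }
;;
;; Instead of moving the word to a GPR and back, the element is splatted to
;; the conversion slot and converted in place with xvcvsxwdp/xvcvuxwdp.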
4384 ;; Optimize <type> f = (<type>) vec_extract (vi, <n>)
4385 ;; where <type> is a floating point type supported by the hardware that is
4386 ;; not double. First convert the value to double, and then to the desired
4387 ;; type.
4388 (define_insn_and_split "*vsx_extract_si_<uns>float_<mode>"
4389 [(set (match_operand:VSX_EXTRACT_FL 0 "gpc_reg_operand" "=wa")
4390 (any_float:VSX_EXTRACT_FL
4391 (vec_select:SI
4392 (match_operand:V4SI 1 "gpc_reg_operand" "v")
4393 (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n")]))))
4394 (clobber (match_scratch:V4SI 3 "=v"))
4395 (clobber (match_scratch:DF 4 "=wa"))]
4396 "VECTOR_MEM_VSX_P (V4SImode) && TARGET_DIRECT_MOVE_64BIT"
4401 rtx dest = operands[0];
4402 rtx src = operands[1];
4403 rtx element = operands[2];
4404 rtx v4si_tmp = operands[3];
4405 rtx df_tmp = operands[4];
4408 /* Adjust the index for LE element ordering; the minuend 3 below is
4409 GET_MODE_NUNITS (V4SImode) - 1. */
4410 if (!BYTES_BIG_ENDIAN)
4411 element = GEN_INT (3 - INTVAL (element));
4413 /* If the value is in the correct position, we can avoid doing the VSPLT<x>
4414 instruction. */
4415 value = INTVAL (element);
4416 if (value != 0)
4417 {
4418 if (GET_CODE (v4si_tmp) == SCRATCH)
4419 v4si_tmp = gen_reg_rtx (V4SImode);
4420 emit_insn (gen_altivec_vspltw_direct (v4si_tmp, src, element));
4421 }
4422 else
4423 v4si_tmp = src;
4425 if (GET_CODE (df_tmp) == SCRATCH)
4426 df_tmp = gen_reg_rtx (DFmode);
4428 emit_insn (gen_vsx_xvcv<su>xwdp_df (df_tmp, v4si_tmp));
4430 if (<MODE>mode == SFmode)
4431 emit_insn (gen_truncdfsf2 (dest, df_tmp));
4432 else if (<MODE>mode == TFmode && FLOAT128_IBM_P (TFmode))
4433 emit_insn (gen_extenddftf2_vsx (dest, df_tmp));
4434 else if (<MODE>mode == TFmode && FLOAT128_IEEE_P (TFmode)
4435 && TARGET_FLOAT128_HW)
4436 emit_insn (gen_extenddftf2_hw (dest, df_tmp));
4437 else if (<MODE>mode == IFmode && FLOAT128_IBM_P (IFmode))
4438 emit_insn (gen_extenddfif2 (dest, df_tmp));
4439 else if (<MODE>mode == KFmode && TARGET_FLOAT128_HW)
4440 emit_insn (gen_extenddfkf2_hw (dest, df_tmp));
4441 else
4442 gcc_unreachable ();
4444 DONE;
4445 }
4447 ;; Optimize <ftype> f = (<ftype>) vec_extract (<vtype>, <n>)
4448 ;; where <ftype> is SFmode, DFmode (and KFmode/TFmode if those types are IEEE
4449 ;; 128-bit hardware types) and <vtype> is vector char, vector unsigned char,
4450 ;; vector short or vector unsigned short.
4451 (define_insn_and_split "*vsx_ext_<VSX_EXTRACT_I:VEC_base>_fl_<FL_CONV:mode>"
4452 [(set (match_operand:FL_CONV 0 "gpc_reg_operand" "=wa")
4454 (vec_select:<VSX_EXTRACT_I:VEC_base>
4455 (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v")
4456 (parallel [(match_operand:QI 2 "const_int_operand" "n")]))))
4457 (clobber (match_scratch:<VSX_EXTRACT_I:VEC_base> 3 "=v"))]
4458 "VECTOR_MEM_VSX_P (<VSX_EXTRACT_I:MODE>mode) && TARGET_DIRECT_MOVE_64BIT
4459 && TARGET_P9_VECTOR"
4461 "&& reload_completed"
4462 [(parallel [(set (match_dup 3)
4463 (vec_select:<VSX_EXTRACT_I:VEC_base>
4464 (match_dup 1)
4465 (parallel [(match_dup 2)])))
4466 (clobber (scratch:SI))])
4467 (set (match_dup 4)
4468 (sign_extend:DI (match_dup 3)))
4469 (set (match_dup 0)
4470 (float:<FL_CONV:MODE> (match_dup 4)))]
4472 operands[4] = gen_rtx_REG (DImode, REGNO (operands[3]));
4474 [(set_attr "isa" "<FL_CONV:VSisa>")])
4476 (define_insn_and_split "*vsx_ext_<VSX_EXTRACT_I:VEC_base>_ufl_<FL_CONV:mode>"
4477 [(set (match_operand:FL_CONV 0 "gpc_reg_operand" "=wa")
4478 (unsigned_float:FL_CONV
4479 (vec_select:<VSX_EXTRACT_I:VEC_base>
4480 (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v")
4481 (parallel [(match_operand:QI 2 "const_int_operand" "n")]))))
4482 (clobber (match_scratch:<VSX_EXTRACT_I:VEC_base> 3 "=v"))]
4483 "VECTOR_MEM_VSX_P (<VSX_EXTRACT_I:MODE>mode) && TARGET_DIRECT_MOVE_64BIT
4484 && TARGET_P9_VECTOR"
4486 "&& reload_completed"
4487 [(parallel [(set (match_dup 3)
4488 (vec_select:<VSX_EXTRACT_I:VEC_base>
4489 (match_dup 1)
4490 (parallel [(match_dup 2)])))
4491 (clobber (scratch:SI))])
4492 (set (match_dup 0)
4493 (float:<FL_CONV:MODE> (match_dup 4)))]
4495 operands[4] = gen_rtx_REG (DImode, REGNO (operands[3]));
4497 [(set_attr "isa" "<FL_CONV:VSisa>")])
4499 ;; V4SI/V8HI/V16QI set operation on ISA 3.0
4500 (define_insn "vsx_set_<mode>_p9"
4501 [(set (match_operand:VSX_EXTRACT_I 0 "gpc_reg_operand" "=<VSX_EX>")
4502 (unspec:VSX_EXTRACT_I
4503 [(match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "0")
4504 (match_operand:<VEC_base> 2 "gpc_reg_operand" "<VSX_EX>")
4505 (match_operand:QI 3 "<VSX_EXTRACT_PREDICATE>" "n")]
4507 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_P9_VECTOR && TARGET_POWERPC64"
4509 int ele = INTVAL (operands[3]);
4510 int nunits = GET_MODE_NUNITS (<MODE>mode);
4512 if (!BYTES_BIG_ENDIAN)
4513 ele = nunits - 1 - ele;
4515 operands[3] = GEN_INT (GET_MODE_SIZE (<VEC_base>mode) * ele);
4516 if (<MODE>mode == V4SImode)
4517 return "xxinsertw %x0,%x2,%3";
4519 return "vinsert<wd> %0,%2,%3";
4521 [(set_attr "type" "vecperm")])
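;; Illustrative operand arithmetic for the insn above (assumed little
;; endian, V4SImode, C element 1): ele = 4 - 1 - 1 = 2, so operands[3]
;; becomes 4 * 2 = 8, the byte offset in "xxinsertw %x0,%x2,8".  A typical
;; source sketch:
;;
;;   vector int set1 (vector int v, int x) { return vec_insert (x, v, 1); }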
4523 (define_insn_and_split "vsx_set_v4sf_p9"
4524 [(set (match_operand:V4SF 0 "gpc_reg_operand" "=wa")
4526 [(match_operand:V4SF 1 "gpc_reg_operand" "0")
4527 (match_operand:SF 2 "gpc_reg_operand" "wa")
4528 (match_operand:QI 3 "const_0_to_3_operand" "n")]
4530 (clobber (match_scratch:SI 4 "=&wa"))]
4531 "VECTOR_MEM_VSX_P (V4SFmode) && TARGET_P9_VECTOR && TARGET_POWERPC64"
4533 "&& reload_completed"
4535 (unspec:V4SF [(match_dup 2)]
4536 UNSPEC_VSX_CVDPSPN))
4537 (parallel [(set (match_dup 4)
4538 (vec_select:SI (match_dup 6)
4539 (parallel [(match_dup 7)])))
4540 (clobber (scratch:SI))])
4542 (unspec:V4SI [(match_dup 8)
4547 unsigned int tmp_regno = reg_or_subregno (operands[4]);
4549 operands[5] = gen_rtx_REG (V4SFmode, tmp_regno);
4550 operands[6] = gen_rtx_REG (V4SImode, tmp_regno);
4551 operands[7] = GEN_INT (BYTES_BIG_ENDIAN ? 0 : 3);
4552 operands[8] = gen_rtx_REG (V4SImode, reg_or_subregno (operands[0]));
4554 [(set_attr "type" "vecperm")
4555 (set_attr "length" "12")
4556 (set_attr "isa" "p9v")])
4558 ;; Special case setting 0.0f to a V4SF element
4559 (define_insn_and_split "*vsx_set_v4sf_p9_zero"
4560 [(set (match_operand:V4SF 0 "gpc_reg_operand" "=wa")
4562 [(match_operand:V4SF 1 "gpc_reg_operand" "0")
4563 (match_operand:SF 2 "zero_fp_constant" "j")
4564 (match_operand:QI 3 "const_0_to_3_operand" "n")]
4566 (clobber (match_scratch:SI 4 "=&wa"))]
4567 "VECTOR_MEM_VSX_P (V4SFmode) && TARGET_P9_VECTOR && TARGET_POWERPC64"
4569 "&& reload_completed"
4573 (unspec:V4SI [(match_dup 5)
4578 operands[5] = gen_rtx_REG (V4SImode, reg_or_subregno (operands[0]));
4580 [(set_attr "type" "vecperm")
4581 (set_attr "length" "8")
4582 (set_attr "isa" "p9v")])
4584 ;; Optimize x = vec_insert (vec_extract (v2, n), v1, m) if n is the element
4585 ;; that is in the default scalar position (1 for big endian, 2 for little
4586 ;; endian). We just need to do an xxinsertw since the element is in the
4587 ;; correct location.
4589 (define_insn "*vsx_insert_extract_v4sf_p9"
4590 [(set (match_operand:V4SF 0 "gpc_reg_operand" "=wa")
4592 [(match_operand:V4SF 1 "gpc_reg_operand" "0")
4593 (vec_select:SF (match_operand:V4SF 2 "gpc_reg_operand" "wa")
4595 [(match_operand:QI 3 "const_0_to_3_operand" "n")]))
4596 (match_operand:QI 4 "const_0_to_3_operand" "n")]
4598 "VECTOR_MEM_VSX_P (V4SFmode) && TARGET_P9_VECTOR && TARGET_POWERPC64
4599 && (INTVAL (operands[3]) == (BYTES_BIG_ENDIAN ? 1 : 2))"
4601 int ele = INTVAL (operands[4]);
4603 /* Adjust the index for LE element ordering; the minuend 3 below is
4604 GET_MODE_NUNITS (V4SFmode) - 1. */
4605 if (!BYTES_BIG_ENDIAN)
4606 ele = 3 - ele;
4608 operands[4] = GEN_INT (GET_MODE_SIZE (SFmode) * ele);
4609 return "xxinsertw %x0,%x2,%4";
4611 [(set_attr "type" "vecperm")])
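;; A hedged example of the combination matched above (assuming little
;; endian, where the no-op extract position is element 2):
;;
;;   vector float move_elt (vector float a, vector float b)
;;   {
;;     return vec_insert (vec_extract (b, 2), a, 0);
;;   }
;;
;; The SF value already sits in the scalar slot, so one xxinsertw suffices
;; and no xscvspdpn/xscvdpspn round trip is emitted.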
4613 ;; Optimize x = vec_insert (vec_extract (v2, n), v1, m) if n is not the element
4614 ;; that is in the default scalar position (1 for big endian, 2 for little
4615 ;; endian). Convert the insert/extract to int and avoid doing the conversion.
4617 (define_insn_and_split "*vsx_insert_extract_v4sf_p9_2"
4618 [(set (match_operand:V4SF 0 "gpc_reg_operand" "=wa")
4620 [(match_operand:V4SF 1 "gpc_reg_operand" "0")
4621 (vec_select:SF (match_operand:V4SF 2 "gpc_reg_operand" "wa")
4623 [(match_operand:QI 3 "const_0_to_3_operand" "n")]))
4624 (match_operand:QI 4 "const_0_to_3_operand" "n")]
4626 (clobber (match_scratch:SI 5 "=&wa"))]
4627 "VECTOR_MEM_VSX_P (V4SFmode) && VECTOR_MEM_VSX_P (V4SImode)
4628 && TARGET_P9_VECTOR && TARGET_POWERPC64
4629 && (INTVAL (operands[3]) != (BYTES_BIG_ENDIAN ? 1 : 2))"
4632 [(parallel [(set (match_dup 5)
4633 (vec_select:SI (match_dup 6)
4634 (parallel [(match_dup 3)])))
4635 (clobber (scratch:SI))])
4637 (unspec:V4SI [(match_dup 8)
4642 if (GET_CODE (operands[5]) == SCRATCH)
4643 operands[5] = gen_reg_rtx (SImode);
4645 operands[6] = gen_lowpart (V4SImode, operands[2]);
4646 operands[7] = gen_lowpart (V4SImode, operands[0]);
4647 operands[8] = gen_lowpart (V4SImode, operands[1]);
4649 [(set_attr "type" "vecperm")
4650 (set_attr "isa" "p9v")])
4652 ;; Expanders for builtins
4653 (define_expand "vsx_mergel_<mode>"
4654 [(use (match_operand:VSX_D 0 "vsx_register_operand"))
4655 (use (match_operand:VSX_D 1 "vsx_register_operand"))
4656 (use (match_operand:VSX_D 2 "vsx_register_operand"))]
4657 "VECTOR_MEM_VSX_P (<MODE>mode)"
4659 rtvec v = gen_rtvec (2, GEN_INT (1), GEN_INT (3));
4660 rtx x = gen_rtx_VEC_CONCAT (<VS_double>mode, operands[1], operands[2]);
4661 x = gen_rtx_VEC_SELECT (<MODE>mode, x, gen_rtx_PARALLEL (VOIDmode, v));
4662 emit_insn (gen_rtx_SET (operands[0], x));
4663 DONE;
4664 })
4666 (define_expand "vsx_mergeh_<mode>"
4667 [(use (match_operand:VSX_D 0 "vsx_register_operand"))
4668 (use (match_operand:VSX_D 1 "vsx_register_operand"))
4669 (use (match_operand:VSX_D 2 "vsx_register_operand"))]
4670 "VECTOR_MEM_VSX_P (<MODE>mode)"
4672 rtvec v = gen_rtvec (2, GEN_INT (0), GEN_INT (2));
4673 rtx x = gen_rtx_VEC_CONCAT (<VS_double>mode, operands[1], operands[2]);
4674 x = gen_rtx_VEC_SELECT (<MODE>mode, x, gen_rtx_PARALLEL (VOIDmode, v));
4675 emit_insn (gen_rtx_SET (operands[0], x));
4676 DONE;
4677 })
4680 ;; We separate the register splat insn from the memory splat insn to force the
4681 ;; register allocator to generate the indexed form of the SPLAT when it is
4682 ;; given an offsettable memory reference. Otherwise, if the register and
4683 ;; memory insns were combined into a single insn, the register allocator will
4684 ;; load the value into a register, and then do a double word permute.
4685 (define_expand "vsx_splat_<mode>"
4686 [(set (match_operand:VSX_D 0 "vsx_register_operand")
4687 (vec_duplicate:VSX_D
4688 (match_operand:<VEC_base> 1 "input_operand")))]
4689 "VECTOR_MEM_VSX_P (<MODE>mode)"
4691 rtx op1 = operands[1];
4692 if (MEM_P (op1))
4693 operands[1] = rs6000_force_indexed_or_indirect_mem (op1);
4694 else if (!REG_P (op1))
4695 operands[1] = force_reg (<VSX_D:VEC_base>mode, op1);
4696 })
4698 (define_insn "vsx_splat_<mode>_reg"
4699 [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa,we")
4700 (vec_duplicate:VSX_D
4701 (match_operand:<VEC_base> 1 "gpc_reg_operand" "wa,b")))]
4702 "VECTOR_MEM_VSX_P (<MODE>mode)"
4703 "@
4704 xxpermdi %x0,%x1,%x1,0
4705 mtvsrdd %x0,%1,%1"
4706 [(set_attr "type" "vecperm,vecmove")])
4708 (define_insn "vsx_splat_<mode>_mem"
4709 [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
4710 (vec_duplicate:VSX_D
4711 (match_operand:<VSX_D:VEC_base> 1 "memory_operand" "Z")))]
4712 "VECTOR_MEM_VSX_P (<MODE>mode)"
4714 [(set_attr "type" "vecload")])
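;; Sketch of the two splat flavors (hypothetical source, VSX assumed):
;;
;;   vector double splat_r (double x)  { return vec_splats (x); }
;;   vector double splat_m (double *p) { return vec_splats (*p); }
;;
;; The register form becomes xxpermdi (or mtvsrdd), while keeping the memory
;; form separate lets the allocator use the indexed load-and-splat lxvdsx
;; instead of a load followed by a doubleword permute.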
4716 ;; V4SI splat support
4717 (define_insn "vsx_splat_v4si"
4718 [(set (match_operand:V4SI 0 "vsx_register_operand" "=wa,wa")
4719 (vec_duplicate:V4SI
4720 (match_operand:SI 1 "splat_input_operand" "r,Z")))]
4721 "TARGET_P9_VECTOR"
4722 "@
4723 mtvsrws %x0,%1
4724 lxvwsx %x0,%y1"
4725 [(set_attr "type" "vecperm,vecload")])
4727 ;; SImode is not currently allowed in vector registers. This pattern
4728 ;; allows us to use direct move to get the value in a vector register
4729 ;; so that we can use XXSPLTW
4730 (define_insn "vsx_splat_v4si_di"
4731 [(set (match_operand:V4SI 0 "vsx_register_operand" "=wa,we")
4732 (vec_duplicate:V4SI
4733 (truncate:SI
4734 (match_operand:DI 1 "gpc_reg_operand" "wa,r"))))]
4735 "VECTOR_MEM_VSX_P (V4SImode) && TARGET_DIRECT_MOVE_64BIT"
4736 "@
4737 xxspltw %x0,%x1,1
4738 mtvsrws %x0,%1"
4739 [(set_attr "type" "vecperm")
4740 (set_attr "isa" "p8v,*")])
4742 ;; V4SF splat (ISA 3.0)
4743 (define_insn_and_split "vsx_splat_v4sf"
4744 [(set (match_operand:V4SF 0 "vsx_register_operand" "=wa,wa,wa")
4745 (vec_duplicate:V4SF
4746 (match_operand:SF 1 "splat_input_operand" "Z,wa,r")))]
4747 "TARGET_P9_VECTOR"
4748 "@
4749 lxvwsx %x0,%y1
4750 #
4751 mtvsrws %x0,%1"
4752 "&& reload_completed && vsx_register_operand (operands[1], SFmode)"
4753 [(set (match_dup 0)
4754 (unspec:V4SF [(match_dup 1)] UNSPEC_VSX_CVDPSPN))
4755 (set (match_dup 0)
4756 (unspec:V4SF [(match_dup 0)
4757 (const_int 0)] UNSPEC_VSX_XXSPLTW))]
4759 [(set_attr "type" "vecload,vecperm,vecperm")
4760 (set_attr "length" "*,8,*")
4761 (set_attr "isa" "*,p8v,*")])
4763 ;; V4SF/V4SI splat from a vector element
4764 (define_insn "vsx_xxspltw_<mode>"
4765 [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
4766 (vec_duplicate:VSX_W
4767 (vec_select:<VEC_base>
4768 (match_operand:VSX_W 1 "vsx_register_operand" "wa")
4770 [(match_operand:QI 2 "u5bit_cint_operand" "n")]))))]
4771 "VECTOR_MEM_VSX_P (<MODE>mode)"
4773 if (!BYTES_BIG_ENDIAN)
4774 operands[2] = GEN_INT (3 - INTVAL (operands[2]));
4776 return "xxspltw %x0,%x1,%2";
4778 [(set_attr "type" "vecperm")])
4780 (define_insn "vsx_xxspltw_<mode>_direct"
4781 [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
4782 (unspec:VSX_W [(match_operand:VSX_W 1 "vsx_register_operand" "wa")
4783 (match_operand:QI 2 "u5bit_cint_operand" "i")]
4784 UNSPEC_VSX_XXSPLTW))]
4785 "VECTOR_MEM_VSX_P (<MODE>mode)"
4786 "xxspltw %x0,%x1,%2"
4787 [(set_attr "type" "vecperm")])
4789 ;; V16QI/V8HI splat support on ISA 2.07
4790 (define_insn "vsx_vsplt<VSX_SPLAT_SUFFIX>_di"
4791 [(set (match_operand:VSX_SPLAT_I 0 "altivec_register_operand" "=v")
4792 (vec_duplicate:VSX_SPLAT_I
4793 (truncate:<VEC_base>
4794 (match_operand:DI 1 "altivec_register_operand" "v"))))]
4795 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
4796 "vsplt<VSX_SPLAT_SUFFIX> %0,%1,<VSX_SPLAT_COUNT>"
4797 [(set_attr "type" "vecperm")])
4799 ;; V2DF/V2DI splat for use by vec_splat builtin
4800 (define_insn "vsx_xxspltd_<mode>"
4801 [(set (match_operand:VSX_D 0 "vsx_register_operand" "=wa")
4802 (unspec:VSX_D [(match_operand:VSX_D 1 "vsx_register_operand" "wa")
4803 (match_operand:QI 2 "u5bit_cint_operand" "i")]
4804 UNSPEC_VSX_XXSPLTD))]
4805 "VECTOR_MEM_VSX_P (<MODE>mode)"
4807 if ((BYTES_BIG_ENDIAN && INTVAL (operands[2]) == 0)
4808 || (!BYTES_BIG_ENDIAN && INTVAL (operands[2]) == 1))
4809 return "xxpermdi %x0,%x1,%x1,0";
4810 else
4811 return "xxpermdi %x0,%x1,%x1,3";
4813 [(set_attr "type" "vecperm")])
4815 ;; V4SF/V4SI interleave
4816 (define_expand "vsx_xxmrghw_<mode>"
4817 [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
4819 (vec_concat:<VS_double>
4820 (match_operand:VSX_W 1 "vsx_register_operand" "wa")
4821 (match_operand:VSX_W 2 "vsx_register_operand" "wa"))
4822 (parallel [(const_int 0) (const_int 4)
4823 (const_int 1) (const_int 5)])))]
4824 "VECTOR_MEM_VSX_P (<MODE>mode)"
4826 if (BYTES_BIG_ENDIAN)
4827 emit_insn (gen_altivec_vmrghw_direct_v4si_be (operands[0],
4828 operands[1],
4829 operands[2]));
4830 else
4831 emit_insn (gen_altivec_vmrglw_direct_v4si_le (operands[0],
4832 operands[2],
4833 operands[1]));
4834 DONE;
4835 }
4836 [(set_attr "type" "vecperm")])
4838 (define_expand "vsx_xxmrglw_<mode>"
4839 [(set (match_operand:VSX_W 0 "vsx_register_operand" "=wa")
4841 (vec_concat:<VS_double>
4842 (match_operand:VSX_W 1 "vsx_register_operand" "wa")
4843 (match_operand:VSX_W 2 "vsx_register_operand" "wa"))
4844 (parallel [(const_int 2) (const_int 6)
4845 (const_int 3) (const_int 7)])))]
4846 "VECTOR_MEM_VSX_P (<MODE>mode)"
4848 if (BYTES_BIG_ENDIAN)
4849 emit_insn (gen_altivec_vmrglw_direct_v4si_be (operands[0],
4850 operands[1],
4851 operands[2]));
4852 else
4853 emit_insn (gen_altivec_vmrghw_direct_v4si_le (operands[0],
4854 operands[2],
4855 operands[1]));
4856 DONE;
4857 }
4858 [(set_attr "type" "vecperm")])
4860 ;; Shift left double by word immediate
4861 (define_insn "vsx_xxsldwi_<mode>"
4862 [(set (match_operand:VSX_L 0 "vsx_register_operand" "=wa")
4863 (unspec:VSX_L [(match_operand:VSX_L 1 "vsx_register_operand" "wa")
4864 (match_operand:VSX_L 2 "vsx_register_operand" "wa")
4865 (match_operand:QI 3 "u5bit_cint_operand" "i")]
4867 "VECTOR_MEM_VSX_P (<MODE>mode)"
4868 "xxsldwi %x0,%x1,%x2,%3"
4869 [(set_attr "type" "vecperm")
4870 (set_attr "isa" "<VSisa>")])
4873 ;; Vector reduction insns and splitters
4875 (define_insn_and_split "vsx_reduc_<VEC_reduc_name>_v2df"
4876 [(set (match_operand:V2DF 0 "vfloat_operand" "=&wa,wa")
4880 (match_operand:V2DF 1 "vfloat_operand" "wa,wa")
4881 (parallel [(const_int 1)]))
4884 (parallel [(const_int 0)])))
4886 (clobber (match_scratch:V2DF 2 "=0,&wa"))]
4887 "VECTOR_UNIT_VSX_P (V2DFmode)"
4892 rtx tmp = (GET_CODE (operands[2]) == SCRATCH)
4893 ? gen_reg_rtx (V2DFmode)
4895 emit_insn (gen_vsx_xxsldwi_v2df (tmp, operands[1], operands[1], const2_rtx));
4896 emit_insn (gen_<VEC_reduc_rtx>v2df3 (operands[0], tmp, operands[1]));
4899 [(set_attr "length" "8")
4900 (set_attr "type" "veccomplex")])
4902 (define_insn_and_split "vsx_reduc_<VEC_reduc_name>_v4sf"
4903 [(set (match_operand:V4SF 0 "vfloat_operand" "=wa")
4905 (unspec:V4SF [(const_int 0)] UNSPEC_REDUC)
4906 (match_operand:V4SF 1 "vfloat_operand" "wa")))
4907 (clobber (match_scratch:V4SF 2 "=&wa"))
4908 (clobber (match_scratch:V4SF 3 "=&wa"))]
4909 "VECTOR_UNIT_VSX_P (V4SFmode)"
4914 rtx op0 = operands[0];
4915 rtx op1 = operands[1];
4916 rtx tmp2, tmp3, tmp4;
4918 if (can_create_pseudo_p ())
4920 tmp2 = gen_reg_rtx (V4SFmode);
4921 tmp3 = gen_reg_rtx (V4SFmode);
4922 tmp4 = gen_reg_rtx (V4SFmode);
4931 emit_insn (gen_vsx_xxsldwi_v4sf (tmp2, op1, op1, const2_rtx));
4932 emit_insn (gen_<VEC_reduc_rtx>v4sf3 (tmp3, tmp2, op1));
4933 emit_insn (gen_vsx_xxsldwi_v4sf (tmp4, tmp3, tmp3, GEN_INT (3)));
4934 emit_insn (gen_<VEC_reduc_rtx>v4sf3 (op0, tmp4, tmp3));
4937 [(set_attr "length" "16")
4938 (set_attr "type" "veccomplex")])
4940 ;; Combiner patterns with the vector reduction patterns that knows we can get
4941 ;; to the top element of the V2DF array without doing an extract.
4943 (define_insn_and_split "*vsx_reduc_<VEC_reduc_name>_v2df_scalar"
4944 [(set (match_operand:DF 0 "vfloat_operand" "=&wa,wa")
4949 (match_operand:V2DF 1 "vfloat_operand" "wa,wa")
4950 (parallel [(const_int 1)]))
4953 (parallel [(const_int 0)])))
4955 (parallel [(const_int 1)])))
4956 (clobber (match_scratch:DF 2 "=0,&wa"))]
4957 "BYTES_BIG_ENDIAN && VECTOR_UNIT_VSX_P (V2DFmode)"
4962 rtx hi = gen_highpart (DFmode, operands[1]);
4963 rtx lo = (GET_CODE (operands[2]) == SCRATCH)
4964 ? gen_reg_rtx (DFmode)
4967 emit_insn (gen_vsx_extract_v2df (lo, operands[1], const1_rtx));
4968 emit_insn (gen_<VEC_reduc_rtx>df3 (operands[0], hi, lo));
4971 [(set_attr "length" "8")
4972 (set_attr "type" "veccomplex")])
4974 (define_insn_and_split "*vsx_reduc_<VEC_reduc_name>_v4sf_scalar"
4975 [(set (match_operand:SF 0 "vfloat_operand" "=f")
4978 (unspec:V4SF [(const_int 0)] UNSPEC_REDUC)
4979 (match_operand:V4SF 1 "vfloat_operand" "wa"))
4980 (parallel [(const_int 3)])))
4981 (clobber (match_scratch:V4SF 2 "=&wa"))
4982 (clobber (match_scratch:V4SF 3 "=&wa"))
4983 (clobber (match_scratch:V4SF 4 "=0"))]
4984 "BYTES_BIG_ENDIAN && VECTOR_UNIT_VSX_P (V4SFmode)"
4989 rtx op0 = operands[0];
4990 rtx op1 = operands[1];
4991 rtx tmp2, tmp3, tmp4, tmp5;
4993 if (can_create_pseudo_p ())
4995 tmp2 = gen_reg_rtx (V4SFmode);
4996 tmp3 = gen_reg_rtx (V4SFmode);
4997 tmp4 = gen_reg_rtx (V4SFmode);
4998 tmp5 = gen_reg_rtx (V4SFmode);
5008 emit_insn (gen_vsx_xxsldwi_v4sf (tmp2, op1, op1, const2_rtx));
5009 emit_insn (gen_<VEC_reduc_rtx>v4sf3 (tmp3, tmp2, op1));
5010 emit_insn (gen_vsx_xxsldwi_v4sf (tmp4, tmp3, tmp3, GEN_INT (3)));
5011 emit_insn (gen_<VEC_reduc_rtx>v4sf3 (tmp5, tmp4, tmp3));
5012 emit_insn (gen_vsx_xscvspdp_scalar2 (op0, tmp5));
5015 [(set_attr "length" "20")
5016 (set_attr "type" "veccomplex")])
5019 ;; Power8 Vector fusion. The fused ops must be physically adjacent.
5021 [(set (match_operand:P 0 "base_reg_operand")
5022 (match_operand:P 1 "short_cint_operand"))
5023 (set (match_operand:VSX_M 2 "vsx_register_operand")
5024 (mem:VSX_M (plus:P (match_dup 0)
5025 (match_operand:P 3 "int_reg_operand"))))]
5026 "TARGET_VSX && TARGET_P8_FUSION && !TARGET_P9_VECTOR"
5027 "li %0,%1\;lx<VSX_M:VSm>x %x2,%0,%3\t\t\t# vector load fusion"
5028 [(set_attr "length" "8")
5029 (set_attr "type" "vecload")])
5032 [(set (match_operand:P 0 "base_reg_operand")
5033 (match_operand:P 1 "short_cint_operand"))
5034 (set (match_operand:VSX_M 2 "vsx_register_operand")
5035 (mem:VSX_M (plus:P (match_operand:P 3 "int_reg_operand")
5037 "TARGET_VSX && TARGET_P8_FUSION && !TARGET_P9_VECTOR"
5038 "li %0,%1\;lx<VSX_M:VSm>x %x2,%0,%3\t\t\t# vector load fusion"
5039 [(set_attr "length" "8")
5040 (set_attr "type" "vecload")])
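;; Illustrative fused sequence (assumed output, not taken from a compiler
;; run): the peepholes above keep the constant materialization and the
;; indexed load adjacent, e.g.
;;
;;   li r10,16
;;   lxvd2x vs34,r10,r9      # vector load fusion
;;
;; so the Power8 front end can fuse the pair.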
5043 ;; ISA 3.1 vector extend sign support
5044 (define_insn "vsx_sign_extend_v2di_v1ti"
5045 [(set (match_operand:V1TI 0 "vsx_register_operand" "=v")
5046 (unspec:V1TI [(match_operand:V2DI 1 "vsx_register_operand" "v")]
5047 UNSPEC_VSX_SIGN_EXTEND))]
5048 "TARGET_POWER10"
5049 "vextsd2q %0,%1"
5050 [(set_attr "type" "vecexts")])
5052 ;; ISA 3.0 vector extend sign support
5054 (define_insn "vsx_sign_extend_v16qi_<mode>"
5055 [(set (match_operand:VSINT_84 0 "vsx_register_operand" "=v")
5056 (unspec:VSINT_84
5057 [(match_operand:V16QI 1 "vsx_register_operand" "v")]
5058 UNSPEC_VSX_SIGN_EXTEND))]
5059 "TARGET_P9_VECTOR"
5060 "vextsb2<wd> %0,%1"
5061 [(set_attr "type" "vecexts")])
5063 (define_insn "vsx_sign_extend_v8hi_<mode>"
5064 [(set (match_operand:VSINT_84 0 "vsx_register_operand" "=v")
5065 (unspec:VSINT_84
5066 [(match_operand:V8HI 1 "vsx_register_operand" "v")]
5067 UNSPEC_VSX_SIGN_EXTEND))]
5068 "TARGET_P9_VECTOR"
5069 "vextsh2<wd> %0,%1"
5070 [(set_attr "type" "vecexts")])
5072 (define_insn "vsx_sign_extend_v4si_v2di"
5073 [(set (match_operand:V2DI 0 "vsx_register_operand" "=v")
5074 (unspec:V2DI [(match_operand:V4SI 1 "vsx_register_operand" "v")]
5075 UNSPEC_VSX_SIGN_EXTEND))]
5076 "TARGET_P9_VECTOR"
5077 "vextsw2d %0,%1"
5078 [(set_attr "type" "vecexts")])
5080 ;; Sign extend DI to TI. We provide both GPR targets and Altivec targets on
5081 ;; power10. On earlier systems, the machine independent code will generate an
5082 ;; arithmetic shift right to sign extend the 64-bit value to 128-bit.
5084 ;; If the register allocator prefers to use GPR registers, we will use an
5085 ;; arithmetic shift right (sradi) to sign extend the 64-bit value to 128-bit.
5087 ;; If the register allocator prefers to use Altivec registers on power10,
5088 ;; generate the vextsd2q instruction.
5089 (define_insn_and_split "extendditi2"
5090 [(set (match_operand:TI 0 "register_operand" "=r,r,v,v,v")
5091 (sign_extend:TI (match_operand:DI 1 "input_operand" "r,m,b,wa,Z")))
5092 (clobber (reg:DI CA_REGNO))]
5093 "TARGET_POWERPC64 && TARGET_POWER10"
5095 "&& reload_completed"
5098 rtx dest = operands[0];
5099 rtx src = operands[1];
5100 int dest_regno = reg_or_subregno (dest);
5102 /* Handle conversion to GPR registers. Load up the low part and then do
5103 a sign extension to the upper part. */
5104 if (INT_REGNO_P (dest_regno))
5105 {
5106 rtx dest_hi = gen_highpart (DImode, dest);
5107 rtx dest_lo = gen_lowpart (DImode, dest);
5109 emit_move_insn (dest_lo, src);
5110 /* In case src is a MEM, we have to use the destination, which is a
5111 register, instead of re-using the source. */
5112 rtx src2 = (REG_P (src) || SUBREG_P (src)) ? src : dest_lo;
5113 emit_insn (gen_ashrdi3 (dest_hi, src2, GEN_INT (63)));
5114 DONE;
5115 }
5117 /* For conversion to an Altivec register, generate either a splat operation
5118 or a load rightmost double word instruction. Both instructions get the
5119 DImode value into the lower 64 bits, and then do the vextsd2q
5120 instruction. */
5122 else if (ALTIVEC_REGNO_P (dest_regno))
5123 {
5124 if (MEM_P (src))
5125 emit_insn (gen_vsx_lxvrdx (dest, src));
5126 else
5127 {
5128 rtx dest_v2di = gen_rtx_REG (V2DImode, dest_regno);
5129 emit_insn (gen_vsx_splat_v2di (dest_v2di, src));
5130 }
5132 emit_insn (gen_extendditi2_vector (dest, dest));
5133 DONE;
5134 }
5136 else
5137 gcc_unreachable ();
5138 }
5139 [(set_attr "length" "8")
5140 (set_attr "type" "shift,load,vecmove,vecperm,load")])
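;; A sketch covering both register placements (hypothetical source,
;; -mcpu=power10):
;;
;;   __int128 widen (long x) { return x; }
;;
;; In GPRs this becomes a low-part copy plus sradi 63 to manufacture the
;; sign bits; in an Altivec register the value is splatted or loaded into
;; the low doubleword and vextsd2q completes the extension.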
5142 ;; Sign extend 64-bit value in TI reg, word 1, to 128-bit value in TI reg
5143 (define_insn "extendditi2_vector"
5144 [(set (match_operand:TI 0 "gpc_reg_operand" "=v")
5145 (unspec:TI [(match_operand:TI 1 "gpc_reg_operand" "v")]
5146 UNSPEC_EXTENDDITI2))]
5149 [(set_attr "type" "vecexts")])
5152 ;; ISA 3.0 Binary Floating-Point Support
5154 ;; VSX Scalar Extract Exponent Quad-Precision
5155 (define_insn "xsxexpqp_<IEEE128:mode>_<V2DI_DI:mode>"
5156 [(set (match_operand:V2DI_DI 0 "altivec_register_operand" "=v")
5157 (unspec:V2DI_DI
5158 [(match_operand:IEEE128 1 "altivec_register_operand" "v")]
5159 UNSPEC_VSX_SXEXPDP))]
5160 "TARGET_P9_VECTOR"
5161 "xsxexpqp %0,%1"
5162 [(set_attr "type" "vecmove")])
5164 ;; VSX Scalar Extract Exponent Double-Precision
5165 (define_insn "xsxexpdp_<mode>"
5166 [(set (match_operand:GPR 0 "register_operand" "=r")
5167 (unspec:GPR [(match_operand:DF 1 "vsx_register_operand" "wa")]
5168 UNSPEC_VSX_SXEXPDP))]
5171 [(set_attr "type" "integer")])
5173 ;; VSX Scalar Extract Significand Quad-Precision
5174 (define_insn "xsxsigqp_<IEEE128:mode>_<VEC_TI:mode>"
5175 [(set (match_operand:VEC_TI 0 "altivec_register_operand" "=v")
5176 (unspec:VEC_TI [(match_operand:IEEE128 1
5177 "altivec_register_operand" "v")]
5181 [(set_attr "type" "vecmove")])
5183 ;; VSX Scalar Extract Significand Double-Precision
5184 (define_insn "xsxsigdp"
5185 [(set (match_operand:DI 0 "register_operand" "=r")
5186 (unspec:DI [(match_operand:DF 1 "vsx_register_operand" "wa")]
5188 "TARGET_P9_VECTOR && TARGET_POWERPC64"
5190 [(set_attr "type" "integer")])
5192 ;; VSX Scalar Insert Exponent Quad-Precision Floating Point Argument
5193 (define_insn "xsiexpqpf_<mode>"
5194 [(set (match_operand:IEEE128 0 "altivec_register_operand" "=v")
5196 [(match_operand:IEEE128 1 "altivec_register_operand" "v")
5197 (match_operand:DI 2 "altivec_register_operand" "v")]
5198 UNSPEC_VSX_SIEXPQP))]
5201 [(set_attr "type" "vecmove")])
5203 ;; VSX Scalar Insert Exponent Quad-Precision
5204 (define_insn "xsiexpqp_<IEEE128:mode>_<V2DI_DI:mode>"
5205 [(set (match_operand:IEEE128 0 "altivec_register_operand" "=v")
5206 (unspec:IEEE128 [(match_operand:<DI_to_TI> 1
5207 "altivec_register_operand" "v")
5208 (match_operand:V2DI_DI 2
5209 "altivec_register_operand" "v")]
5210 UNSPEC_VSX_SIEXPQP))]
5213 [(set_attr "type" "vecmove")])
5215 ;; VSX Scalar Insert Exponent Double-Precision
5216 (define_insn "xsiexpdp_<mode>"
5217 [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
5218 (unspec:DF [(match_operand:DI 1 "register_operand" "r")
5219 (match_operand:GPR 2 "register_operand" "r")]
5220 UNSPEC_VSX_SIEXPDP))]
5221 "TARGET_P9_VECTOR && TARGET_POWERPC64"
5222 "xsiexpdp %x0,%1,%2"
5223 [(set_attr "type" "fpsimple")])
5225 ;; VSX Scalar Insert Exponent Double-Precision Floating Point Argument
5226 (define_insn "xsiexpdpf_<mode>"
5227 [(set (match_operand:DF 0 "vsx_register_operand" "=wa")
5228 (unspec:DF [(match_operand:DF 1 "register_operand" "r")
5229 (match_operand:GPR 2 "register_operand" "r")]
5230 UNSPEC_VSX_SIEXPDP))]
5231 "TARGET_P9_VECTOR && TARGET_POWERPC64"
5232 "xsiexpdp %x0,%1,%2"
5233 [(set_attr "type" "fpsimple")])
5235 ;; VSX Scalar Compare Exponents Double-Precision
5236 (define_expand "xscmpexpdp_<code>"
5240 [(match_operand:DF 1 "vsx_register_operand" "wa")
5241 (match_operand:DF 2 "vsx_register_operand" "wa")]
5242 UNSPEC_VSX_SCMPEXPDP)
5244 (set (match_operand:SI 0 "register_operand" "=r")
5245 (CMP_TEST:SI (match_dup 3)
5249 if (<CODE> == UNORDERED && !HONOR_NANS (DFmode))
5251 emit_move_insn (operands[0], const0_rtx);
5255 operands[3] = gen_reg_rtx (CCFPmode);
5258 (define_insn "*xscmpexpdp"
5259 [(set (match_operand:CCFP 0 "cc_reg_operand" "=y")
5261 (unspec:DF [(match_operand:DF 1 "vsx_register_operand" "wa")
5262 (match_operand:DF 2 "vsx_register_operand" "wa")]
5263 UNSPEC_VSX_SCMPEXPDP)
5264 (match_operand:SI 3 "zero_constant" "j")))]
5265 "TARGET_P9_VECTOR"
5266 "xscmpexpdp %0,%x1,%x2"
5267 [(set_attr "type" "fpcompare")])
5269 ;; VSX Scalar Compare Exponents Quad-Precision
5270 (define_expand "xscmpexpqp_<code>_<mode>"
5274 [(match_operand:IEEE128 1 "vsx_register_operand" "v")
5275 (match_operand:IEEE128 2 "vsx_register_operand" "v")]
5276 UNSPEC_VSX_SCMPEXPQP)
5278 (set (match_operand:SI 0 "register_operand" "=r")
5279 (CMP_TEST:SI (match_dup 3)
5283 if (<CODE> == UNORDERED && !HONOR_NANS (<MODE>mode))
5285 emit_move_insn (operands[0], const0_rtx);
5289 operands[3] = gen_reg_rtx (CCFPmode);
5292 (define_insn "*xscmpexpqp"
5293 [(set (match_operand:CCFP 0 "cc_reg_operand" "=y")
5295 (unspec:IEEE128 [(match_operand:IEEE128 1 "altivec_register_operand" "v")
5296 (match_operand:IEEE128 2 "altivec_register_operand" "v")]
5297 UNSPEC_VSX_SCMPEXPQP)
5298 (match_operand:SI 3 "zero_constant" "j")))]
5299 "TARGET_P9_VECTOR"
5300 "xscmpexpqp %0,%1,%2"
5301 [(set_attr "type" "fpcompare")])
5303 ;; VSX Scalar Test Data Class Quad-Precision
5304 ;; (Expansion for scalar_test_data_class (__ieee128, int))
5305 ;; (Has side effect of setting the lt bit if operand 1 is negative,
5306 ;; setting the eq bit if any of the conditions tested by operand 2
5307 ;; are satisfied, and clearing the gt and unordered bits to zero.)
5308 (define_expand "xststdcqp_<mode>"
5312 [(match_operand:IEEE128 1 "altivec_register_operand" "v")
5313 (match_operand:SI 2 "u7bit_cint_operand" "n")]
5316 (set (match_operand:SI 0 "register_operand" "=r")
5317 (eq:SI (match_dup 3)
5321 operands[3] = gen_reg_rtx (CCFPmode);
5324 ;; VSX Scalar Test Data Class Double- and Single-Precision
5325 ;; (The lt bit is set if operand 1 is negative. The eq bit is set
5326 ;; if any of the conditions tested by operand 2 are satisfied.
5327 ;; The gt and unordered bits are cleared to zero.)
5328 (define_expand "xststdc<sd>p"
5332 [(match_operand:SFDF 1 "vsx_register_operand" "wa")
5333 (match_operand:SI 2 "u7bit_cint_operand" "n")]
5336 (set (match_operand:SI 0 "register_operand" "=r")
5337 (eq:SI (match_dup 3)
5341 operands[3] = gen_reg_rtx (CCFPmode);
5342 operands[4] = CONST0_RTX (SImode);
5345 ;; The VSX Scalar Test Negative Quad-Precision
5346 (define_expand "xststdcnegqp_<mode>"
5350 [(match_operand:IEEE128 1 "altivec_register_operand" "v")
5354 (set (match_operand:SI 0 "register_operand" "=r")
5355 (lt:SI (match_dup 2)
5359 operands[2] = gen_reg_rtx (CCFPmode);
5362 ;; The VSX Scalar Test Negative Double- and Single-Precision
5363 (define_expand "xststdcneg<sd>p"
5367 [(match_operand:SFDF 1 "vsx_register_operand" "wa")
5371 (set (match_operand:SI 0 "register_operand" "=r")
5372 (lt:SI (match_dup 2)
5376 operands[2] = gen_reg_rtx (CCFPmode);
5377 operands[3] = CONST0_RTX (SImode);
5380 (define_insn "*xststdcqp_<mode>"
5381 [(set (match_operand:CCFP 0 "" "=y")
5384 [(match_operand:IEEE128 1 "altivec_register_operand" "v")
5385 (match_operand:SI 2 "u7bit_cint_operand" "n")]
5389 "xststdcqp %0,%1,%2"
5390 [(set_attr "type" "fpcompare")])
5392 (define_insn "*xststdc<sd>p"
5393 [(set (match_operand:CCFP 0 "" "=y")
5395 (unspec:SFDF [(match_operand:SFDF 1 "vsx_register_operand" "wa")
5396 (match_operand:SI 2 "u7bit_cint_operand" "n")]
5398 (match_operand:SI 3 "zero_constant" "j")))]
5399 "TARGET_P9_VECTOR"
5400 "xststdc<sd>p %0,%x1,%2"
5401 [(set_attr "type" "fpcompare")])
5403 ;; VSX Vector Extract Exponent Double and Single Precision
5404 (define_insn "xvxexp<sd>p"
5405 [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
5407 [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
5410 "xvxexp<sd>p %x0,%x1"
5411 [(set_attr "type" "vecsimple")])
5413 ;; VSX Vector Extract Significand Double and Single Precision
5414 (define_insn "xvxsig<sd>p"
5415 [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
5417 [(match_operand:VSX_F 1 "vsx_register_operand" "wa")]
5420 "xvxsig<sd>p %x0,%x1"
5421 [(set_attr "type" "vecsimple")])
5423 ;; VSX Vector Insert Exponent Double and Single Precision
5424 (define_insn "xviexp<sd>p"
5425 [(set (match_operand:VSX_F 0 "vsx_register_operand" "=wa")
5427 [(match_operand:VSX_F 1 "vsx_register_operand" "wa")
5428 (match_operand:VSX_F 2 "vsx_register_operand" "wa")]
5431 "xviexp<sd>p %x0,%x1,%x2"
5432 [(set_attr "type" "vecsimple")])
5434 ;; VSX Vector Test Data Class Double and Single Precision
5435 ;; The corresponding elements of the result vector are all ones
5436 ;; if any of the conditions tested by operand 3 are satisfied.
5437 (define_insn "xvtstdc<sd>p"
5438 [(set (match_operand:<VSI> 0 "vsx_register_operand" "=wa")
5440 [(match_operand:VSX_F 1 "vsx_register_operand" "wa")
5441 (match_operand:SI 2 "u7bit_cint_operand" "n")]
5442 UNSPEC_VSX_VTSTDC))]
5443 "TARGET_P9_VECTOR"
5444 "xvtstdc<sd>p %x0,%x1,%2"
5445 [(set_attr "type" "vecsimple")])
5447 ;; ISA 3.0 String Operations Support
5449 ;; Compare vectors producing a vector result and a predicate, setting CR6
5450 ;; to indicate a combined status. This pattern matches v16qi, v8hi, and
5451 ;; v4si modes. There is no need to match the v2df, v4sf, or v2di modes
5452 ;; because comparisons in those modes are expanded to use Power8
5453 ;; instructions.
5454 (define_insn "*vsx_ne_<mode>_p"
5455 [(set (reg:CC CR6_REGNO)
5457 [(ne:CC (match_operand:VSX_EXTRACT_I 1 "gpc_reg_operand" "v")
5458 (match_operand:VSX_EXTRACT_I 2 "gpc_reg_operand" "v"))]
5460 (set (match_operand:VSX_EXTRACT_I 0 "gpc_reg_operand" "=v")
5461 (ne:VSX_EXTRACT_I (match_dup 1)
5464 "vcmpne<VSX_EXTRACT_WIDTH>. %0,%1,%2"
5465 [(set_attr "type" "vecsimple")])
5467 (define_insn "*vector_nez_<mode>_p"
5468 [(set (reg:CC CR6_REGNO)
5469 (unspec:CC [(unspec:VI
5470 [(match_operand:VI 1 "gpc_reg_operand" "v")
5471 (match_operand:VI 2 "gpc_reg_operand" "v")]
5474 (set (match_operand:VI 0 "gpc_reg_operand" "=v")
5475 (unspec:VI [(match_dup 1)
5479 "vcmpnez<VSX_EXTRACT_WIDTH>. %0,%1,%2"
5480 [(set_attr "type" "vecsimple")])
5482 ;; Return first position of match between vectors using natural order
5483 ;; for both LE and BE execution modes.
5484 (define_expand "first_match_index_<mode>"
5485 [(match_operand:SI 0 "register_operand")
5486 (unspec:SI [(match_operand:VSX_EXTRACT_I 1 "register_operand")
5487 (match_operand:VSX_EXTRACT_I 2 "register_operand")]
5488 UNSPEC_VSX_FIRST_MATCH_INDEX)]
5493 rtx cmp_result = gen_reg_rtx (<MODE>mode);
5494 rtx not_result = gen_reg_rtx (<MODE>mode);
5496 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmp_result, operands[1],
5498 emit_insn (gen_one_cmpl<mode>2 (not_result, cmp_result));
5500 sh = GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode)) / 2;
5502 if (<MODE>mode == V16QImode)
5503 {
5504 if (!BYTES_BIG_ENDIAN)
5505 emit_insn (gen_vctzlsbb_<mode> (operands[0], not_result));
5506 else
5507 emit_insn (gen_vclzlsbb_<mode> (operands[0], not_result));
5508 }
5509 else
5510 {
5511 rtx tmp = gen_reg_rtx (SImode);
5512 if (!BYTES_BIG_ENDIAN)
5513 emit_insn (gen_vctzlsbb_<mode> (tmp, not_result));
5514 else
5515 emit_insn (gen_vclzlsbb_<mode> (tmp, not_result));
5516 emit_insn (gen_lshrsi3 (operands[0], tmp, GEN_INT (sh)));
5517 }
5518 DONE;
5519 })
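;; Hedged usage sketch (the vec_first_match_index built-in, ISA 3.0):
;;
;;   int first_eq (vector unsigned char a, vector unsigned char b)
;;   {
;;     return vec_first_match_index (a, b);
;;   }
;;
;; This expands to vcmpneb, a complement, and vctzlsbb (LE) or vclzlsbb
;; (BE); for halfword and word elements the resulting byte index is scaled
;; down by the shift computed above.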
5521 ;; Return first position of match between vectors or end of string (EOS) using
5522 ;; natural element order for both LE and BE execution modes.
5523 (define_expand "first_match_or_eos_index_<mode>"
5524 [(match_operand:SI 0 "register_operand")
5525 (unspec: SI [(match_operand:VSX_EXTRACT_I 1 "register_operand")
5526 (match_operand:VSX_EXTRACT_I 2 "register_operand")]
5527 UNSPEC_VSX_FIRST_MATCH_EOS_INDEX)]
5531 rtx cmpz1_result = gen_reg_rtx (<MODE>mode);
5532 rtx cmpz2_result = gen_reg_rtx (<MODE>mode);
5533 rtx cmpz_result = gen_reg_rtx (<MODE>mode);
5534 rtx and_result = gen_reg_rtx (<MODE>mode);
5535 rtx result = gen_reg_rtx (<MODE>mode);
5536 rtx vzero = gen_reg_rtx (<MODE>mode);
5538 /* Vector with zeros in elements that correspond to zeros in operands. */
5539 emit_move_insn (vzero, CONST0_RTX (<MODE>mode));
5540 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmpz1_result, operands[1], vzero));
5541 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmpz2_result, operands[2], vzero));
5542 emit_insn (gen_and<mode>3 (and_result, cmpz1_result, cmpz2_result));
5544 /* Vector with ones in elements that do not match. */
5545 emit_insn (gen_vcmpnez<VSX_EXTRACT_WIDTH> (cmpz_result, operands[1],
5548 /* Create vector with ones in elements where there was a zero in one of
5549 the source elements or the elements that match. */
5550 emit_insn (gen_nand<mode>3 (result, and_result, cmpz_result));
5551 sh = GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode)) / 2;
5553 if (<MODE>mode == V16QImode)
5554 {
5555 if (!BYTES_BIG_ENDIAN)
5556 emit_insn (gen_vctzlsbb_<mode> (operands[0], result));
5557 else
5558 emit_insn (gen_vclzlsbb_<mode> (operands[0], result));
5559 }
5560 else
5561 {
5562 rtx tmp = gen_reg_rtx (SImode);
5563 if (!BYTES_BIG_ENDIAN)
5564 emit_insn (gen_vctzlsbb_<mode> (tmp, result));
5565 else
5566 emit_insn (gen_vclzlsbb_<mode> (tmp, result));
5567 emit_insn (gen_lshrsi3 (operands[0], tmp, GEN_INT (sh)));
5568 }
5569 DONE;
5570 })
5572 ;; Return first position of mismatch between vectors using natural
5573 ;; element order for both LE and BE execution modes.
5574 (define_expand "first_mismatch_index_<mode>"
5575 [(match_operand:SI 0 "register_operand")
5576 (unspec: SI [(match_operand:VSX_EXTRACT_I 1 "register_operand")
5577 (match_operand:VSX_EXTRACT_I 2 "register_operand")]
5578 UNSPEC_VSX_FIRST_MISMATCH_INDEX)]
5582 rtx cmp_result = gen_reg_rtx (<MODE>mode);
5584 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmp_result, operands[1],
5586 sh = GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode)) / 2;
5588 if (<MODE>mode == V16QImode)
5589 {
5590 if (!BYTES_BIG_ENDIAN)
5591 emit_insn (gen_vctzlsbb_<mode> (operands[0], cmp_result));
5592 else
5593 emit_insn (gen_vclzlsbb_<mode> (operands[0], cmp_result));
5594 }
5595 else
5596 {
5597 rtx tmp = gen_reg_rtx (SImode);
5598 if (!BYTES_BIG_ENDIAN)
5599 emit_insn (gen_vctzlsbb_<mode> (tmp, cmp_result));
5600 else
5601 emit_insn (gen_vclzlsbb_<mode> (tmp, cmp_result));
5602 emit_insn (gen_lshrsi3 (operands[0], tmp, GEN_INT (sh)));
5603 }
5604 DONE;
5605 })
5607 ;; Return first position of mismatch between vectors or end of string (EOS)
5608 ;; using natural element order for both LE and BE execution modes.
5609 (define_expand "first_mismatch_or_eos_index_<mode>"
5610 [(match_operand:SI 0 "register_operand")
5611 (unspec: SI [(match_operand:VSX_EXTRACT_I 1 "register_operand")
5612 (match_operand:VSX_EXTRACT_I 2 "register_operand")]
5613 UNSPEC_VSX_FIRST_MISMATCH_EOS_INDEX)]
5617 rtx cmpz1_result = gen_reg_rtx (<MODE>mode);
5618 rtx cmpz2_result = gen_reg_rtx (<MODE>mode);
5619 rtx cmpz_result = gen_reg_rtx (<MODE>mode);
5620 rtx not_cmpz_result = gen_reg_rtx (<MODE>mode);
5621 rtx and_result = gen_reg_rtx (<MODE>mode);
5622 rtx result = gen_reg_rtx (<MODE>mode);
5623 rtx vzero = gen_reg_rtx (<MODE>mode);
5625 /* Vector with zeros in elements that correspond to zeros in operands. */
5626 emit_move_insn (vzero, CONST0_RTX (<MODE>mode));
5628 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmpz1_result, operands[1], vzero));
5629 emit_insn (gen_vcmpne<VSX_EXTRACT_WIDTH> (cmpz2_result, operands[2], vzero));
5630 emit_insn (gen_and<mode>3 (and_result, cmpz1_result, cmpz2_result));
5632 /* Vector with ones in elements that match. */
5633 emit_insn (gen_vcmpnez<VSX_EXTRACT_WIDTH> (cmpz_result, operands[1],
5635 emit_insn (gen_one_cmpl<mode>2 (not_cmpz_result, cmpz_result));
5637 /* Create vector with ones in elements where there was a zero in one of
5638 the source elements or the elements did not match. */
5639 emit_insn (gen_nand<mode>3 (result, and_result, not_cmpz_result));
5640 sh = GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode)) / 2;
5642 if (<MODE>mode == V16QImode)
5643 {
5644 if (!BYTES_BIG_ENDIAN)
5645 emit_insn (gen_vctzlsbb_<mode> (operands[0], result));
5646 else
5647 emit_insn (gen_vclzlsbb_<mode> (operands[0], result));
5648 }
5649 else
5650 {
5651 rtx tmp = gen_reg_rtx (SImode);
5652 if (!BYTES_BIG_ENDIAN)
5653 emit_insn (gen_vctzlsbb_<mode> (tmp, result));
5654 else
5655 emit_insn (gen_vclzlsbb_<mode> (tmp, result));
5656 emit_insn (gen_lshrsi3 (operands[0], tmp, GEN_INT (sh)));
5657 }
5658 DONE;
5659 })
5661 ;; Load VSX Vector with Length
5662 (define_expand "lxvl"
5663 [(set (match_dup 3)
5664 (ashift:DI (match_operand:DI 2 "register_operand")
5665 (const_int 56)))
5666 (set (match_operand:V16QI 0 "vsx_register_operand")
5668 [(match_operand:DI 1 "gpc_reg_operand")
5669 (mem:V16QI (match_dup 1))
5672 "TARGET_P9_VECTOR && TARGET_64BIT"
5674 operands[3] = gen_reg_rtx (DImode);
5675 })
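;; Usage sketch for the length-controlled load (vec_xl_len built-in,
;; assuming -mcpu=power9 -m64):
;;
;;   #include <altivec.h>
;;   vector unsigned char load_n (unsigned char *p, size_t n)
;;   {
;;     return vec_xl_len (p, n);
;;   }
;;
;; The byte count is shifted left by 56 because lxvl expects the length in
;; the top byte (bits 0:7) of the length register.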
5677 (define_insn "*lxvl"
5678 [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
5680 [(match_operand:DI 1 "gpc_reg_operand" "b")
5681 (mem:V16QI (match_dup 1))
5682 (match_operand:DI 2 "register_operand" "r")]
5684 "TARGET_P9_VECTOR && TARGET_64BIT"
5686 [(set_attr "type" "vecload")])
5688 (define_insn "lxvll"
5689 [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
5690 (unspec:V16QI [(match_operand:DI 1 "gpc_reg_operand" "b")
5691 (mem:V16QI (match_dup 1))
5692 (match_operand:DI 2 "register_operand" "r")]
5696 [(set_attr "type" "vecload")])
5698 ;; Expand for builtin xl_len_r
5699 (define_expand "xl_len_r"
5700 [(match_operand:V16QI 0 "vsx_register_operand")
5701 (match_operand:DI 1 "register_operand")
5702 (match_operand:DI 2 "register_operand")]
5705 rtx shift_mask = gen_reg_rtx (V16QImode);
5706 rtx rtx_vtmp = gen_reg_rtx (V16QImode);
5707 rtx tmp = gen_reg_rtx (DImode);
5709 emit_insn (gen_altivec_lvsl_reg_di (shift_mask, operands[2]));
5710 emit_insn (gen_ashldi3 (tmp, operands[2], GEN_INT (56)));
5711 emit_insn (gen_lxvll (rtx_vtmp, operands[1], tmp));
5712 emit_insn (gen_altivec_vperm_v8hiv16qi (operands[0], rtx_vtmp, rtx_vtmp,
5713 shift_mask));
5714 DONE;
5715 })
5717 (define_insn "stxvll"
5718 [(set (mem:V16QI (match_operand:DI 1 "gpc_reg_operand" "b"))
5719 (unspec:V16QI [(match_operand:V16QI 0 "vsx_register_operand" "wa")
5720 (mem:V16QI (match_dup 1))
5721 (match_operand:DI 2 "register_operand" "r")]
5725 [(set_attr "type" "vecstore")])
5727 ;; Store VSX Vector with Length
5728 (define_expand "stxvl"
5729 [(set (match_dup 3)
5730 (ashift:DI (match_operand:DI 2 "register_operand")
5731 (const_int 56)))
5732 (set (mem:V16QI (match_operand:DI 1 "gpc_reg_operand"))
5734 [(match_operand:V16QI 0 "vsx_register_operand")
5735 (mem:V16QI (match_dup 1))
5738 "TARGET_P9_VECTOR && TARGET_64BIT"
5740 operands[3] = gen_reg_rtx (DImode);
;; Define optab for vector access with length vectorization exploitation.
(define_expand "len_load_v16qi"
  [(match_operand:V16QI 0 "vlogical_operand")
   (match_operand:V16QI 1 "memory_operand")
   (match_operand:QI 2 "gpc_reg_operand")
   (match_operand:QI 3 "zero_constant")]
  "TARGET_P9_VECTOR && TARGET_64BIT"
{
  rtx mem = XEXP (operands[1], 0);
  mem = force_reg (DImode, mem);
  rtx len = gen_lowpart (DImode, operands[2]);
  emit_insn (gen_lxvl (operands[0], mem, len));
  DONE;
})

(define_expand "len_store_v16qi"
  [(match_operand:V16QI 0 "memory_operand")
   (match_operand:V16QI 1 "vlogical_operand")
   (match_operand:QI 2 "gpc_reg_operand")
   (match_operand:QI 3 "zero_constant")]
  "TARGET_P9_VECTOR && TARGET_64BIT"
{
  rtx mem = XEXP (operands[0], 0);
  mem = force_reg (DImode, mem);
  rtx len = gen_lowpart (DImode, operands[2]);
  emit_insn (gen_stxvl (operands[1], mem, len));
  DONE;
})
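
;; These optabs let the autovectorizer cover a loop remainder with a single
;; length-controlled load/store instead of a scalar epilogue.  A sketch of
;; the kind of loop that may exploit them (assuming -mcpu=power9 -O2 and
;; that partial-vector usage is enabled; whether the tail actually becomes
;; lxvl/stxvl depends on the cost model):
;;
;;   void copy_bytes (unsigned char *dst, unsigned char *src, int n)
;;   {
;;     for (int i = 0; i < n; i++)   /* tail may become lxvl/stxvl */
;;       dst[i] = src[i];
;;   }
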
(define_insn "*stxvl"
  [(set (mem:V16QI (match_operand:DI 1 "gpc_reg_operand" "b"))
	(unspec:V16QI
	 [(match_operand:V16QI 0 "vsx_register_operand" "wa")
	  (mem:V16QI (match_dup 1))
	  (match_operand:DI 2 "register_operand" "r")]
	 UNSPEC_STXVL))]
  "TARGET_P9_VECTOR && TARGET_64BIT"
  "stxvl %x0,%1,%2"
  [(set_attr "type" "vecstore")])
;; Expand for builtin xst_len_r
(define_expand "xst_len_r"
  [(match_operand:V16QI 0 "vsx_register_operand" "=wa")
   (match_operand:DI 1 "register_operand" "b")
   (match_operand:DI 2 "register_operand" "r")]
  "TARGET_P9_VECTOR && TARGET_64BIT"
{
  rtx shift_mask = gen_reg_rtx (V16QImode);
  rtx rtx_vtmp = gen_reg_rtx (V16QImode);
  rtx tmp = gen_reg_rtx (DImode);

  emit_insn (gen_altivec_lvsr_reg_di (shift_mask, operands[2]));
  emit_insn (gen_altivec_vperm_v8hiv16qi (rtx_vtmp, operands[0], operands[0],
					  shift_mask));
  emit_insn (gen_ashldi3 (tmp, operands[2], GEN_INT (56)));
  emit_insn (gen_stxvll (rtx_vtmp, operands[1], tmp));
  DONE;
})
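
;; Hedged sketch of the right-justified variants these two expanders
;; implement; vec_xl_len_r and vec_xst_len_r are the documented builtin
;; names (not defined in this file), and the wrapper is illustrative:
;;
;;   #include <altivec.h>
;;
;;   void move_tail (unsigned char *dst, unsigned char *src, size_t len)
;;   {
;;     vector unsigned char v = vec_xl_len_r (src, len);
;;     vec_xst_len_r (v, dst, len);
;;   }
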
;; Vector Compare Not Equal Byte (specified/not+eq:)
(define_insn "vcmpneb"
  [(set (match_operand:V16QI 0 "altivec_register_operand" "=v")
	(not:V16QI
	  (eq:V16QI (match_operand:V16QI 1 "altivec_register_operand" "v")
		    (match_operand:V16QI 2 "altivec_register_operand" "v"))))]
  "TARGET_P9_VECTOR"
  "vcmpneb %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Compare Not Equal v1ti (specified/not+eq:)
(define_expand "vcmpnet"
  [(set (match_operand:V1TI 0 "altivec_register_operand")
	(not:V1TI
	  (eq:V1TI (match_operand:V1TI 1 "altivec_register_operand")
		   (match_operand:V1TI 2 "altivec_register_operand"))))]
  "TARGET_POWER10"
{
  emit_insn (gen_eqvv1ti3 (operands[0], operands[1], operands[2]));
  emit_insn (gen_one_cmplv1ti2 (operands[0], operands[0]));
  DONE;
})
;; Vector Compare Not Equal or Zero Byte
(define_insn "vcmpnezb"
  [(set (match_operand:V16QI 0 "altivec_register_operand" "=v")
	(unspec:V16QI
	 [(match_operand:V16QI 1 "altivec_register_operand" "v")
	  (match_operand:V16QI 2 "altivec_register_operand" "v")]
	 UNSPEC_VCMPNEZB))]
  "TARGET_P9_VECTOR"
  "vcmpnezb %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Compare Not Equal or Zero Byte predicate or record-form
(define_insn "vcmpnezb_p"
  [(set (reg:CC CR6_REGNO)
	(unspec:CC
	 [(match_operand:V16QI 1 "altivec_register_operand" "v")
	  (match_operand:V16QI 2 "altivec_register_operand" "v")]
	 UNSPEC_VCMPNEZB))
   (set (match_operand:V16QI 0 "altivec_register_operand" "=v")
	(unspec:V16QI
	 [(match_dup 1)
	  (match_dup 2)]
	 UNSPEC_VCMPNEZB))]
  "TARGET_P9_VECTOR"
  "vcmpnezb. %0,%1,%2"
  [(set_attr "type" "vecsimple")])
;; Vector Compare Not Equal Half Word (specified/not+eq:)
(define_insn "vcmpneh"
  [(set (match_operand:V8HI 0 "altivec_register_operand" "=v")
	(not:V8HI
	  (eq:V8HI (match_operand:V8HI 1 "altivec_register_operand" "v")
		   (match_operand:V8HI 2 "altivec_register_operand" "v"))))]
  "TARGET_P9_VECTOR"
  "vcmpneh %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Compare Not Equal or Zero Half Word
(define_insn "vcmpnezh"
  [(set (match_operand:V8HI 0 "altivec_register_operand" "=v")
	(unspec:V8HI [(match_operand:V8HI 1 "altivec_register_operand" "v")
		      (match_operand:V8HI 2 "altivec_register_operand" "v")]
		     UNSPEC_VCMPNEZH))]
  "TARGET_P9_VECTOR"
  "vcmpnezh %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Compare Not Equal Word (specified/not+eq:)
(define_insn "vcmpnew"
  [(set (match_operand:V4SI 0 "altivec_register_operand" "=v")
	(not:V4SI
	  (eq:V4SI (match_operand:V4SI 1 "altivec_register_operand" "v")
		   (match_operand:V4SI 2 "altivec_register_operand" "v"))))]
  "TARGET_P9_VECTOR"
  "vcmpnew %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Compare Not Equal or Zero Word
(define_insn "vcmpnezw"
  [(set (match_operand:V4SI 0 "altivec_register_operand" "=v")
	(unspec:V4SI [(match_operand:V4SI 1 "altivec_register_operand" "v")
		      (match_operand:V4SI 2 "altivec_register_operand" "v")]
		     UNSPEC_VCMPNEZW))]
  "TARGET_P9_VECTOR"
  "vcmpnezw %0,%1,%2"
  [(set_attr "type" "vecsimple")])
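
;; A usage sketch for the vcmpne/vcmpnez family, assuming the documented
;; vec_cmpne and vec_cmpnez builtins map onto these patterns:
;;
;;   #include <altivec.h>
;;
;;   /* All-ones in each byte where a and b differ.  */
;;   vector bool char ne (vector unsigned char a, vector unsigned char b)
;;   {
;;     return vec_cmpne (a, b);
;;   }
;;
;;   /* As above, but also all-ones where either byte is zero (useful
;;      for string terminators).  */
;;   vector bool char nez (vector unsigned char a, vector unsigned char b)
;;   {
;;     return vec_cmpnez (a, b);
;;   }
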
;; Vector Count Leading/Trailing Zero Least-Significant Bits Byte
(define_insn "*vc<vczlsbb_char>zlsbb_zext_<mode>"
  [(set (match_operand:DI 0 "register_operand" "=r")
	(zero_extend:DI
	 (unspec:SI
	  [(match_operand:VSX_EXTRACT_I 1 "altivec_register_operand" "v")]
	  VCZLSBB)))]
  "TARGET_P9_VECTOR"
  "vc<vczlsbb_char>zlsbb %0,%1"
  [(set_attr "type" "vecsimple")])

(define_insn "vc<vczlsbb_char>zlsbb_<mode>"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI
	 [(match_operand:VSX_EXTRACT_I 1 "altivec_register_operand" "v")]
	 VCZLSBB))]
  "TARGET_P9_VECTOR"
  "vc<vczlsbb_char>zlsbb %0,%1"
  [(set_attr "type" "vecsimple")])
;; Vector Extract Unsigned Byte Left-Indexed
(define_insn "vextublx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V16QI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUBLX))]
  "TARGET_P9_VECTOR"
  "vextublx %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Extract Unsigned Byte Right-Indexed
(define_insn "vextubrx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V16QI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUBRX))]
  "TARGET_P9_VECTOR"
  "vextubrx %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Extract Unsigned Half Word Left-Indexed
(define_insn "vextuhlx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V8HI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUHLX))]
  "TARGET_P9_VECTOR"
  "vextuhlx %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Extract Unsigned Half Word Right-Indexed
(define_insn "vextuhrx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V8HI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUHRX))]
  "TARGET_P9_VECTOR"
  "vextuhrx %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Extract Unsigned Word Left-Indexed
(define_insn "vextuwlx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V4SI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUWLX))]
  "TARGET_P9_VECTOR"
  "vextuwlx %0,%1,%2"
  [(set_attr "type" "vecsimple")])

;; Vector Extract Unsigned Word Right-Indexed
(define_insn "vextuwrx"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:SI 1 "register_operand" "r")
		    (match_operand:V4SI 2 "altivec_register_operand" "v")]
		   UNSPEC_VEXTUWRX))]
  "TARGET_P9_VECTOR"
  "vextuwrx %0,%1,%2"
  [(set_attr "type" "vecsimple")])
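
;; These left/right-indexed extracts back vec_extract with a variable
;; element number on Power9.  A hedged sketch (the insn actually chosen
;; depends on element type and endianness):
;;
;;   #include <altivec.h>
;;
;;   unsigned char nth_byte (vector unsigned char v, int i)
;;   {
;;     return vec_extract (v, i);   /* i need not be a constant */
;;   }
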
;; Vector insert/extract word at arbitrary byte values.  Note, the little
;; endian version needs to adjust the byte number, and the V4SI element in
;; vinsert4b.
(define_insn "extract4b"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
	(unspec:V2DI [(match_operand:V16QI 1 "vsx_register_operand" "wa")
		      (match_operand:QI 2 "const_0_to_12_operand" "n")]
		     UNSPEC_XXEXTRACTUW))]
  "TARGET_P9_VECTOR"
{
  if (!BYTES_BIG_ENDIAN)
    operands[2] = GEN_INT (12 - INTVAL (operands[2]));

  return "xxextractuw %x0,%x1,%2";
})

(define_expand "insert4b"
  [(set (match_operand:V16QI 0 "vsx_register_operand")
	(unspec:V16QI [(match_operand:V4SI 1 "vsx_register_operand")
		       (match_operand:V16QI 2 "vsx_register_operand")
		       (match_operand:QI 3 "const_0_to_12_operand")]
		      UNSPEC_XXINSERTW))]
  "TARGET_P9_VECTOR"
{
  if (!BYTES_BIG_ENDIAN)
    {
      rtx op1 = operands[1];
      rtx v4si_tmp = gen_reg_rtx (V4SImode);
      emit_insn (gen_vsx_xxpermdi_v4si_be (v4si_tmp, op1, op1, const1_rtx));
      operands[1] = v4si_tmp;
      operands[3] = GEN_INT (12 - INTVAL (operands[3]));
    }
})

(define_insn "*insert4b_internal"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
	(unspec:V16QI [(match_operand:V4SI 1 "vsx_register_operand" "wa")
		       (match_operand:V16QI 2 "vsx_register_operand" "0")
		       (match_operand:QI 3 "const_0_to_12_operand" "n")]
		      UNSPEC_XXINSERTW))]
  "TARGET_P9_VECTOR"
  "xxinsertw %x0,%x1,%3"
  [(set_attr "type" "vecperm")])
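
;; A hedged sketch using the documented vec_insert4b builtin, which is
;; expected to map onto the insert4b expander above (the wrapper name
;; and offset are illustrative):
;;
;;   #include <altivec.h>
;;
;;   /* Insert the low 4-byte word of SRC at byte offset 8 of DST;
;;      the offset must be a constant in 0..12.  */
;;   vector unsigned char put4 (vector signed int src,
;;                              vector unsigned char dst)
;;   {
;;     return vec_insert4b (src, dst, 8);
;;   }
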
;; Generate vector extract four float 32 values from left four elements
;; of eight element vector of float 16 values.
(define_expand "vextract_fp_from_shorth"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:V8HI 1 "register_operand" "wa")]
		     UNSPEC_VSX_VEXTRACT_FP_FROM_SHORTH))]
  "TARGET_P9_VECTOR"
{
  int i;
  int vals_le[16] = {15, 14, 0, 0, 13, 12, 0, 0, 11, 10, 0, 0, 9, 8, 0, 0};
  int vals_be[16] = {0, 0, 0, 1, 0, 0, 2, 3, 0, 0, 4, 5, 0, 0, 6, 7};

  rtx rvals[16];
  rtx mask = gen_reg_rtx (V16QImode);
  rtx tmp = gen_reg_rtx (V16QImode);
  rtvec v;

  for (i = 0; i < 16; i++)
    if (!BYTES_BIG_ENDIAN)
      rvals[i] = GEN_INT (vals_le[i]);
    else
      rvals[i] = GEN_INT (vals_be[i]);

  /* xvcvhpsp - vector convert F16 to vector F32 requires the four F16
     inputs in half words 1,3,5,7 (IBM numbering).  Use xxperm to move
     src half words 0,1,2,3 (LE), src half words 4,5,6,7 (BE) for the
     conversion instruction.  */
  v = gen_rtvec_v (16, rvals);
  emit_insn (gen_vec_initv16qiqi (mask, gen_rtx_PARALLEL (V16QImode, v)));
  emit_insn (gen_altivec_vperm_v8hiv16qi (tmp, operands[1],
					  operands[1], mask));
  emit_insn (gen_vsx_xvcvhpsp (operands[0], tmp));
  DONE;
})
;; Generate vector extract four float 32 values from right four elements
;; of eight element vector of float 16 values.
(define_expand "vextract_fp_from_shortl"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:V8HI 1 "register_operand" "wa")]
		     UNSPEC_VSX_VEXTRACT_FP_FROM_SHORTL))]
  "TARGET_P9_VECTOR"
{
  int i;
  int vals_le[16] = {7, 6, 0, 0, 5, 4, 0, 0, 3, 2, 0, 0, 1, 0, 0, 0};
  int vals_be[16] = {0, 0, 8, 9, 0, 0, 10, 11, 0, 0, 12, 13, 0, 0, 14, 15};

  rtx rvals[16];
  rtx mask = gen_reg_rtx (V16QImode);
  rtx tmp = gen_reg_rtx (V16QImode);
  rtvec v;

  for (i = 0; i < 16; i++)
    if (!BYTES_BIG_ENDIAN)
      rvals[i] = GEN_INT (vals_le[i]);
    else
      rvals[i] = GEN_INT (vals_be[i]);

  /* xvcvhpsp - vector convert F16 to vector F32 requires the four F16
     inputs in half words 1,3,5,7 (IBM numbering).  Use xxperm to move
     src half words 4,5,6,7 (LE), src half words 0,1,2,3 (BE) for the
     conversion instruction.  */
  v = gen_rtvec_v (16, rvals);
  emit_insn (gen_vec_initv16qiqi (mask, gen_rtx_PARALLEL (V16QImode, v)));
  emit_insn (gen_altivec_vperm_v8hiv16qi (tmp, operands[1],
					  operands[1], mask));
  emit_insn (gen_vsx_xvcvhpsp (operands[0], tmp));
  DONE;
})
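
;; A usage sketch, assuming the documented vec_extract_fp32_from_shorth
;; and vec_extract_fp32_from_shortl builtins expand through these two
;; patterns:
;;
;;   #include <altivec.h>
;;
;;   /* Widen the first/last four IEEE half-precision values to float.  */
;;   vector float hi4 (vector unsigned short h)
;;   {
;;     return vec_extract_fp32_from_shorth (h);
;;   }
;;   vector float lo4 (vector unsigned short h)
;;   {
;;     return vec_extract_fp32_from_shortl (h);
;;   }
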
;; Support for ISA 3.0 vector byte reverse

;; Swap all bytes within a vector
(define_insn "p9_xxbrq_v1ti"
  [(set (match_operand:V1TI 0 "vsx_register_operand" "=wa")
	(bswap:V1TI (match_operand:V1TI 1 "vsx_register_operand" "wa")))]
  "TARGET_P9_VECTOR"
  "xxbrq %x0,%x1"
  [(set_attr "type" "vecperm")])

(define_expand "p9_xxbrq_v16qi"
  [(use (match_operand:V16QI 0 "vsx_register_operand" "=wa"))
   (use (match_operand:V16QI 1 "vsx_register_operand" "wa"))]
  "TARGET_P9_VECTOR"
{
  rtx op0 = gen_reg_rtx (V1TImode);
  rtx op1 = gen_lowpart (V1TImode, operands[1]);
  emit_insn (gen_p9_xxbrq_v1ti (op0, op1));
  emit_move_insn (operands[0], gen_lowpart (V16QImode, op0));
  DONE;
})
;; Swap all bytes in each 64-bit element
(define_insn "p9_xxbrd_v2di"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
	(bswap:V2DI (match_operand:V2DI 1 "vsx_register_operand" "wa")))]
  "TARGET_P9_VECTOR"
  "xxbrd %x0,%x1"
  [(set_attr "type" "vecperm")])

(define_expand "p9_xxbrd_v2df"
  [(use (match_operand:V2DF 0 "vsx_register_operand" "=wa"))
   (use (match_operand:V2DF 1 "vsx_register_operand" "wa"))]
  "TARGET_P9_VECTOR"
{
  rtx op0 = gen_reg_rtx (V2DImode);
  rtx op1 = gen_lowpart (V2DImode, operands[1]);
  emit_insn (gen_p9_xxbrd_v2di (op0, op1));
  emit_move_insn (operands[0], gen_lowpart (V2DFmode, op0));
  DONE;
})

;; Swap all bytes in each 32-bit element
(define_insn "p9_xxbrw_v4si"
  [(set (match_operand:V4SI 0 "vsx_register_operand" "=wa")
	(bswap:V4SI (match_operand:V4SI 1 "vsx_register_operand" "wa")))]
  "TARGET_P9_VECTOR"
  "xxbrw %x0,%x1"
  [(set_attr "type" "vecperm")])

(define_expand "p9_xxbrw_v4sf"
  [(use (match_operand:V4SF 0 "vsx_register_operand" "=wa"))
   (use (match_operand:V4SF 1 "vsx_register_operand" "wa"))]
  "TARGET_P9_VECTOR"
{
  rtx op0 = gen_reg_rtx (V4SImode);
  rtx op1 = gen_lowpart (V4SImode, operands[1]);
  emit_insn (gen_p9_xxbrw_v4si (op0, op1));
  emit_move_insn (operands[0], gen_lowpart (V4SFmode, op0));
  DONE;
})
;; Swap all bytes in each element of vector
(define_expand "revb_<mode>"
  [(use (match_operand:VEC_REVB 0 "vsx_register_operand"))
   (use (match_operand:VEC_REVB 1 "vsx_register_operand"))]
  ""
{
  if (TARGET_P9_VECTOR)
    emit_insn (gen_p9_xxbr<VSX_XXBR>_<mode> (operands[0], operands[1]));
  else
    {
      if (<MODE>mode == V8HImode)
	{
	  rtx splt = gen_reg_rtx (V8HImode);
	  emit_insn (gen_altivec_vspltish (splt, GEN_INT (8)));
	  emit_insn (gen_altivec_vrlh (operands[0], operands[1], splt));
	}
      else
	{
	  /* Want to have the elements in reverse order relative
	     to the endian mode in use, i.e. in LE mode, put elements
	     in BE order.  */
	  rtx sel = swap_endian_selector_for_mode (<MODE>mode);
	  emit_insn (gen_altivec_vperm_<mode>_direct (operands[0], operands[1],
						      operands[1], sel));
	}
    }

  DONE;
})

;; Reversing bytes in vector char is just a NOP.
(define_expand "revb_v16qi"
  [(set (match_operand:V16QI 0 "vsx_register_operand")
	(bswap:V16QI (match_operand:V16QI 1 "vsx_register_operand")))]
  ""
{
  emit_move_insn (operands[0], operands[1]);
  DONE;
})
;; Swap all bytes in each 16-bit element
(define_insn "p9_xxbrh_v8hi"
  [(set (match_operand:V8HI 0 "vsx_register_operand" "=wa")
	(bswap:V8HI (match_operand:V8HI 1 "vsx_register_operand" "wa")))]
  "TARGET_P9_VECTOR"
  "xxbrh %x0,%x1"
  [(set_attr "type" "vecperm")])
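
;; The revb expanders implement the documented vec_revb builtin; a short
;; sketch for 32-bit elements:
;;
;;   #include <altivec.h>
;;
;;   /* Byte-swap each word, e.g. to convert the endianness of loaded
;;      data.  */
;;   vector unsigned int bswap4 (vector unsigned int v)
;;   {
;;     return vec_revb (v);   /* xxbrw on Power9, vperm fallback earlier */
;;   }
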
;; Operand numbers for the following peephole2
(define_constants
  [(SFBOOL_TMP_GPR	 0)	;; GPR temporary
   (SFBOOL_TMP_VSX	 1)	;; vector temporary
   (SFBOOL_MFVSR_D	 2)	;; move to gpr dest
   (SFBOOL_MFVSR_A	 3)	;; move to gpr src
   (SFBOOL_BOOL_D	 4)	;; and/ior/xor dest
   (SFBOOL_BOOL_A1	 5)	;; and/ior/xor arg1
   (SFBOOL_BOOL_A2	 6)	;; and/ior/xor arg2
   (SFBOOL_SHL_D	 7)	;; shift left dest
   (SFBOOL_SHL_A	 8)	;; shift left arg
   (SFBOOL_MTVSR_D	 9)	;; move to vector dest
   (SFBOOL_MFVSR_A_V4SF	10)	;; SFBOOL_MFVSR_A as V4SFmode
   (SFBOOL_BOOL_A_DI	11)	;; SFBOOL_BOOL_A1/A2 as DImode
   (SFBOOL_TMP_VSX_DI	12)	;; SFBOOL_TMP_VSX as DImode
   (SFBOOL_MTVSR_D_V4SF	13)])	;; SFBOOL_MTVSR_D as V4SFmode
;; Attempt to optimize some common GLIBC operations using logical operations to
;; pick apart SFmode operations.  For example, there is code from e_powf.c
;; after macro expansion that looks like:
;;
;;	typedef union {
;;	  float value;
;;	  uint32_t word;
;;	} ieee_float_shape_type;
;;
;;	float t1;
;;	int32_t is;
;;
;;	do {
;;	  ieee_float_shape_type gf_u;
;;	  gf_u.value = (t1);
;;	  (is) = gf_u.word;
;;	} while (0);
;;
;;	do {
;;	  ieee_float_shape_type sf_u;
;;	  sf_u.word = (is & 0xfffff000);
;;	  (t1) = sf_u.value;
;;	} while (0);
;;
;; This would result in two direct move operations (convert to memory format,
;; direct move to GPR, do the AND operation, direct move to VSX, convert to
;; scalar format).  With this peephole, we eliminate the direct move to the
;; GPR, and instead move the integer mask value to the vector register after a
;; shift and do the VSX logical operation.

;; The insns for dealing with SFmode in GPR registers look like:
;; (set (reg:V4SF reg2) (unspec:V4SF [(reg:SF reg1)] UNSPEC_VSX_CVDPSPN))
;;
;; (set (reg:DI reg3) (unspec:DI [(reg:V4SF reg2)] UNSPEC_P8V_RELOAD_FROM_VSX))
;;
;; (set (reg:DI reg4) (and:DI (reg:DI reg3) (reg:DI reg3)))
;;
;; (set (reg:DI reg5) (ashift:DI (reg:DI reg4) (const_int 32)))
;;
;; (set (reg:SF reg6) (unspec:SF [(reg:DI reg5)] UNSPEC_P8V_MTVSRD))
;;
;; (set (reg:SF reg6) (unspec:SF [(reg:SF reg6)] UNSPEC_VSX_CVSPDPN))
(define_peephole2
  [(match_scratch:DI SFBOOL_TMP_GPR "r")
   (match_scratch:V4SF SFBOOL_TMP_VSX "wa")

   ;; MFVSRWZ (aka zero_extend)
   (set (match_operand:DI SFBOOL_MFVSR_D "int_reg_operand")
	(zero_extend:DI
	 (match_operand:SI SFBOOL_MFVSR_A "vsx_register_operand")))

   ;; AND/IOR/XOR operation on int
   (set (match_operand:SI SFBOOL_BOOL_D "int_reg_operand")
	(and_ior_xor:SI (match_operand:SI SFBOOL_BOOL_A1 "int_reg_operand")
			(match_operand:SI SFBOOL_BOOL_A2 "reg_or_cint_operand")))

   ;; SLDI
   (set (match_operand:DI SFBOOL_SHL_D "int_reg_operand")
	(ashift:DI (match_operand:DI SFBOOL_SHL_A "int_reg_operand")
		   (const_int 32)))

   ;; MTVSRD
   (set (match_operand:SF SFBOOL_MTVSR_D "vsx_register_operand")
	(unspec:SF [(match_dup SFBOOL_SHL_D)] UNSPEC_P8V_MTVSRD))]

  "TARGET_POWERPC64 && TARGET_DIRECT_MOVE
   /* The REG_P (xxx) tests prevent SUBREGs, which allows us to use REGNO
      to compare registers, when the mode is different.  */
   && REG_P (operands[SFBOOL_MFVSR_D]) && REG_P (operands[SFBOOL_BOOL_D])
   && REG_P (operands[SFBOOL_BOOL_A1]) && REG_P (operands[SFBOOL_SHL_D])
   && REG_P (operands[SFBOOL_SHL_A]) && REG_P (operands[SFBOOL_MTVSR_D])
   && (REG_P (operands[SFBOOL_BOOL_A2])
       || CONST_INT_P (operands[SFBOOL_BOOL_A2]))
   && (REGNO (operands[SFBOOL_BOOL_D]) == REGNO (operands[SFBOOL_MFVSR_D])
       || peep2_reg_dead_p (2, operands[SFBOOL_MFVSR_D]))
   && (REGNO (operands[SFBOOL_MFVSR_D]) == REGNO (operands[SFBOOL_BOOL_A1])
       || (REG_P (operands[SFBOOL_BOOL_A2])
	   && REGNO (operands[SFBOOL_MFVSR_D])
		== REGNO (operands[SFBOOL_BOOL_A2])))
   && REGNO (operands[SFBOOL_BOOL_D]) == REGNO (operands[SFBOOL_SHL_A])
   && (REGNO (operands[SFBOOL_SHL_D]) == REGNO (operands[SFBOOL_BOOL_D])
       || peep2_reg_dead_p (3, operands[SFBOOL_BOOL_D]))
   && peep2_reg_dead_p (4, operands[SFBOOL_SHL_D])"

  [(set (match_dup SFBOOL_TMP_GPR)
	(ashift:DI (match_dup SFBOOL_BOOL_A_DI)
		   (const_int 32)))

   (set (match_dup SFBOOL_TMP_VSX_DI)
	(match_dup SFBOOL_TMP_GPR))

   (set (match_dup SFBOOL_MTVSR_D_V4SF)
	(and_ior_xor:V4SF (match_dup SFBOOL_MFVSR_A_V4SF)
			  (match_dup SFBOOL_TMP_VSX)))]
{
  rtx bool_a1 = operands[SFBOOL_BOOL_A1];
  rtx bool_a2 = operands[SFBOOL_BOOL_A2];
  int regno_mfvsr_d = REGNO (operands[SFBOOL_MFVSR_D]);
  int regno_mfvsr_a = REGNO (operands[SFBOOL_MFVSR_A]);
  int regno_tmp_vsx = REGNO (operands[SFBOOL_TMP_VSX]);
  int regno_mtvsr_d = REGNO (operands[SFBOOL_MTVSR_D]);

  if (CONST_INT_P (bool_a2))
    {
      rtx tmp_gpr = operands[SFBOOL_TMP_GPR];
      emit_move_insn (tmp_gpr, bool_a2);
      operands[SFBOOL_BOOL_A_DI] = tmp_gpr;
    }
  else
    {
      int regno_bool_a1 = REGNO (bool_a1);
      int regno_bool_a2 = REGNO (bool_a2);
      int regno_bool_a = (regno_mfvsr_d == regno_bool_a1
			  ? regno_bool_a2 : regno_bool_a1);
      operands[SFBOOL_BOOL_A_DI] = gen_rtx_REG (DImode, regno_bool_a);
    }

  operands[SFBOOL_MFVSR_A_V4SF] = gen_rtx_REG (V4SFmode, regno_mfvsr_a);
  operands[SFBOOL_TMP_VSX_DI] = gen_rtx_REG (DImode, regno_tmp_vsx);
  operands[SFBOOL_MTVSR_D_V4SF] = gen_rtx_REG (V4SFmode, regno_mtvsr_d);
})
;; Support signed/unsigned long long to float conversion vectorization.
;; Note that any_float (pc) here is just for code attribute <su>.
(define_expand "vec_pack<su>_float_v2di"
  [(match_operand:V4SF 0 "vfloat_operand")
   (match_operand:V2DI 1 "vint_operand")
   (match_operand:V2DI 2 "vint_operand")
   (any_float (pc))]
  "TARGET_VSX"
{
  rtx r1 = gen_reg_rtx (V4SFmode);
  rtx r2 = gen_reg_rtx (V4SFmode);
  emit_insn (gen_vsx_xvcv<su>xdsp (r1, operands[1]));
  emit_insn (gen_vsx_xvcv<su>xdsp (r2, operands[2]));
  rs6000_expand_extract_even (operands[0], r1, r2);
  DONE;
})

;; Support float to signed/unsigned long long conversion vectorization.
;; Note that any_fix (pc) here is just for code attribute <su>.
(define_expand "vec_unpack_<su>fix_trunc_hi_v4sf"
  [(match_operand:V2DI 0 "vint_operand")
   (match_operand:V4SF 1 "vfloat_operand")
   (any_fix (pc))]
  "TARGET_VSX"
{
  rtx reg = gen_reg_rtx (V4SFmode);
  rs6000_expand_interleave (reg, operands[1], operands[1], BYTES_BIG_ENDIAN);
  emit_insn (gen_vsx_xvcvsp<su>xds (operands[0], reg));
  DONE;
})

;; Note that any_fix (pc) here is just for code attribute <su>.
(define_expand "vec_unpack_<su>fix_trunc_lo_v4sf"
  [(match_operand:V2DI 0 "vint_operand")
   (match_operand:V4SF 1 "vfloat_operand")
   (any_fix (pc))]
  "TARGET_VSX"
{
  rtx reg = gen_reg_rtx (V4SFmode);
  rs6000_expand_interleave (reg, operands[1], operands[1], !BYTES_BIG_ENDIAN);
  emit_insn (gen_vsx_xvcvsp<su>xds (operands[0], reg));
  DONE;
})
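
;; A sketch of source the vectorizer can map onto the pack expander above
;; (two V2DI inputs converted and narrowed into one V4SF result); the
;; loop is illustrative, not a guarantee of the code generated:
;;
;;   void narrow (float *dst, long long *src, int n)
;;   {
;;     for (int i = 0; i < n; i++)
;;       dst[i] = (float) src[i];   /* vec_pack_float_v2di */
;;   }
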
(define_insn "vsx_<xvcvbf16>"
  [(set (match_operand:V16QI 0 "vsx_register_operand" "=wa")
	(unspec:V16QI [(match_operand:V16QI 1 "vsx_register_operand" "wa")]
		      XVCVBF16))]
  "TARGET_POWER10"
  "<xvcvbf16> %x0,%x1"
  [(set_attr "type" "vecfloat")])
(define_insn "vec_mtvsrbmi"
  [(set (match_operand:V16QI 0 "altivec_register_operand" "=v")
	(unspec:V16QI [(match_operand:QI 1 "u6bit_cint_operand" "n")]
		      UNSPEC_MTVSBM))]
  "TARGET_POWER10"
  "mtvsrbmi %0,%1"
)

(define_insn "vec_mtvsr_<mode>"
  [(set (match_operand:VSX_MM 0 "altivec_register_operand" "=v")
	(unspec:VSX_MM [(match_operand:DI 1 "gpc_reg_operand" "r")]
		       UNSPEC_MTVSBM))]
  "TARGET_POWER10"
  "mtvsr<wd>m %0,%1"
  [(set_attr "type" "vecsimple")])

(define_insn "vec_cntmb_<mode>"
  [(set (match_operand:DI 0 "gpc_reg_operand" "=r")
	(unspec:DI [(match_operand:VSX_MM4 1 "altivec_register_operand" "v")
		    (match_operand:QI 2 "const_0_to_1_operand" "n")]
		   UNSPEC_VCNTMB))]
  "TARGET_POWER10"
  "vcntmb<wd> %0,%1,%2"
  [(set_attr "type" "vecsimple")])

(define_insn "vec_extract_<mode>"
  [(set (match_operand:SI 0 "register_operand" "=r")
	(unspec:SI [(match_operand:VSX_MM 1 "altivec_register_operand" "v")]
		   UNSPEC_VEXTRACT))]
  "TARGET_POWER10"
  "vextract<wd>m %0,%1"
  [(set_attr "type" "vecsimple")])

(define_insn "vec_expand_<mode>"
  [(set (match_operand:VSX_MM 0 "vsx_register_operand" "=v")
	(unspec:VSX_MM [(match_operand:VSX_MM 1 "vsx_register_operand" "v")]
		       UNSPEC_VEXPAND))]
  "TARGET_POWER10"
  "vexpand<wd>m %0,%1"
  [(set_attr "type" "vecsimple")])
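
;; Hedged usage sketch for the Power10 vector-mask operations above, using
;; the documented vec_genbm and vec_cntm builtins (the wrapper name is
;; illustrative):
;;
;;   #include <altivec.h>
;;
;;   unsigned long long ones (unsigned long long mask)
;;   {
;;     vector unsigned char m = vec_genbm (mask);   /* mtvsrbm */
;;     return vec_cntm (m, 1);                      /* vcntmb */
;;   }
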
(define_insn "dives_<mode>"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(unspec:VIlong [(match_operand:VIlong 1 "vsx_register_operand" "v")
			(match_operand:VIlong 2 "vsx_register_operand" "v")]
		       UNSPEC_VDIVES))]
  "TARGET_POWER10"
  "vdives<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])

(define_insn "diveu_<mode>"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(unspec:VIlong [(match_operand:VIlong 1 "vsx_register_operand" "v")
			(match_operand:VIlong 2 "vsx_register_operand" "v")]
		       UNSPEC_VDIVEU))]
  "TARGET_POWER10"
  "vdiveu<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])

(define_insn "div<mode>3"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(div:VIlong (match_operand:VIlong 1 "vsx_register_operand" "v")
		    (match_operand:VIlong 2 "vsx_register_operand" "v")))]
  "TARGET_POWER10"
  "vdivs<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])

(define_insn "udiv<mode>3"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(udiv:VIlong (match_operand:VIlong 1 "vsx_register_operand" "v")
		     (match_operand:VIlong 2 "vsx_register_operand" "v")))]
  "TARGET_POWER10"
  "vdivu<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])

(define_insn "mod<mode>3"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(mod:VIlong (match_operand:VIlong 1 "vsx_register_operand" "v")
		    (match_operand:VIlong 2 "vsx_register_operand" "v")))]
  "TARGET_POWER10"
  "vmods<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])

(define_insn "umod<mode>3"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(umod:VIlong (match_operand:VIlong 1 "vsx_register_operand" "v")
		     (match_operand:VIlong 2 "vsx_register_operand" "v")))]
  "TARGET_POWER10"
  "vmodu<wd> %0,%1,%2"
  [(set_attr "type" "vecdiv")
   (set_attr "size" "<bits>")])
(define_insn "smul<mode>3_highpart"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(mult:VIlong (ashiftrt
		      (match_operand:VIlong 1 "vsx_register_operand" "v")
		      (const_int 32))
		     (ashiftrt
		      (match_operand:VIlong 2 "vsx_register_operand" "v")
		      (const_int 32))))]
  "TARGET_POWER10"
  "vmulhs<wd> %0,%1,%2"
  [(set_attr "type" "veccomplex")])

(define_insn "umul<mode>3_highpart"
  [(set (match_operand:VIlong 0 "vsx_register_operand" "=v")
	(us_mult:VIlong (ashiftrt
			 (match_operand:VIlong 1 "vsx_register_operand" "v")
			 (const_int 32))
			(ashiftrt
			 (match_operand:VIlong 2 "vsx_register_operand" "v")
			 (const_int 32))))]
  "TARGET_POWER10"
  "vmulhu<wd> %0,%1,%2"
  [(set_attr "type" "veccomplex")])

;; Vector multiply low double word
(define_insn "mulv2di3"
  [(set (match_operand:V2DI 0 "vsx_register_operand" "=v")
	(mult:V2DI (match_operand:V2DI 1 "vsx_register_operand" "v")
		   (match_operand:V2DI 2 "vsx_register_operand" "v")))]
  "TARGET_POWER10"
  "vmulld %0,%1,%2"
  [(set_attr "type" "veccomplex")])
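
;; On Power10 the div/mod patterns above let ordinary C vector arithmetic
;; stay in vector registers; a minimal sketch using GCC's generic vector
;; extension (the type name is illustrative):
;;
;;   typedef long long v2di __attribute__ ((vector_size (16)));
;;
;;   v2di quot_plus_rem (v2di a, v2di b)
;;   {
;;     return a / b + a % b;   /* vdivsd and vmodsd */
;;   }
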
;; XXSPLTIW built-in function support
(define_insn "xxspltiw_v4si"
  [(set (match_operand:V4SI 0 "register_operand" "=wa")
	(unspec:V4SI [(match_operand:SI 1 "s32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTIW))]
  "TARGET_POWER10"
  "xxspltiw %x0,%1"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])

(define_expand "xxspltiw_v4sf"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:SF 1 "const_double_operand" "n")]
		     UNSPEC_XXSPLTIW))]
  "TARGET_POWER10"
{
  long value = rs6000_const_f32_to_i32 (operands[1]);
  emit_insn (gen_xxspltiw_v4sf_inst (operands[0], GEN_INT (value)));
  DONE;
})

(define_insn "xxspltiw_v4sf_inst"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:SI 1 "c32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTIW))]
  "TARGET_POWER10"
  "xxspltiw %x0,%1"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
;; XXSPLTIDP built-in function support
(define_expand "xxspltidp_v2df"
  [(set (match_operand:V2DF 0 "register_operand")
	(unspec:V2DF [(match_operand:SF 1 "const_double_operand")]
		     UNSPEC_XXSPLTIDP))]
  "TARGET_POWER10"
{
  long value = rs6000_const_f32_to_i32 (operands[1]);
  rs6000_emit_xxspltidp_v2df (operands[0], value);
  DONE;
})

(define_insn "xxspltidp_v2df_inst"
  [(set (match_operand:V2DF 0 "register_operand" "=wa")
	(unspec:V2DF [(match_operand:SI 1 "c32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTIDP))]
  "TARGET_POWER10"
  "xxspltidp %x0,%1"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
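
;; Hedged sketch for the splat-immediate expanders above, assuming the
;; documented Power10 vec_splati and vec_splatid builtins reach them:
;;
;;   #include <altivec.h>
;;
;;   vector signed int four (void)
;;   {
;;     return vec_splati (4);       /* xxspltiw */
;;   }
;;   vector double half (void)
;;   {
;;     return vec_splatid (0.5f);   /* xxspltidp; SF value widened to DF */
;;   }
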
;; XXSPLTI32DX built-in function support
(define_expand "xxsplti32dx_v4si"
  [(set (match_operand:V4SI 0 "register_operand" "=wa")
	(unspec:V4SI [(match_operand:V4SI 1 "register_operand" "0")
		      (match_operand:QI 2 "u1bit_cint_operand" "n")
		      (match_operand:SI 3 "s32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTI32DX))]
  "TARGET_POWER10"
{
  int index = INTVAL (operands[2]);

  if (!BYTES_BIG_ENDIAN)
    index = 1 - index;

  emit_insn (gen_xxsplti32dx_v4si_inst (operands[0], operands[1],
					GEN_INT (index), operands[3]));
  DONE;
}
  [(set_attr "type" "vecperm")])

(define_insn "xxsplti32dx_v4si_inst"
  [(set (match_operand:V4SI 0 "register_operand" "=wa")
	(unspec:V4SI [(match_operand:V4SI 1 "register_operand" "0")
		      (match_operand:QI 2 "u1bit_cint_operand" "n")
		      (match_operand:SI 3 "s32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTI32DX))]
  "TARGET_POWER10"
  "xxsplti32dx %x0,%2,%3"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
(define_expand "xxsplti32dx_v4sf"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:V4SF 1 "register_operand" "0")
		      (match_operand:QI 2 "u1bit_cint_operand" "n")
		      (match_operand:SF 3 "const_double_operand" "n")]
		     UNSPEC_XXSPLTI32DX))]
  "TARGET_POWER10"
{
  int index = INTVAL (operands[2]);
  long value = rs6000_const_f32_to_i32 (operands[3]);

  if (!BYTES_BIG_ENDIAN)
    index = 1 - index;

  emit_insn (gen_xxsplti32dx_v4sf_inst (operands[0], operands[1],
					GEN_INT (index), GEN_INT (value)));
  DONE;
})

(define_insn "xxsplti32dx_v4sf_inst"
  [(set (match_operand:V4SF 0 "register_operand" "=wa")
	(unspec:V4SF [(match_operand:V4SF 1 "register_operand" "0")
		      (match_operand:QI 2 "u1bit_cint_operand" "n")
		      (match_operand:SI 3 "s32bit_cint_operand" "n")]
		     UNSPEC_XXSPLTI32DX))]
  "TARGET_POWER10"
  "xxsplti32dx %x0,%2,%3"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
;; XXBLEND built-in function support
(define_insn "xxblend_<mode>"
  [(set (match_operand:VM3 0 "register_operand" "=wa")
	(unspec:VM3 [(match_operand:VM3 1 "register_operand" "wa")
		     (match_operand:VM3 2 "register_operand" "wa")
		     (match_operand:VM3 3 "register_operand" "wa")]
		    UNSPEC_XXBLEND))]
  "TARGET_POWER10"
  "xxblendv<VM3_char> %x0,%x1,%x2,%x3"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
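
;; Usage sketch for xxblend, assuming the documented vec_blendv builtin:
;;
;;   #include <altivec.h>
;;
;;   /* Per-byte select: take b where the mask byte's sign bit is set.  */
;;   vector unsigned char sel (vector unsigned char a,
;;                             vector unsigned char b,
;;                             vector unsigned char mask)
;;   {
;;     return vec_blendv (a, b, mask);   /* xxblendvb */
;;   }
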
;; XXPERMX built-in function support
(define_expand "xxpermx"
  [(set (match_operand:V2DI 0 "register_operand" "+wa")
	(unspec:V2DI [(match_operand:V2DI 1 "register_operand" "wa")
		      (match_operand:V2DI 2 "register_operand" "wa")
		      (match_operand:V16QI 3 "register_operand" "wa")
		      (match_operand:QI 4 "u8bit_cint_operand" "n")]
		     UNSPEC_XXPERMX))]
  "TARGET_POWER10"
{
  if (BYTES_BIG_ENDIAN)
    emit_insn (gen_xxpermx_inst (operands[0], operands[1],
				 operands[2], operands[3],
				 operands[4]));
  else
    {
      /* Reverse value of byte element indexes by XORing with 0xFF.
	 Reverse the 32-byte section identifier match by subtracting bits
	 [0:2] of the element from 7.  */
      int value = INTVAL (operands[4]);
      rtx vreg = gen_reg_rtx (V16QImode);

      emit_insn (gen_xxspltib_v16qi (vreg, GEN_INT (-1)));
      emit_insn (gen_xorv16qi3 (operands[3], operands[3], vreg));
      value = 7 - value;
      emit_insn (gen_xxpermx_inst (operands[0], operands[2],
				   operands[1], operands[3],
				   GEN_INT (value)));
    }

  DONE;
}
  [(set_attr "type" "vecperm")])

(define_insn "xxpermx_inst"
  [(set (match_operand:V2DI 0 "register_operand" "+v")
	(unspec:V2DI [(match_operand:V2DI 1 "register_operand" "v")
		      (match_operand:V2DI 2 "register_operand" "v")
		      (match_operand:V16QI 3 "register_operand" "v")
		      (match_operand:QI 4 "u3bit_cint_operand" "n")]
		     UNSPEC_XXPERMX))]
  "TARGET_POWER10"
  "xxpermx %x0,%x1,%x2,%x3,%4"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
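
;; Usage sketch for xxpermx, assuming the documented vec_permx builtin;
;; the small immediate selects among the 32-byte sections:
;;
;;   #include <altivec.h>
;;
;;   vector unsigned char pick (vector unsigned char a,
;;                              vector unsigned char b,
;;                              vector unsigned char idx)
;;   {
;;     return vec_permx (a, b, idx, 0);
;;   }
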
;; XXEVAL built-in function support
(define_insn "xxeval"
  [(set (match_operand:V2DI 0 "register_operand" "=wa")
	(unspec:V2DI [(match_operand:V2DI 1 "register_operand" "wa")
		      (match_operand:V2DI 2 "register_operand" "wa")
		      (match_operand:V2DI 3 "register_operand" "wa")
		      (match_operand:QI 4 "u8bit_cint_operand" "n")]
		     UNSPEC_XXEVAL))]
  "TARGET_POWER10"
  "xxeval %x0,%x1,%x2,%x3,%4"
  [(set_attr "type" "vecperm")
   (set_attr "prefixed" "yes")])
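
;; Usage sketch for xxeval, assuming the documented vec_ternarylogic
;; builtin; the immediate is the 8-bit truth table applied bitwise:
;;
;;   #include <altivec.h>
;;
;;   /* 0xE8 is the majority function: (a & b) | (a & c) | (b & c).  */
;;   vector unsigned int majority (vector unsigned int a,
;;                                 vector unsigned int b,
;;                                 vector unsigned int c)
;;   {
;;     return vec_ternarylogic (a, b, c, 0xE8);
;;   }
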
;; Construct V1TI by vsx_concat_v2di
(define_split
  [(set (match_operand:V1TI 0 "vsx_register_operand")
	(subreg:V1TI
	 (match_operand:TI 1 "int_reg_operand") 0 ))]
  "TARGET_P9_VECTOR && !reload_completed"
  [(const_int 0)]
{
  rtx tmp1 = simplify_gen_subreg (DImode, operands[1], TImode, 0);
  rtx tmp2 = simplify_gen_subreg (DImode, operands[1], TImode, 8);
  rtx tmp3 = gen_reg_rtx (V2DImode);
  emit_insn (gen_vsx_concat_v2di (tmp3, tmp1, tmp2));
  rtx tmp4 = simplify_gen_subreg (V1TImode, tmp3, V2DImode, 0);
  emit_move_insn (operands[0], tmp4);
  DONE;
})
(define_insn "vmsumcud"
  [(set (match_operand:V1TI 0 "register_operand" "+v")
	(unspec:V1TI [(match_operand:V2DI 1 "register_operand" "v")
		      (match_operand:V2DI 2 "register_operand" "v")
		      (match_operand:V1TI 3 "register_operand" "v")]
		     UNSPEC_VMSUMCUD))]
  "TARGET_POWER10"
  "vmsumcud %0,%1,%2,%3"
  [(set_attr "type" "veccomplex")]
)
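
;; Usage sketch for vmsumcud, assuming the documented vec_msumc builtin:
;;
;;   #include <altivec.h>
;;
;;   /* Carry out of a[0]*b[0] + a[1]*b[1] + c, computed to 128 bits.  */
;;   vector unsigned __int128 carry (vector unsigned long long a,
;;                                   vector unsigned long long b,
;;                                   vector unsigned __int128 c)
;;   {
;;     return vec_msumc (a, b, c);
;;   }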