gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2018 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "memmodel.h"
  29 #include "predict.h"
  30 #include "tm_p.h"
  31 #include "expmed.h"
  32 #include "optabs.h"
  33 #include "emit-rtl.h"
  34 #include "recog.h"
  35 #include "diagnostic-core.h"
  36 #include "rtx-vector-builder.h"
  37
  38 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  39    is properly defined.  */
  40 #include "stor-layout.h"
  41 #include "except.h"
  42 #include "dojump.h"
  43 #include "explow.h"
  44 #include "expr.h"
  45 #include "optabs-tree.h"
  46 #include "libfuncs.h"
  47
  48 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  49                                    machine_mode *);
  50 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  51 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  52
  53 /* Debug facility for use in GDB.  */
  54 void debug_optab_libfuncs (void);
  55 \f
  56 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
  57    the result of operation CODE applied to OP0 (and OP1 if it is a binary
  58    operation).
  59
  60    If the last insn does not set TARGET, don't do anything, but return 1.
  61
  62    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
  63    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
  64    try again, ensuring that TARGET is not one of the operands.  */
  65
  66 static int
  67 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
  68 {
  69   rtx_insn *last_insn;
  70   rtx set;
  71   rtx note;
  72
  73   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
  74
  75   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
  76       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
  77       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
  78       && GET_RTX_CLASS (code) != RTX_COMPARE
  79       && GET_RTX_CLASS (code) != RTX_UNARY)
  80     return 1;
  81
  82   if (GET_CODE (target) == ZERO_EXTRACT)
  83     return 1;
  84
  85   for (last_insn = insns;
  86        NEXT_INSN (last_insn) != NULL_RTX;
  87        last_insn = NEXT_INSN (last_insn))
  88     ;
  89
  90   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
  91      a value changing in the insn, so the note would be invalid for CSE.  */
  92   if (reg_overlap_mentioned_p (target, op0)
  93       || (op1 && reg_overlap_mentioned_p (target, op1)))
  94     {
  95       if (MEM_P (target)
  96           && (rtx_equal_p (target, op0)
  97               || (op1 && rtx_equal_p (target, op1))))
  98         {
  99           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 100              over expanding it as temp = MEM op X, MEM = temp.  If the target
 101              supports MEM = MEM op X instructions, it is sometimes too hard
 102              to reconstruct that form later, especially if X is also a memory,
 103              and due to multiple occurrences of addresses the address might
 104              be forced into register unnecessarily.
 105              Note that not emitting the REG_EQUIV note might inhibit
 106              CSE in some cases.  */
 107           set = single_set (last_insn);
 108           if (set
 109               && GET_CODE (SET_SRC (set)) == code
 110               && MEM_P (SET_DEST (set))
 111               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 112                   || (op1 && rtx_equal_p (SET_DEST (set),
 113                                           XEXP (SET_SRC (set), 1)))))
 114             return 1;
 115         }
 116       return 0;
 117     }
 118
 119   set = set_for_reg_notes (last_insn);
 120   if (set == NULL_RTX)
 121     return 1;
 122
 123   if (! rtx_equal_p (SET_DEST (set), target)
 124       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 125       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 126           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 127     return 1;
 128
 129   if (GET_RTX_CLASS (code) == RTX_UNARY)
 130     switch (code)
 131       {
 132       case FFS:
 133       case CLZ:
 134       case CTZ:
 135       case CLRSB:
 136       case POPCOUNT:
 137       case PARITY:
 138       case BSWAP:
 139         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 140           {
 141             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 142             if (GET_MODE_UNIT_SIZE (GET_MODE (op0))
 143                 > GET_MODE_UNIT_SIZE (GET_MODE (target)))
 144               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 145                                          note, GET_MODE (op0));
 146             else
 147               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 148                                          note, GET_MODE (op0));
 149             break;
 150           }
 151         /* FALLTHRU */
 152       default:
 153         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 154         break;
 155       }
 156   else
 157     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 158
 159   set_unique_reg_note (last_insn, REG_EQUAL, note);
 160
 161   return 1;
 162 }
 163 \f
 164 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 165    for a widening operation would be.  In most cases this would be OP0, but if
 166    that's a constant it'll be VOIDmode, which isn't useful.  */
 167
 168 static machine_mode
 169 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 170 {
 171   machine_mode m0 = GET_MODE (op0);
 172   machine_mode m1 = GET_MODE (op1);
 173   machine_mode result;
 174
 175   if (m0 == VOIDmode && m1 == VOIDmode)
 176     return to_mode;
 177   else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
 178     result = m1;
 179   else
 180     result = m0;
 181
 182   if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
 183     return to_mode;
 184
 185   return result;
 186 }
 187 \f
 188 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 189    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 190    not actually do a sign-extend or zero-extend, but can leave the
 191    higher-order bits of the result rtx undefined, for example, in the case
 192    of logical operations, but not right shifts.  */
 193
 194 static rtx
 195 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 196                int unsignedp, int no_extend)
 197 {
 198   rtx result;
 199   scalar_int_mode int_mode;
 200
 201   /* If we don't have to extend and this is a constant, return it.  */
 202   if (no_extend && GET_MODE (op) == VOIDmode)
 203     return op;
 204
 205   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 206      extend since it will be more efficient to do so unless the signedness of
 207      a promoted object differs from our extension.  */
 208   if (! no_extend
 209       || !is_a <scalar_int_mode> (mode, &int_mode)
 210       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 211           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 212     return convert_modes (mode, oldmode, op, unsignedp);
 213
 214   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 215      SUBREG.  */
 216   if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
 217     return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));
 218
 219   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 220      part to OP.  */
 221
 222   result = gen_reg_rtx (int_mode);
 223   emit_clobber (result);
 224   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 225   return result;
 226 }
 227 \f
 228 /* Expand vector widening operations.
 229
 230    There are two different classes of operations handled here:
 231    1) Operations whose result is wider than all the arguments to the operation.
 232       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 233       In this case OP0 and optionally OP1 would be initialized,
 234       but WIDE_OP wouldn't (not relevant for this case).
 235    2) Operations whose result is of the same size as the last argument to the
 236       operation, but wider than all the other arguments to the operation.
 237       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 238       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 239
 240    E.g, when called to expand the following operations, this is how
 241    the arguments will be initialized:
 242                                 nops    OP0     OP1     WIDE_OP
 243    widening-sum                 2       oprnd0  -       oprnd1
 244    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 245    widening-mult                2       oprnd0  oprnd1  -
 246    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 247
 248 rtx
 249 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 250                            rtx target, int unsignedp)
 251 {
 252   struct expand_operand eops[4];
 253   tree oprnd0, oprnd1, oprnd2;
 254   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 255   optab widen_pattern_optab;
 256   enum insn_code icode;
 257   int nops = TREE_CODE_LENGTH (ops->code);
 258   int op;
 259
 260   oprnd0 = ops->op0;
 261   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 262   widen_pattern_optab =
 263     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 264   if (ops->code == WIDEN_MULT_PLUS_EXPR
 265       || ops->code == WIDEN_MULT_MINUS_EXPR)
 266     icode = find_widening_optab_handler (widen_pattern_optab,
 267                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 268                                          tmode0);
 269   else
 270     icode = optab_handler (widen_pattern_optab, tmode0);
 271   gcc_assert (icode != CODE_FOR_nothing);
 272
 273   if (nops >= 2)
 274     {
 275       oprnd1 = ops->op1;
 276       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 277     }
 278
 279   /* The last operand is of a wider mode than the rest of the operands.  */
 280   if (nops == 2)
 281     wmode = tmode1;
 282   else if (nops == 3)
 283     {
 284       gcc_assert (tmode1 == tmode0);
 285       gcc_assert (op1);
 286       oprnd2 = ops->op2;
 287       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 288     }
 289
 290   op = 0;
 291   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 292   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 293   if (op1)
 294     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 295   if (wide_op)
 296     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 297   expand_insn (icode, op, eops);
 298   return eops[0].value;
 299 }
 300
 301 /* Generate code to perform an operation specified by TERNARY_OPTAB
 302    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 303
 304    UNSIGNEDP is for the case where we have to widen the operands
 305    to perform the operation.  It says to use zero-extension.
 306
 307    If TARGET is nonzero, the value
 308    is generated there, if it is convenient to do so.
 309    In all cases an rtx is returned for the locus of the value;
 310    this may or may not be TARGET.  */
 311
 312 rtx
 313 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 314                    rtx op1, rtx op2, rtx target, int unsignedp)
 315 {
 316   struct expand_operand ops[4];
 317   enum insn_code icode = optab_handler (ternary_optab, mode);
 318
 319   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 320
 321   create_output_operand (&ops[0], target, mode);
 322   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 323   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 324   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 325   expand_insn (icode, 4, ops);
 326   return ops[0].value;
 327 }
 328
 329
 330 /* Like expand_binop, but return a constant rtx if the result can be
 331    calculated at compile time.  The arguments and return value are
 332    otherwise the same as for expand_binop.  */
 333
 334 rtx
 335 simplify_expand_binop (machine_mode mode, optab binoptab,
 336                        rtx op0, rtx op1, rtx target, int unsignedp,
 337                        enum optab_methods methods)
 338 {
 339   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 340     {
 341       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 342                                          mode, op0, op1);
 343       if (x)
 344         return x;
 345     }
 346
 347   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 348 }
 349
 350 /* Like simplify_expand_binop, but always put the result in TARGET.
 351    Return true if the expansion succeeded.  */
 352
 353 bool
 354 force_expand_binop (machine_mode mode, optab binoptab,
 355                     rtx op0, rtx op1, rtx target, int unsignedp,
 356                     enum optab_methods methods)
 357 {
 358   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 359                                  target, unsignedp, methods);
 360   if (x == 0)
 361     return false;
 362   if (x != target)
 363     emit_move_insn (target, x);
 364   return true;
 365 }
 366
 367 /* Create a new vector value in VMODE with all elements set to OP.  The
 368    mode of OP must be the element mode of VMODE.  If OP is a constant,
 369    then the return value will be a constant.  */
 370
 371 rtx
 372 expand_vector_broadcast (machine_mode vmode, rtx op)
 373 {
 374   int n;
 375   rtvec vec;
 376
 377   gcc_checking_assert (VECTOR_MODE_P (vmode));
 378
 379   if (valid_for_const_vector_p (vmode, op))
 380     return gen_const_vec_duplicate (vmode, op);
 381
 382   insn_code icode = optab_handler (vec_duplicate_optab, vmode);
 383   if (icode != CODE_FOR_nothing)
 384     {
 385       struct expand_operand ops[2];
 386       create_output_operand (&ops[0], NULL_RTX, vmode);
 387       create_input_operand (&ops[1], op, GET_MODE (op));
 388       expand_insn (icode, 2, ops);
 389       return ops[0].value;
 390     }
 391
 392   if (!GET_MODE_NUNITS (vmode).is_constant (&n))
 393     return NULL;
 394
 395   /* ??? If the target doesn't have a vec_init, then we have no easy way
 396      of performing this operation.  Most of this sort of generic support
 397      is hidden away in the vector lowering support in gimple.  */
 398   icode = convert_optab_handler (vec_init_optab, vmode,
 399                                  GET_MODE_INNER (vmode));
 400   if (icode == CODE_FOR_nothing)
 401     return NULL;
 402
 403   vec = rtvec_alloc (n);
 404   for (int i = 0; i < n; ++i)
 405     RTVEC_ELT (vec, i) = op;
 406   rtx ret = gen_reg_rtx (vmode);
 407   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 408
 409   return ret;
 410 }
 411
 412 /* This subroutine of expand_doubleword_shift handles the cases in which
 413    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 414    value are the same as for the parent routine, except that SUPERWORD_OP1
 415    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 416    INTO_TARGET may be null if the caller has decided to calculate it.  */
 417
 418 static bool
 419 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 420                         rtx outof_target, rtx into_target,
 421                         int unsignedp, enum optab_methods methods)
 422 {
 423   if (into_target != 0)
 424     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 425                              into_target, unsignedp, methods))
 426       return false;
 427
 428   if (outof_target != 0)
 429     {
 430       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 431          of the sign bit, otherwise we must fill it with zeros.  */
 432       if (binoptab != ashr_optab)
 433         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 434       else
 435         if (!force_expand_binop (word_mode, binoptab, outof_input,
 436                                  gen_int_shift_amount (word_mode,
 437                                                        BITS_PER_WORD - 1),
 438                                  outof_target, unsignedp, methods))
 439           return false;
 440     }
 441   return true;
 442 }
 443
 444 /* This subroutine of expand_doubleword_shift handles the cases in which
 445    the effective shift value is < BITS_PER_WORD.  The arguments and return
 446    value are the same as for the parent routine.  */
 447
 448 static bool
 449 expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
 450                       rtx outof_input, rtx into_input, rtx op1,
 451                       rtx outof_target, rtx into_target,
 452                       int unsignedp, enum optab_methods methods,
 453                       unsigned HOST_WIDE_INT shift_mask)
 454 {
 455   optab reverse_unsigned_shift, unsigned_shift;
 456   rtx tmp, carries;
 457
 458   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 459   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 460
 461   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 462      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 463      the opposite direction to BINOPTAB.  */
 464   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 465     {
 466       carries = outof_input;
 467       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 468                                             op1_mode), op1_mode);
 469       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 470                                    0, true, methods);
 471     }
 472   else
 473     {
 474       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 475          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 476          has unknown behavior.  Do a single shift first, then shift by the
 477          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 478          are truncated to the mode size.  */
 479       carries = expand_binop (word_mode, reverse_unsigned_shift,
 480                               outof_input, const1_rtx, 0, unsignedp, methods);
 481       if (shift_mask == BITS_PER_WORD - 1)
 482         {
 483           tmp = immed_wide_int_const
 484             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 485           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 486                                        0, true, methods);
 487         }
 488       else
 489         {
 490           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 491                                                 op1_mode), op1_mode);
 492           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 493                                        0, true, methods);
 494         }
 495     }
 496   if (tmp == 0 || carries == 0)
 497     return false;
 498   carries = expand_binop (word_mode, reverse_unsigned_shift,
 499                           carries, tmp, 0, unsignedp, methods);
 500   if (carries == 0)
 501     return false;
 502
 503   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 504      so the result can go directly into INTO_TARGET if convenient.  */
 505   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 506                       into_target, unsignedp, methods);
 507   if (tmp == 0)
 508     return false;
 509
 510   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 511   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 512                            into_target, unsignedp, methods))
 513     return false;
 514
 515   /* Use a standard word_mode shift for the out-of half.  */
 516   if (outof_target != 0)
 517     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 518                              outof_target, unsignedp, methods))
 519       return false;
 520
 521   return true;
 522 }
 523
 524
 525 /* Try implementing expand_doubleword_shift using conditional moves.
 526    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 527    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 528    are the shift counts to use in the former and latter case.  All other
 529    arguments are the same as the parent routine.  */
 530
 531 static bool
 532 expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
 533                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 534                                   rtx outof_input, rtx into_input,
 535                                   rtx subword_op1, rtx superword_op1,
 536                                   rtx outof_target, rtx into_target,
 537                                   int unsignedp, enum optab_methods methods,
 538                                   unsigned HOST_WIDE_INT shift_mask)
 539 {
 540   rtx outof_superword, into_superword;
 541
 542   /* Put the superword version of the output into OUTOF_SUPERWORD and
 543      INTO_SUPERWORD.  */
 544   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 545   if (outof_target != 0 && subword_op1 == superword_op1)
 546     {
 547       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 548          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 549       into_superword = outof_target;
 550       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 551                                    outof_superword, 0, unsignedp, methods))
 552         return false;
 553     }
 554   else
 555     {
 556       into_superword = gen_reg_rtx (word_mode);
 557       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 558                                    outof_superword, into_superword,
 559                                    unsignedp, methods))
 560         return false;
 561     }
 562
 563   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 564   if (!expand_subword_shift (op1_mode, binoptab,
 565                              outof_input, into_input, subword_op1,
 566                              outof_target, into_target,
 567                              unsignedp, methods, shift_mask))
 568     return false;
 569
 570   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 571      might be the current value of OUTOF_TARGET.  */
 572   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 573                               into_target, into_superword, word_mode, false))
 574     return false;
 575
 576   if (outof_target != 0)
 577     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 578                                 outof_target, outof_superword,
 579                                 word_mode, false))
 580       return false;
 581
 582   return true;
 583 }
 584
 585 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 586    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 587    input operand; the shift moves bits in the direction OUTOF_INPUT->
 588    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 589    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 590    If OP1 is constant, it will have been truncated as appropriate
 591    and is known to be nonzero.
 592
 593    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 594    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 595    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 596
 597    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 598    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 599    fill with zeros or sign bits as appropriate.
 600
 601    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 602    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 603    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 604    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 605    are undefined.
 606
 607    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
 608    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
 609    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
 610    function wants to calculate it itself.
 611
 612    Return true if the shift could be successfully synthesized.  */
 613
 614 static bool
 615 expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
 616                          rtx outof_input, rtx into_input, rtx op1,
 617                          rtx outof_target, rtx into_target,
 618                          int unsignedp, enum optab_methods methods,
 619                          unsigned HOST_WIDE_INT shift_mask)
 620 {
 621   rtx superword_op1, tmp, cmp1, cmp2;
 622   enum rtx_code cmp_code;
 623
 624   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
 625      fill the result with sign or zero bits as appropriate.  If so, the value
 626      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
 627      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
 628      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
 629
 630      This isn't worthwhile for constant shifts since the optimizers will
 631      cope better with in-range shift counts.  */
 632   if (shift_mask >= BITS_PER_WORD
 633       && outof_target != 0
 634       && !CONSTANT_P (op1))
 635     {
 636       if (!expand_doubleword_shift (op1_mode, binoptab,
 637                                     outof_input, into_input, op1,
 638                                     0, into_target,
 639                                     unsignedp, methods, shift_mask))
 640         return false;
 641       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 642                                outof_target, unsignedp, methods))
 643         return false;
 644       return true;
 645     }
 646
 647   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
 648      is true when the effective shift value is less than BITS_PER_WORD.
 649      Set SUPERWORD_OP1 to the shift count that should be used to shift
 650      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
 651   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
 652   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
 653     {
 654       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
 655          is a subword shift count.  */
 656       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
 657                                     0, true, methods);
 658       cmp2 = CONST0_RTX (op1_mode);
 659       cmp_code = EQ;
 660       superword_op1 = op1;
 661     }
 662   else
 663     {
 664       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
 665       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
 666                                     0, true, methods);
 667       cmp2 = CONST0_RTX (op1_mode);
 668       cmp_code = LT;
 669       superword_op1 = cmp1;
 670     }
 671   if (cmp1 == 0)
 672     return false;
 673
 674   /* If we can compute the condition at compile time, pick the
 675      appropriate subroutine.  */
 676   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
 677   if (tmp != 0 && CONST_INT_P (tmp))
 678     {
 679       if (tmp == const0_rtx)
 680         return expand_superword_shift (binoptab, outof_input, superword_op1,
 681                                        outof_target, into_target,
 682                                        unsignedp, methods);
 683       else
 684         return expand_subword_shift (op1_mode, binoptab,
 685                                      outof_input, into_input, op1,
 686                                      outof_target, into_target,
 687                                      unsignedp, methods, shift_mask);
 688     }
 689
 690   /* Try using conditional moves to generate straight-line code.  */
 691   if (HAVE_conditional_move)
 692     {
 693       rtx_insn *start = get_last_insn ();
 694       if (expand_doubleword_shift_condmove (op1_mode, binoptab,
 695                                             cmp_code, cmp1, cmp2,
 696                                             outof_input, into_input,
 697                                             op1, superword_op1,
 698                                             outof_target, into_target,
 699                                             unsignedp, methods, shift_mask))
 700         return true;
 701       delete_insns_since (start);
 702     }
 703
 704   /* As a last resort, use branches to select the correct alternative.  */
 705   rtx_code_label *subword_label = gen_label_rtx ();
 706   rtx_code_label *done_label = gen_label_rtx ();
 707
 708   NO_DEFER_POP;
 709   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
 710                            0, 0, subword_label,
 711                            profile_probability::uninitialized ());
 712   OK_DEFER_POP;
 713
 714   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 715                                outof_target, into_target,
 716                                unsignedp, methods))
 717     return false;
 718
 719   emit_jump_insn (targetm.gen_jump (done_label));
 720   emit_barrier ();
 721   emit_label (subword_label);
 722
 723   if (!expand_subword_shift (op1_mode, binoptab,
 724                              outof_input, into_input, op1,
 725                              outof_target, into_target,
 726                              unsignedp, methods, shift_mask))
 727     return false;
 728
 729   emit_label (done_label);
 730   return true;
 731 }
 732 \f
 733 /* Subroutine of expand_binop.  Perform a double word multiplication of
 734    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
 735    as the target's word_mode.  This function return NULL_RTX if anything
 736    goes wrong, in which case it may have already emitted instructions
 737    which need to be deleted.
 738
 739    If we want to multiply two two-word values and have normal and widening
 740    multiplies of single-word values, we can do this with three smaller
 741    multiplications.
 742
 743    The multiplication proceeds as follows:
 744                                  _______________________
 745                                 [__op0_high_|__op0_low__]
 746                                  _______________________
 747         *                       [__op1_high_|__op1_low__]
 748         _______________________________________________
 749                                  _______________________
 750     (1)                         [__op0_low__*__op1_low__]
 751                      _______________________
 752     (2a)            [__op0_low__*__op1_high_]
 753                      _______________________
 754     (2b)            [__op0_high_*__op1_low__]
 755          _______________________
 756     (3) [__op0_high_*__op1_high_]
 757
 758
 759   This gives a 4-word result.  Since we are only interested in the
 760   lower 2 words, partial result (3) and the upper words of (2a) and
 761   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
 762   calculated using non-widening multiplication.
 763
 764   (1), however, needs to be calculated with an unsigned widening
 765   multiplication.  If this operation is not directly supported we
 766   try using a signed widening multiplication and adjust the result.
 767   This adjustment works as follows:
 768
 769       If both operands are positive then no adjustment is needed.
 770
 771       If the operands have different signs, for example op0_low < 0 and
 772       op1_low >= 0, the instruction treats the most significant bit of
 773       op0_low as a sign bit instead of a bit with significance
 774       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
 775       with 2**BITS_PER_WORD - op0_low, and two's complements the
 776       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
 777       the result.
 778
 779       Similarly, if both operands are negative, we need to add
 780       (op0_low + op1_low) * 2**BITS_PER_WORD.
 781
 782       We use a trick to adjust quickly.  We logically shift op0_low right
 783       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
 784       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
 785       logical shift exists, we do an arithmetic right shift and subtract
 786       the 0 or -1.  */
 787
 788 static rtx
 789 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
 790                        bool umulp, enum optab_methods methods)
 791 {
 792   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
 793   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
 794   rtx wordm1 = (umulp ? NULL_RTX
 795                 : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
 796   rtx product, adjust, product_high, temp;
 797
 798   rtx op0_high = operand_subword_force (op0, high, mode);
 799   rtx op0_low = operand_subword_force (op0, low, mode);
 800   rtx op1_high = operand_subword_force (op1, high, mode);
 801   rtx op1_low = operand_subword_force (op1, low, mode);
 802
 803   /* If we're using an unsigned multiply to directly compute the product
 804      of the low-order words of the operands and perform any required
 805      adjustments of the operands, we begin by trying two more multiplications
 806      and then computing the appropriate sum.
 807
 808      We have checked above that the required addition is provided.
 809      Full-word addition will normally always succeed, especially if
 810      it is provided at all, so we don't worry about its failure.  The
 811      multiplication may well fail, however, so we do handle that.  */
 812
 813   if (!umulp)
 814     {
 815       /* ??? This could be done with emit_store_flag where available.  */
 816       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
 817                            NULL_RTX, 1, methods);
 818       if (temp)
 819         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
 820                                  NULL_RTX, 0, OPTAB_DIRECT);
 821       else
 822         {
 823           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
 824                                NULL_RTX, 0, methods);
 825           if (!temp)
 826             return NULL_RTX;
 827           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
 828                                    NULL_RTX, 0, OPTAB_DIRECT);
 829         }
 830
 831       if (!op0_high)
 832         return NULL_RTX;
 833     }
 834
 835   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
 836                          NULL_RTX, 0, OPTAB_DIRECT);
 837   if (!adjust)
 838     return NULL_RTX;
 839
 840   /* OP0_HIGH should now be dead.  */
 841
 842   if (!umulp)
 843     {
 844       /* ??? This could be done with emit_store_flag where available.  */
 845       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
 846                            NULL_RTX, 1, methods);
 847       if (temp)
 848         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
 849                                  NULL_RTX, 0, OPTAB_DIRECT);
 850       else
 851         {
 852           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
 853                                NULL_RTX, 0, methods);
 854           if (!temp)
 855             return NULL_RTX;
 856           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
 857                                    NULL_RTX, 0, OPTAB_DIRECT);
 858         }
 859
 860       if (!op1_high)
 861         return NULL_RTX;
 862     }
 863
 864   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
 865                        NULL_RTX, 0, OPTAB_DIRECT);
 866   if (!temp)
 867     return NULL_RTX;
 868
 869   /* OP1_HIGH should now be dead.  */
 870
 871   adjust = expand_binop (word_mode, add_optab, adjust, temp,
 872                          NULL_RTX, 0, OPTAB_DIRECT);
 873
 874   if (target && !REG_P (target))
 875     target = NULL_RTX;
 876
 877   /* *_widen_optab needs to determine operand mode, make sure at least
 878      one operand has non-VOID mode.  */
 879   if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
 880     op0_low = force_reg (word_mode, op0_low);
 881
 882   if (umulp)
 883     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
 884                             target, 1, OPTAB_DIRECT);
 885   else
 886     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
 887                             target, 1, OPTAB_DIRECT);
 888
 889   if (!product)
 890     return NULL_RTX;
 891
 892   product_high = operand_subword (product, high, 1, mode);
 893   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
 894                          NULL_RTX, 0, OPTAB_DIRECT);
 895   emit_move_insn (product_high, adjust);
 896   return product;
 897 }
 898 \f
 899 /* Wrapper around expand_binop which takes an rtx code to specify
 900    the operation to perform, not an optab pointer.  All other
 901    arguments are the same.  */
 902 rtx
 903 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
 904                      rtx op1, rtx target, int unsignedp,
 905                      enum optab_methods methods)
 906 {
 907   optab binop = code_to_optab (code);
 908   gcc_assert (binop);
 909
 910   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
 911 }
 912
 913 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
 914    binop.  Order them according to commutative_operand_precedence and, if
 915    possible, try to put TARGET or a pseudo first.  */
 916 static bool
 917 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
 918 {
 919   int op0_prec = commutative_operand_precedence (op0);
 920   int op1_prec = commutative_operand_precedence (op1);
 921
 922   if (op0_prec < op1_prec)
 923     return true;
 924
 925   if (op0_prec > op1_prec)
 926     return false;
 927
 928   /* With equal precedence, both orders are ok, but it is better if the
 929      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
 930   if (target == 0 || REG_P (target))
 931     return (REG_P (op1) && !REG_P (op0)) || target == op1;
 932   else
 933     return rtx_equal_p (op1, target);
 934 }
 935
 936 /* Return true if BINOPTAB implements a shift operation.  */
 937
 938 static bool
 939 shift_optab_p (optab binoptab)
 940 {
 941   switch (optab_to_code (binoptab))
 942     {
 943     case ASHIFT:
 944     case SS_ASHIFT:
 945     case US_ASHIFT:
 946     case ASHIFTRT:
 947     case LSHIFTRT:
 948     case ROTATE:
 949     case ROTATERT:
 950       return true;
 951
 952     default:
 953       return false;
 954     }
 955 }
 956
 957 /* Return true if BINOPTAB implements a commutative binary operation.  */
 958
 959 static bool
 960 commutative_optab_p (optab binoptab)
 961 {
 962   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
 963           || binoptab == smul_widen_optab
 964           || binoptab == umul_widen_optab
 965           || binoptab == smul_highpart_optab
 966           || binoptab == umul_highpart_optab);
 967 }
 968
 969 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
 970    optimizing, and if the operand is a constant that costs more than
 971    1 instruction, force the constant into a register and return that
 972    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
 973
 974 static rtx
 975 avoid_expensive_constant (machine_mode mode, optab binoptab,
 976                           int opn, rtx x, bool unsignedp)
 977 {
 978   bool speed = optimize_insn_for_speed_p ();
 979
 980   if (mode != VOIDmode
 981       && optimize
 982       && CONSTANT_P (x)
 983       && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
 984           > set_src_cost (x, mode, speed)))
 985     {
 986       if (CONST_INT_P (x))
 987         {
 988           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
 989           if (intval != INTVAL (x))
 990             x = GEN_INT (intval);
 991         }
 992       else
 993         x = convert_modes (mode, VOIDmode, x, unsignedp);
 994       x = force_reg (mode, x);
 995     }
 996   return x;
 997 }
 998
 999 /* Helper function for expand_binop: handle the case where there
1000    is an insn ICODE that directly implements the indicated operation.
1001    Returns null if this is not possible.  */
1002 static rtx
1003 expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
1004                        rtx op0, rtx op1,
1005                        rtx target, int unsignedp, enum optab_methods methods,
1006                        rtx_insn *last)
1007 {
1008   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1009   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1010   machine_mode mode0, mode1, tmp_mode;
1011   struct expand_operand ops[3];
1012   bool commutative_p;
1013   rtx_insn *pat;
1014   rtx xop0 = op0, xop1 = op1;
1015   bool canonicalize_op1 = false;
1016
1017   /* If it is a commutative operator and the modes would match
1018      if we would swap the operands, we can save the conversions.  */
1019   commutative_p = commutative_optab_p (binoptab);
1020   if (commutative_p
1021       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1022       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1023     std::swap (xop0, xop1);
1024
1025   /* If we are optimizing, force expensive constants into a register.  */
1026   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1027   if (!shift_optab_p (binoptab))
1028     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1029   else
1030     /* Shifts and rotates often use a different mode for op1 from op0;
1031        for VOIDmode constants we don't know the mode, so force it
1032        to be canonicalized using convert_modes.  */
1033     canonicalize_op1 = true;
1034
1035   /* In case the insn wants input operands in modes different from
1036      those of the actual operands, convert the operands.  It would
1037      seem that we don't need to convert CONST_INTs, but we do, so
1038      that they're properly zero-extended, sign-extended or truncated
1039      for their mode.  */
1040
1041   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1042   if (xmode0 != VOIDmode && xmode0 != mode0)
1043     {
1044       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1045       mode0 = xmode0;
1046     }
1047
1048   mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
1049            ? GET_MODE (xop1) : mode);
1050   if (xmode1 != VOIDmode && xmode1 != mode1)
1051     {
1052       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1053       mode1 = xmode1;
1054     }
1055
1056   /* If operation is commutative,
1057      try to make the first operand a register.
1058      Even better, try to make it the same as the target.
1059      Also try to make the last operand a constant.  */
1060   if (commutative_p
1061       && swap_commutative_operands_with_target (target, xop0, xop1))
1062     std::swap (xop0, xop1);
1063
1064   /* Now, if insn's predicates don't allow our operands, put them into
1065      pseudo regs.  */
1066
1067   if (binoptab == vec_pack_trunc_optab
1068       || binoptab == vec_pack_usat_optab
1069       || binoptab == vec_pack_ssat_optab
1070       || binoptab == vec_pack_ufix_trunc_optab
1071       || binoptab == vec_pack_sfix_trunc_optab)
1072     {
1073       /* The mode of the result is different then the mode of the
1074          arguments.  */
1075       tmp_mode = insn_data[(int) icode].operand[0].mode;
1076       if (VECTOR_MODE_P (mode)
1077           && maybe_ne (GET_MODE_NUNITS (tmp_mode), 2 * GET_MODE_NUNITS (mode)))
1078         {
1079           delete_insns_since (last);
1080           return NULL_RTX;
1081         }
1082     }
1083   else
1084     tmp_mode = mode;
1085
1086   create_output_operand (&ops[0], target, tmp_mode);
1087   create_input_operand (&ops[1], xop0, mode0);
1088   create_input_operand (&ops[2], xop1, mode1);
1089   pat = maybe_gen_insn (icode, 3, ops);
1090   if (pat)
1091     {
1092       /* If PAT is composed of more than one insn, try to add an appropriate
1093          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1094          operand, call expand_binop again, this time without a target.  */
1095       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1096           && ! add_equal_note (pat, ops[0].value,
1097                                optab_to_code (binoptab),
1098                                ops[1].value, ops[2].value))
1099         {
1100           delete_insns_since (last);
1101           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1102                                unsignedp, methods);
1103         }
1104
1105       emit_insn (pat);
1106       return ops[0].value;
1107     }
1108   delete_insns_since (last);
1109   return NULL_RTX;
1110 }
1111
1112 /* Generate code to perform an operation specified by BINOPTAB
1113    on operands OP0 and OP1, with result having machine-mode MODE.
1114
1115    UNSIGNEDP is for the case where we have to widen the operands
1116    to perform the operation.  It says to use zero-extension.
1117
1118    If TARGET is nonzero, the value
1119    is generated there, if it is convenient to do so.
1120    In all cases an rtx is returned for the locus of the value;
1121    this may or may not be TARGET.  */
1122
1123 rtx
1124 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1125               rtx target, int unsignedp, enum optab_methods methods)
1126 {
1127   enum optab_methods next_methods
1128     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1129        ? OPTAB_WIDEN : methods);
1130   enum mode_class mclass;
1131   enum insn_code icode;
1132   machine_mode wider_mode;
1133   scalar_int_mode int_mode;
1134   rtx libfunc;
1135   rtx temp;
1136   rtx_insn *entry_last = get_last_insn ();
1137   rtx_insn *last;
1138
1139   mclass = GET_MODE_CLASS (mode);
1140
1141   /* If subtracting an integer constant, convert this into an addition of
1142      the negated constant.  */
1143
1144   if (binoptab == sub_optab && CONST_INT_P (op1))
1145     {
1146       op1 = negate_rtx (mode, op1);
1147       binoptab = add_optab;
1148     }
1149   /* For shifts, constant invalid op1 might be expanded from different
1150      mode than MODE.  As those are invalid, force them to a register
1151      to avoid further problems during expansion.  */
1152   else if (CONST_INT_P (op1)
1153            && shift_optab_p (binoptab)
1154            && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
1155     {
1156       op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
1157       op1 = force_reg (GET_MODE_INNER (mode), op1);
1158     }
1159
1160   /* Record where to delete back to if we backtrack.  */
1161   last = get_last_insn ();
1162
1163   /* If we can do it with a three-operand insn, do so.  */
1164
1165   if (methods != OPTAB_MUST_WIDEN)
1166     {
1167       if (convert_optab_p (binoptab))
1168         {
1169           machine_mode from_mode = widened_mode (mode, op0, op1);
1170           icode = find_widening_optab_handler (binoptab, mode, from_mode);
1171         }
1172       else
1173         icode = optab_handler (binoptab, mode);
1174       if (icode != CODE_FOR_nothing)
1175         {
1176           temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
1177                                         target, unsignedp, methods, last);
1178           if (temp)
1179             return temp;
1180         }
1181     }
1182
1183   /* If we were trying to rotate, and that didn't work, try rotating
1184      the other direction before falling back to shifts and bitwise-or.  */
1185   if (((binoptab == rotl_optab
1186         && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
1187        || (binoptab == rotr_optab
1188            && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
1189       && is_int_mode (mode, &int_mode))
1190     {
1191       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1192       rtx newop1;
1193       unsigned int bits = GET_MODE_PRECISION (int_mode);
1194
1195       if (CONST_INT_P (op1))
1196         newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
1197       else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
1198         newop1 = negate_rtx (GET_MODE (op1), op1);
1199       else
1200         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1201                                gen_int_mode (bits, GET_MODE (op1)), op1,
1202                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1203
1204       temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
1205                                     target, unsignedp, methods, last);
1206       if (temp)
1207         return temp;
1208     }
1209
1210   /* If this is a multiply, see if we can do a widening operation that
1211      takes operands of this mode and makes a wider mode.  */
1212
1213   if (binoptab == smul_optab
1214       && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
1215       && (convert_optab_handler ((unsignedp
1216                                   ? umul_widen_optab
1217                                   : smul_widen_optab),
1218                                  wider_mode, mode) != CODE_FOR_nothing))
1219     {
1220       /* *_widen_optab needs to determine operand mode, make sure at least
1221          one operand has non-VOID mode.  */
1222       if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
1223         op0 = force_reg (mode, op0);
1224       temp = expand_binop (wider_mode,
1225                            unsignedp ? umul_widen_optab : smul_widen_optab,
1226                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1227
1228       if (temp != 0)
1229         {
1230           if (GET_MODE_CLASS (mode) == MODE_INT
1231               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1232             return gen_lowpart (mode, temp);
1233           else
1234             return convert_to_mode (mode, temp, unsignedp);
1235         }
1236     }
1237
1238   /* If this is a vector shift by a scalar, see if we can do a vector
1239      shift by a vector.  If so, broadcast the scalar into a vector.  */
1240   if (mclass == MODE_VECTOR_INT)
1241     {
1242       optab otheroptab = unknown_optab;
1243
1244       if (binoptab == ashl_optab)
1245         otheroptab = vashl_optab;
1246       else if (binoptab == ashr_optab)
1247         otheroptab = vashr_optab;
1248       else if (binoptab == lshr_optab)
1249         otheroptab = vlshr_optab;
1250       else if (binoptab == rotl_optab)
1251         otheroptab = vrotl_optab;
1252       else if (binoptab == rotr_optab)
1253         otheroptab = vrotr_optab;
1254
1255       if (otheroptab
1256           && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
1257         {
1258           /* The scalar may have been extended to be too wide.  Truncate
1259              it back to the proper size to fit in the broadcast vector.  */
1260           scalar_mode inner_mode = GET_MODE_INNER (mode);
1261           if (!CONST_INT_P (op1)
1262               && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
1263                   > GET_MODE_BITSIZE (inner_mode)))
1264             op1 = force_reg (inner_mode,
1265                              simplify_gen_unary (TRUNCATE, inner_mode, op1,
1266                                                  GET_MODE (op1)));
1267           rtx vop1 = expand_vector_broadcast (mode, op1);
1268           if (vop1)
1269             {
1270               temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
1271                                             target, unsignedp, methods, last);
1272               if (temp)
1273                 return temp;
1274             }
1275         }
1276     }
1277
1278   /* Look for a wider mode of the same class for which we think we
1279      can open-code the operation.  Check for a widening multiply at the
1280      wider mode as well.  */
1281
1282   if (CLASS_HAS_WIDER_MODES_P (mclass)
1283       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1284     FOR_EACH_WIDER_MODE (wider_mode, mode)
1285       {
1286         machine_mode next_mode;
1287         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1288             || (binoptab == smul_optab
1289                 && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
1290                 && (find_widening_optab_handler ((unsignedp
1291                                                   ? umul_widen_optab
1292                                                   : smul_widen_optab),
1293                                                  next_mode, mode)
1294                     != CODE_FOR_nothing)))
1295           {
1296             rtx xop0 = op0, xop1 = op1;
1297             int no_extend = 0;
1298
1299             /* For certain integer operations, we need not actually extend
1300                the narrow operands, as long as we will truncate
1301                the results to the same narrowness.  */
1302
1303             if ((binoptab == ior_optab || binoptab == and_optab
1304                  || binoptab == xor_optab
1305                  || binoptab == add_optab || binoptab == sub_optab
1306                  || binoptab == smul_optab || binoptab == ashl_optab)
1307                 && mclass == MODE_INT)
1308               {
1309                 no_extend = 1;
1310                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1311                                                  xop0, unsignedp);
1312                 if (binoptab != ashl_optab)
1313                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1314                                                    xop1, unsignedp);
1315               }
1316
1317             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1318
1319             /* The second operand of a shift must always be extended.  */
1320             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1321                                   no_extend && binoptab != ashl_optab);
1322
1323             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1324                                  unsignedp, OPTAB_DIRECT);
1325             if (temp)
1326               {
1327                 if (mclass != MODE_INT
1328                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1329                   {
1330                     if (target == 0)
1331                       target = gen_reg_rtx (mode);
1332                     convert_move (target, temp, 0);
1333                     return target;
1334                   }
1335                 else
1336                   return gen_lowpart (mode, temp);
1337               }
1338             else
1339               delete_insns_since (last);
1340           }
1341       }
1342
1343   /* If operation is commutative,
1344      try to make the first operand a register.
1345      Even better, try to make it the same as the target.
1346      Also try to make the last operand a constant.  */
1347   if (commutative_optab_p (binoptab)
1348       && swap_commutative_operands_with_target (target, op0, op1))
1349     std::swap (op0, op1);
1350
1351   /* These can be done a word at a time.  */
1352   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1353       && is_int_mode (mode, &int_mode)
1354       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
1355       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1356     {
1357       int i;
1358       rtx_insn *insns;
1359
1360       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1361          won't be accurate, so use a new target.  */
1362       if (target == 0
1363           || target == op0
1364           || target == op1
1365           || !valid_multiword_target_p (target))
1366         target = gen_reg_rtx (int_mode);
1367
1368       start_sequence ();
1369
1370       /* Do the actual arithmetic.  */
1371       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
1372         {
1373           rtx target_piece = operand_subword (target, i, 1, int_mode);
1374           rtx x = expand_binop (word_mode, binoptab,
1375                                 operand_subword_force (op0, i, int_mode),
1376                                 operand_subword_force (op1, i, int_mode),
1377                                 target_piece, unsignedp, next_methods);
1378
1379           if (x == 0)
1380             break;
1381
1382           if (target_piece != x)
1383             emit_move_insn (target_piece, x);
1384         }
1385
1386       insns = get_insns ();
1387       end_sequence ();
1388
1389       if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
1390         {
1391           emit_insn (insns);
1392           return target;
1393         }
1394     }
1395
1396   /* Synthesize double word shifts from single word shifts.  */
1397   if ((binoptab == lshr_optab || binoptab == ashl_optab
1398        || binoptab == ashr_optab)
1399       && is_int_mode (mode, &int_mode)
1400       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1401       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1402       && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
1403       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1404       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1405       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1406     {
1407       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1408       scalar_int_mode op1_mode;
1409
1410       double_shift_mask = targetm.shift_truncation_mask (int_mode);
1411       shift_mask = targetm.shift_truncation_mask (word_mode);
1412       op1_mode = (GET_MODE (op1) != VOIDmode
1413                   ? as_a <scalar_int_mode> (GET_MODE (op1))
1414                   : word_mode);
1415
1416       /* Apply the truncation to constant shifts.  */
1417       if (double_shift_mask > 0 && CONST_INT_P (op1))
1418         op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);
1419
1420       if (op1 == CONST0_RTX (op1_mode))
1421         return op0;
1422
1423       /* Make sure that this is a combination that expand_doubleword_shift
1424          can handle.  See the comments there for details.  */
1425       if (double_shift_mask == 0
1426           || (shift_mask == BITS_PER_WORD - 1
1427               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1428         {
1429           rtx_insn *insns;
1430           rtx into_target, outof_target;
1431           rtx into_input, outof_input;
1432           int left_shift, outof_word;
1433
1434           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1435              won't be accurate, so use a new target.  */
1436           if (target == 0
1437               || target == op0
1438               || target == op1
1439               || !valid_multiword_target_p (target))
1440             target = gen_reg_rtx (int_mode);
1441
1442           start_sequence ();
1443
1444           /* OUTOF_* is the word we are shifting bits away from, and
1445              INTO_* is the word that we are shifting bits towards, thus
1446              they differ depending on the direction of the shift and
1447              WORDS_BIG_ENDIAN.  */
1448
1449           left_shift = binoptab == ashl_optab;
1450           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1451
1452           outof_target = operand_subword (target, outof_word, 1, int_mode);
1453           into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1454
1455           outof_input = operand_subword_force (op0, outof_word, int_mode);
1456           into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1457
1458           if (expand_doubleword_shift (op1_mode, binoptab,
1459                                        outof_input, into_input, op1,
1460                                        outof_target, into_target,
1461                                        unsignedp, next_methods, shift_mask))
1462             {
1463               insns = get_insns ();
1464               end_sequence ();
1465
1466               emit_insn (insns);
1467               return target;
1468             }
1469           end_sequence ();
1470         }
1471     }
1472
1473   /* Synthesize double word rotates from single word shifts.  */
1474   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1475       && is_int_mode (mode, &int_mode)
1476       && CONST_INT_P (op1)
1477       && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
1478       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1479       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1480     {
1481       rtx_insn *insns;
1482       rtx into_target, outof_target;
1483       rtx into_input, outof_input;
1484       rtx inter;
1485       int shift_count, left_shift, outof_word;
1486
1487       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1488          won't be accurate, so use a new target. Do this also if target is not
1489          a REG, first because having a register instead may open optimization
1490          opportunities, and second because if target and op0 happen to be MEMs
1491          designating the same location, we would risk clobbering it too early
1492          in the code sequence we generate below.  */
1493       if (target == 0
1494           || target == op0
1495           || target == op1
1496           || !REG_P (target)
1497           || !valid_multiword_target_p (target))
1498         target = gen_reg_rtx (int_mode);
1499
1500       start_sequence ();
1501
1502       shift_count = INTVAL (op1);
1503
1504       /* OUTOF_* is the word we are shifting bits away from, and
1505          INTO_* is the word that we are shifting bits towards, thus
1506          they differ depending on the direction of the shift and
1507          WORDS_BIG_ENDIAN.  */
1508
1509       left_shift = (binoptab == rotl_optab);
1510       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1511
1512       outof_target = operand_subword (target, outof_word, 1, int_mode);
1513       into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1514
1515       outof_input = operand_subword_force (op0, outof_word, int_mode);
1516       into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1517
1518       if (shift_count == BITS_PER_WORD)
1519         {
1520           /* This is just a word swap.  */
1521           emit_move_insn (outof_target, into_input);
1522           emit_move_insn (into_target, outof_input);
1523           inter = const0_rtx;
1524         }
1525       else
1526         {
1527           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1528           HOST_WIDE_INT first_shift_count, second_shift_count;
1529           optab reverse_unsigned_shift, unsigned_shift;
1530
1531           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1532                                     ? lshr_optab : ashl_optab);
1533
1534           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1535                             ? ashl_optab : lshr_optab);
1536
1537           if (shift_count > BITS_PER_WORD)
1538             {
1539               first_shift_count = shift_count - BITS_PER_WORD;
1540               second_shift_count = 2 * BITS_PER_WORD - shift_count;
1541             }
1542           else
1543             {
1544               first_shift_count = BITS_PER_WORD - shift_count;
1545               second_shift_count = shift_count;
1546             }
1547           rtx first_shift_count_rtx
1548             = gen_int_shift_amount (word_mode, first_shift_count);
1549           rtx second_shift_count_rtx
1550             = gen_int_shift_amount (word_mode, second_shift_count);
1551
1552           into_temp1 = expand_binop (word_mode, unsigned_shift,
1553                                      outof_input, first_shift_count_rtx,
1554                                      NULL_RTX, unsignedp, next_methods);
1555           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1556                                      into_input, second_shift_count_rtx,
1557                                      NULL_RTX, unsignedp, next_methods);
1558
1559           if (into_temp1 != 0 && into_temp2 != 0)
1560             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1561                                   into_target, unsignedp, next_methods);
1562           else
1563             inter = 0;
1564
1565           if (inter != 0 && inter != into_target)
1566             emit_move_insn (into_target, inter);
1567
1568           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1569                                       into_input, first_shift_count_rtx,
1570                                       NULL_RTX, unsignedp, next_methods);
1571           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1572                                       outof_input, second_shift_count_rtx,
1573                                       NULL_RTX, unsignedp, next_methods);
1574
1575           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1576             inter = expand_binop (word_mode, ior_optab,
1577                                   outof_temp1, outof_temp2,
1578                                   outof_target, unsignedp, next_methods);
1579
1580           if (inter != 0 && inter != outof_target)
1581             emit_move_insn (outof_target, inter);
1582         }
1583
1584       insns = get_insns ();
1585       end_sequence ();
1586
1587       if (inter != 0)
1588         {
1589           emit_insn (insns);
1590           return target;
1591         }
1592     }
1593
1594   /* These can be done a word at a time by propagating carries.  */
1595   if ((binoptab == add_optab || binoptab == sub_optab)
1596       && is_int_mode (mode, &int_mode)
1597       && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
1598       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1599     {
1600       unsigned int i;
1601       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1602       const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
1603       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1604       rtx xop0, xop1, xtarget;
1605
1606       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1607          value is one of those, use it.  Otherwise, use 1 since it is the
1608          one easiest to get.  */
1609 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1610       int normalizep = STORE_FLAG_VALUE;
1611 #else
1612       int normalizep = 1;
1613 #endif
1614
1615       /* Prepare the operands.  */
1616       xop0 = force_reg (int_mode, op0);
1617       xop1 = force_reg (int_mode, op1);
1618
1619       xtarget = gen_reg_rtx (int_mode);
1620
1621       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1622         target = xtarget;
1623
1624       /* Indicate for flow that the entire target reg is being set.  */
1625       if (REG_P (target))
1626         emit_clobber (xtarget);
1627
1628       /* Do the actual arithmetic.  */
1629       for (i = 0; i < nwords; i++)
1630         {
1631           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1632           rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
1633           rtx op0_piece = operand_subword_force (xop0, index, int_mode);
1634           rtx op1_piece = operand_subword_force (xop1, index, int_mode);
1635           rtx x;
1636
1637           /* Main add/subtract of the input operands.  */
1638           x = expand_binop (word_mode, binoptab,
1639                             op0_piece, op1_piece,
1640                             target_piece, unsignedp, next_methods);
1641           if (x == 0)
1642             break;
1643
1644           if (i + 1 < nwords)
1645             {
1646               /* Store carry from main add/subtract.  */
1647               carry_out = gen_reg_rtx (word_mode);
1648               carry_out = emit_store_flag_force (carry_out,
1649                                                  (binoptab == add_optab
1650                                                   ? LT : GT),
1651                                                  x, op0_piece,
1652                                                  word_mode, 1, normalizep);
1653             }
1654
1655           if (i > 0)
1656             {
1657               rtx newx;
1658
1659               /* Add/subtract previous carry to main result.  */
1660               newx = expand_binop (word_mode,
1661                                    normalizep == 1 ? binoptab : otheroptab,
1662                                    x, carry_in,
1663                                    NULL_RTX, 1, next_methods);
1664
1665               if (i + 1 < nwords)
1666                 {
1667                   /* Get out carry from adding/subtracting carry in.  */
1668                   rtx carry_tmp = gen_reg_rtx (word_mode);
1669                   carry_tmp = emit_store_flag_force (carry_tmp,
1670                                                      (binoptab == add_optab
1671                                                       ? LT : GT),
1672                                                      newx, x,
1673                                                      word_mode, 1, normalizep);
1674
1675                   /* Logical-ior the two poss. carry together.  */
1676                   carry_out = expand_binop (word_mode, ior_optab,
1677                                             carry_out, carry_tmp,
1678                                             carry_out, 0, next_methods);
1679                   if (carry_out == 0)
1680                     break;
1681                 }
1682               emit_move_insn (target_piece, newx);
1683             }
1684           else
1685             {
1686               if (x != target_piece)
1687                 emit_move_insn (target_piece, x);
1688             }
1689
1690           carry_in = carry_out;
1691         }
1692
1693       if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
1694         {
1695           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
1696               || ! rtx_equal_p (target, xtarget))
1697             {
1698               rtx_insn *temp = emit_move_insn (target, xtarget);
1699
1700               set_dst_reg_note (temp, REG_EQUAL,
1701                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
1702                                                 int_mode, copy_rtx (xop0),
1703                                                 copy_rtx (xop1)),
1704                                 target);
1705             }
1706           else
1707             target = xtarget;
1708
1709           return target;
1710         }
1711
1712       else
1713         delete_insns_since (last);
1714     }
1715
1716   /* Attempt to synthesize double word multiplies using a sequence of word
1717      mode multiplications.  We first attempt to generate a sequence using a
1718      more efficient unsigned widening multiply, and if that fails we then
1719      try using a signed widening multiply.  */
1720
1721   if (binoptab == smul_optab
1722       && is_int_mode (mode, &int_mode)
1723       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1724       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1725       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1726     {
1727       rtx product = NULL_RTX;
1728       if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
1729           != CODE_FOR_nothing)
1730         {
1731           product = expand_doubleword_mult (int_mode, op0, op1, target,
1732                                             true, methods);
1733           if (!product)
1734             delete_insns_since (last);
1735         }
1736
1737       if (product == NULL_RTX
1738           && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
1739               != CODE_FOR_nothing))
1740         {
1741           product = expand_doubleword_mult (int_mode, op0, op1, target,
1742                                             false, methods);
1743           if (!product)
1744             delete_insns_since (last);
1745         }
1746
1747       if (product != NULL_RTX)
1748         {
1749           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1750             {
1751               rtx_insn *move = emit_move_insn (target ? target : product,
1752                                                product);
1753               set_dst_reg_note (move,
1754                                 REG_EQUAL,
1755                                 gen_rtx_fmt_ee (MULT, int_mode,
1756                                                 copy_rtx (op0),
1757                                                 copy_rtx (op1)),
1758                                 target ? target : product);
1759             }
1760           return product;
1761         }
1762     }
1763
1764   /* It can't be open-coded in this mode.
1765      Use a library call if one is available and caller says that's ok.  */
1766
1767   libfunc = optab_libfunc (binoptab, mode);
1768   if (libfunc
1769       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1770     {
1771       rtx_insn *insns;
1772       rtx op1x = op1;
1773       machine_mode op1_mode = mode;
1774       rtx value;
1775
1776       start_sequence ();
1777
1778       if (shift_optab_p (binoptab))
1779         {
1780           op1_mode = targetm.libgcc_shift_count_mode ();
1781           /* Specify unsigned here,
1782              since negative shift counts are meaningless.  */
1783           op1x = convert_to_mode (op1_mode, op1, 1);
1784         }
1785
1786       if (GET_MODE (op0) != VOIDmode
1787           && GET_MODE (op0) != mode)
1788         op0 = convert_to_mode (mode, op0, unsignedp);
1789
1790       /* Pass 1 for NO_QUEUE so we don't lose any increments
1791          if the libcall is cse'd or moved.  */
1792       value = emit_library_call_value (libfunc,
1793                                        NULL_RTX, LCT_CONST, mode,
1794                                        op0, mode, op1x, op1_mode);
1795
1796       insns = get_insns ();
1797       end_sequence ();
1798
1799       bool trapv = trapv_binoptab_p (binoptab);
1800       target = gen_reg_rtx (mode);
1801       emit_libcall_block_1 (insns, target, value,
1802                             trapv ? NULL_RTX
1803                             : gen_rtx_fmt_ee (optab_to_code (binoptab),
1804                                               mode, op0, op1), trapv);
1805
1806       return target;
1807     }
1808
1809   delete_insns_since (last);
1810
1811   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1812
1813   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1814          || methods == OPTAB_MUST_WIDEN))
1815     {
1816       /* Caller says, don't even try.  */
1817       delete_insns_since (entry_last);
1818       return 0;
1819     }
1820
1821   /* Compute the value of METHODS to pass to recursive calls.
1822      Don't allow widening to be tried recursively.  */
1823
1824   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1825
1826   /* Look for a wider mode of the same class for which it appears we can do
1827      the operation.  */
1828
1829   if (CLASS_HAS_WIDER_MODES_P (mclass))
1830     {
1831       /* This code doesn't make sense for conversion optabs, since we
1832          wouldn't then want to extend the operands to be the same size
1833          as the result.  */
1834       gcc_assert (!convert_optab_p (binoptab));
1835       FOR_EACH_WIDER_MODE (wider_mode, mode)
1836         {
1837           if (optab_handler (binoptab, wider_mode)
1838               || (methods == OPTAB_LIB
1839                   && optab_libfunc (binoptab, wider_mode)))
1840             {
1841               rtx xop0 = op0, xop1 = op1;
1842               int no_extend = 0;
1843
1844               /* For certain integer operations, we need not actually extend
1845                  the narrow operands, as long as we will truncate
1846                  the results to the same narrowness.  */
1847
1848               if ((binoptab == ior_optab || binoptab == and_optab
1849                    || binoptab == xor_optab
1850                    || binoptab == add_optab || binoptab == sub_optab
1851                    || binoptab == smul_optab || binoptab == ashl_optab)
1852                   && mclass == MODE_INT)
1853                 no_extend = 1;
1854
1855               xop0 = widen_operand (xop0, wider_mode, mode,
1856                                     unsignedp, no_extend);
1857
1858               /* The second operand of a shift must always be extended.  */
1859               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1860                                     no_extend && binoptab != ashl_optab);
1861
1862               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1863                                    unsignedp, methods);
1864               if (temp)
1865                 {
1866                   if (mclass != MODE_INT
1867                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1868                     {
1869                       if (target == 0)
1870                         target = gen_reg_rtx (mode);
1871                       convert_move (target, temp, 0);
1872                       return target;
1873                     }
1874                   else
1875                     return gen_lowpart (mode, temp);
1876                 }
1877               else
1878                 delete_insns_since (last);
1879             }
1880         }
1881     }
1882
1883   delete_insns_since (entry_last);
1884   return 0;
1885 }
1886 \f
1887 /* Expand a binary operator which has both signed and unsigned forms.
1888    UOPTAB is the optab for unsigned operations, and SOPTAB is for
1889    signed operations.
1890
1891    If we widen unsigned operands, we may use a signed wider operation instead
1892    of an unsigned wider operation, since the result would be the same.  */
1893
1894 rtx
1895 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1896                    rtx op0, rtx op1, rtx target, int unsignedp,
1897                    enum optab_methods methods)
1898 {
1899   rtx temp;
1900   optab direct_optab = unsignedp ? uoptab : soptab;
1901   bool save_enable;
1902
1903   /* Do it without widening, if possible.  */
1904   temp = expand_binop (mode, direct_optab, op0, op1, target,
1905                        unsignedp, OPTAB_DIRECT);
1906   if (temp || methods == OPTAB_DIRECT)
1907     return temp;
1908
1909   /* Try widening to a signed int.  Disable any direct use of any
1910      signed insn in the current mode.  */
1911   save_enable = swap_optab_enable (soptab, mode, false);
1912
1913   temp = expand_binop (mode, soptab, op0, op1, target,
1914                        unsignedp, OPTAB_WIDEN);
1915
1916   /* For unsigned operands, try widening to an unsigned int.  */
1917   if (!temp && unsignedp)
1918     temp = expand_binop (mode, uoptab, op0, op1, target,
1919                          unsignedp, OPTAB_WIDEN);
1920   if (temp || methods == OPTAB_WIDEN)
1921     goto egress;
1922
1923   /* Use the right width libcall if that exists.  */
1924   temp = expand_binop (mode, direct_optab, op0, op1, target,
1925                        unsignedp, OPTAB_LIB);
1926   if (temp || methods == OPTAB_LIB)
1927     goto egress;
1928
1929   /* Must widen and use a libcall, use either signed or unsigned.  */
1930   temp = expand_binop (mode, soptab, op0, op1, target,
1931                        unsignedp, methods);
1932   if (!temp && unsignedp)
1933     temp = expand_binop (mode, uoptab, op0, op1, target,
1934                          unsignedp, methods);
1935
1936  egress:
1937   /* Undo the fiddling above.  */
1938   if (save_enable)
1939     swap_optab_enable (soptab, mode, true);
1940   return temp;
1941 }
1942 \f
1943 /* Generate code to perform an operation specified by UNOPPTAB
1944    on operand OP0, with two results to TARG0 and TARG1.
1945    We assume that the order of the operands for the instruction
1946    is TARG0, TARG1, OP0.
1947
1948    Either TARG0 or TARG1 may be zero, but what that means is that
1949    the result is not actually wanted.  We will generate it into
1950    a dummy pseudo-reg and discard it.  They may not both be zero.
1951
1952    Returns 1 if this operation can be performed; 0 if not.  */
1953
1954 int
1955 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1956                     int unsignedp)
1957 {
1958   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1959   enum mode_class mclass;
1960   machine_mode wider_mode;
1961   rtx_insn *entry_last = get_last_insn ();
1962   rtx_insn *last;
1963
1964   mclass = GET_MODE_CLASS (mode);
1965
1966   if (!targ0)
1967     targ0 = gen_reg_rtx (mode);
1968   if (!targ1)
1969     targ1 = gen_reg_rtx (mode);
1970
1971   /* Record where to go back to if we fail.  */
1972   last = get_last_insn ();
1973
1974   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1975     {
1976       struct expand_operand ops[3];
1977       enum insn_code icode = optab_handler (unoptab, mode);
1978
1979       create_fixed_operand (&ops[0], targ0);
1980       create_fixed_operand (&ops[1], targ1);
1981       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1982       if (maybe_expand_insn (icode, 3, ops))
1983         return 1;
1984     }
1985
1986   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1987
1988   if (CLASS_HAS_WIDER_MODES_P (mclass))
1989     {
1990       FOR_EACH_WIDER_MODE (wider_mode, mode)
1991         {
1992           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
1993             {
1994               rtx t0 = gen_reg_rtx (wider_mode);
1995               rtx t1 = gen_reg_rtx (wider_mode);
1996               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
1997
1998               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
1999                 {
2000                   convert_move (targ0, t0, unsignedp);
2001                   convert_move (targ1, t1, unsignedp);
2002                   return 1;
2003                 }
2004               else
2005                 delete_insns_since (last);
2006             }
2007         }
2008     }
2009
2010   delete_insns_since (entry_last);
2011   return 0;
2012 }
2013 \f
2014 /* Generate code to perform an operation specified by BINOPTAB
2015    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2016    We assume that the order of the operands for the instruction
2017    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2018    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2019
2020    Either TARG0 or TARG1 may be zero, but what that means is that
2021    the result is not actually wanted.  We will generate it into
2022    a dummy pseudo-reg and discard it.  They may not both be zero.
2023
2024    Returns 1 if this operation can be performed; 0 if not.  */
2025
2026 int
2027 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2028                      int unsignedp)
2029 {
2030   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2031   enum mode_class mclass;
2032   machine_mode wider_mode;
2033   rtx_insn *entry_last = get_last_insn ();
2034   rtx_insn *last;
2035
2036   mclass = GET_MODE_CLASS (mode);
2037
2038   if (!targ0)
2039     targ0 = gen_reg_rtx (mode);
2040   if (!targ1)
2041     targ1 = gen_reg_rtx (mode);
2042
2043   /* Record where to go back to if we fail.  */
2044   last = get_last_insn ();
2045
2046   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2047     {
2048       struct expand_operand ops[4];
2049       enum insn_code icode = optab_handler (binoptab, mode);
2050       machine_mode mode0 = insn_data[icode].operand[1].mode;
2051       machine_mode mode1 = insn_data[icode].operand[2].mode;
2052       rtx xop0 = op0, xop1 = op1;
2053
2054       /* If we are optimizing, force expensive constants into a register.  */
2055       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2056       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2057
2058       create_fixed_operand (&ops[0], targ0);
2059       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2060       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2061       create_fixed_operand (&ops[3], targ1);
2062       if (maybe_expand_insn (icode, 4, ops))
2063         return 1;
2064       delete_insns_since (last);
2065     }
2066
2067   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2068
2069   if (CLASS_HAS_WIDER_MODES_P (mclass))
2070     {
2071       FOR_EACH_WIDER_MODE (wider_mode, mode)
2072         {
2073           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2074             {
2075               rtx t0 = gen_reg_rtx (wider_mode);
2076               rtx t1 = gen_reg_rtx (wider_mode);
2077               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2078               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2079
2080               if (expand_twoval_binop (binoptab, cop0, cop1,
2081                                        t0, t1, unsignedp))
2082                 {
2083                   convert_move (targ0, t0, unsignedp);
2084                   convert_move (targ1, t1, unsignedp);
2085                   return 1;
2086                 }
2087               else
2088                 delete_insns_since (last);
2089             }
2090         }
2091     }
2092
2093   delete_insns_since (entry_last);
2094   return 0;
2095 }
2096
2097 /* Expand the two-valued library call indicated by BINOPTAB, but
2098    preserve only one of the values.  If TARG0 is non-NULL, the first
2099    value is placed into TARG0; otherwise the second value is placed
2100    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2101    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2102    This routine assumes that the value returned by the library call is
2103    as if the return value was of an integral mode twice as wide as the
2104    mode of OP0.  Returns 1 if the call was successful.  */
2105
2106 bool
2107 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2108                              rtx targ0, rtx targ1, enum rtx_code code)
2109 {
2110   machine_mode mode;
2111   machine_mode libval_mode;
2112   rtx libval;
2113   rtx_insn *insns;
2114   rtx libfunc;
2115
2116   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2117   gcc_assert (!targ0 != !targ1);
2118
2119   mode = GET_MODE (op0);
2120   libfunc = optab_libfunc (binoptab, mode);
2121   if (!libfunc)
2122     return false;
2123
2124   /* The value returned by the library function will have twice as
2125      many bits as the nominal MODE.  */
2126   libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2127   start_sequence ();
2128   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2129                                     libval_mode,
2130                                     op0, mode,
2131                                     op1, mode);
2132   /* Get the part of VAL containing the value that we want.  */
2133   libval = simplify_gen_subreg (mode, libval, libval_mode,
2134                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2135   insns = get_insns ();
2136   end_sequence ();
2137   /* Move the into the desired location.  */
2138   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2139                       gen_rtx_fmt_ee (code, mode, op0, op1));
2140
2141   return true;
2142 }
2143
2144 \f
2145 /* Wrapper around expand_unop which takes an rtx code to specify
2146    the operation to perform, not an optab pointer.  All other
2147    arguments are the same.  */
2148 rtx
2149 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2150                     rtx target, int unsignedp)
2151 {
2152   optab unop = code_to_optab (code);
2153   gcc_assert (unop);
2154
2155   return expand_unop (mode, unop, op0, target, unsignedp);
2156 }
2157
2158 /* Try calculating
2159         (clz:narrow x)
2160    as
2161         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2162
2163    A similar operation can be used for clrsb.  UNOPTAB says which operation
2164    we are trying to expand.  */
2165 static rtx
2166 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2167 {
2168   opt_scalar_int_mode wider_mode_iter;
2169   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2170     {
2171       scalar_int_mode wider_mode = wider_mode_iter.require ();
2172       if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2173         {
2174           rtx xop0, temp;
2175           rtx_insn *last;
2176
2177           last = get_last_insn ();
2178
2179           if (target == 0)
2180             target = gen_reg_rtx (mode);
2181           xop0 = widen_operand (op0, wider_mode, mode,
2182                                 unoptab != clrsb_optab, false);
2183           temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2184                               unoptab != clrsb_optab);
2185           if (temp != 0)
2186             temp = expand_binop
2187               (wider_mode, sub_optab, temp,
2188                gen_int_mode (GET_MODE_PRECISION (wider_mode)
2189                              - GET_MODE_PRECISION (mode),
2190                              wider_mode),
2191                target, true, OPTAB_DIRECT);
2192           if (temp == 0)
2193             delete_insns_since (last);
2194
2195           return temp;
2196         }
2197     }
2198   return 0;
2199 }
2200
2201 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2202    quantities, choosing which based on whether the high word is nonzero.  */
2203 static rtx
2204 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2205 {
2206   rtx xop0 = force_reg (mode, op0);
2207   rtx subhi = gen_highpart (word_mode, xop0);
2208   rtx sublo = gen_lowpart (word_mode, xop0);
2209   rtx_code_label *hi0_label = gen_label_rtx ();
2210   rtx_code_label *after_label = gen_label_rtx ();
2211   rtx_insn *seq;
2212   rtx temp, result;
2213
2214   /* If we were not given a target, use a word_mode register, not a
2215      'mode' register.  The result will fit, and nobody is expecting
2216      anything bigger (the return type of __builtin_clz* is int).  */
2217   if (!target)
2218     target = gen_reg_rtx (word_mode);
2219
2220   /* In any case, write to a word_mode scratch in both branches of the
2221      conditional, so we can ensure there is a single move insn setting
2222      'target' to tag a REG_EQUAL note on.  */
2223   result = gen_reg_rtx (word_mode);
2224
2225   start_sequence ();
2226
2227   /* If the high word is not equal to zero,
2228      then clz of the full value is clz of the high word.  */
2229   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2230                            word_mode, true, hi0_label);
2231
2232   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2233   if (!temp)
2234     goto fail;
2235
2236   if (temp != result)
2237     convert_move (result, temp, true);
2238
2239   emit_jump_insn (targetm.gen_jump (after_label));
2240   emit_barrier ();
2241
2242   /* Else clz of the full value is clz of the low word plus the number
2243      of bits in the high word.  */
2244   emit_label (hi0_label);
2245
2246   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2247   if (!temp)
2248     goto fail;
2249   temp = expand_binop (word_mode, add_optab, temp,
2250                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2251                        result, true, OPTAB_DIRECT);
2252   if (!temp)
2253     goto fail;
2254   if (temp != result)
2255     convert_move (result, temp, true);
2256
2257   emit_label (after_label);
2258   convert_move (target, result, true);
2259
2260   seq = get_insns ();
2261   end_sequence ();
2262
2263   add_equal_note (seq, target, CLZ, xop0, 0);
2264   emit_insn (seq);
2265   return target;
2266
2267  fail:
2268   end_sequence ();
2269   return 0;
2270 }
2271
2272 /* Try calculating popcount of a double-word quantity as two popcount's of
2273    word-sized quantities and summing up the results.  */
2274 static rtx
2275 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2276 {
2277   rtx t0, t1, t;
2278   rtx_insn *seq;
2279
2280   start_sequence ();
2281
2282   t0 = expand_unop_direct (word_mode, popcount_optab,
2283                            operand_subword_force (op0, 0, mode), NULL_RTX,
2284                            true);
2285   t1 = expand_unop_direct (word_mode, popcount_optab,
2286                            operand_subword_force (op0, 1, mode), NULL_RTX,
2287                            true);
2288   if (!t0 || !t1)
2289     {
2290       end_sequence ();
2291       return NULL_RTX;
2292     }
2293
2294   /* If we were not given a target, use a word_mode register, not a
2295      'mode' register.  The result will fit, and nobody is expecting
2296      anything bigger (the return type of __builtin_popcount* is int).  */
2297   if (!target)
2298     target = gen_reg_rtx (word_mode);
2299
2300   t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2301
2302   seq = get_insns ();
2303   end_sequence ();
2304
2305   add_equal_note (seq, t, POPCOUNT, op0, 0);
2306   emit_insn (seq);
2307   return t;
2308 }
2309
2310 /* Try calculating
2311         (parity:wide x)
2312    as
2313         (parity:narrow (low (x) ^ high (x))) */
2314 static rtx
2315 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2316 {
2317   rtx t = expand_binop (word_mode, xor_optab,
2318                         operand_subword_force (op0, 0, mode),
2319                         operand_subword_force (op0, 1, mode),
2320                         NULL_RTX, 0, OPTAB_DIRECT);
2321   return expand_unop (word_mode, parity_optab, t, target, true);
2322 }
2323
2324 /* Try calculating
2325         (bswap:narrow x)
2326    as
2327         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2328 static rtx
2329 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2330 {
2331   rtx x;
2332   rtx_insn *last;
2333   opt_scalar_int_mode wider_mode_iter;
2334
2335   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2336     if (optab_handler (bswap_optab, wider_mode_iter.require ())
2337         != CODE_FOR_nothing)
2338       break;
2339
2340   if (!wider_mode_iter.exists ())
2341     return NULL_RTX;
2342
2343   scalar_int_mode wider_mode = wider_mode_iter.require ();
2344   last = get_last_insn ();
2345
2346   x = widen_operand (op0, wider_mode, mode, true, true);
2347   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2348
2349   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2350               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2351   if (x != 0)
2352     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2353                       GET_MODE_BITSIZE (wider_mode)
2354                       - GET_MODE_BITSIZE (mode),
2355                       NULL_RTX, true);
2356
2357   if (x != 0)
2358     {
2359       if (target == 0)
2360         target = gen_reg_rtx (mode);
2361       emit_move_insn (target, gen_lowpart (mode, x));
2362     }
2363   else
2364     delete_insns_since (last);
2365
2366   return target;
2367 }
2368
2369 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2370
2371 static rtx
2372 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2373 {
2374   rtx t0, t1;
2375
2376   t1 = expand_unop (word_mode, bswap_optab,
2377                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2378   t0 = expand_unop (word_mode, bswap_optab,
2379                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2380
2381   if (target == 0 || !valid_multiword_target_p (target))
2382     target = gen_reg_rtx (mode);
2383   if (REG_P (target))
2384     emit_clobber (target);
2385   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2386   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2387
2388   return target;
2389 }
2390
2391 /* Try calculating (parity x) as (and (popcount x) 1), where
2392    popcount can also be done in a wider mode.  */
2393 static rtx
2394 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2395 {
2396   enum mode_class mclass = GET_MODE_CLASS (mode);
2397   opt_scalar_int_mode wider_mode_iter;
2398   FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2399     {
2400       scalar_int_mode wider_mode = wider_mode_iter.require ();
2401       if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2402         {
2403           rtx xop0, temp;
2404           rtx_insn *last;
2405
2406           last = get_last_insn ();
2407
2408           if (target == 0 || GET_MODE (target) != wider_mode)
2409             target = gen_reg_rtx (wider_mode);
2410
2411           xop0 = widen_operand (op0, wider_mode, mode, true, false);
2412           temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2413                               true);
2414           if (temp != 0)
2415             temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2416                                  target, true, OPTAB_DIRECT);
2417
2418           if (temp)
2419             {
2420               if (mclass != MODE_INT
2421                   || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2422                 return convert_to_mode (mode, temp, 0);
2423               else
2424                 return gen_lowpart (mode, temp);
2425             }
2426           else
2427             delete_insns_since (last);
2428         }
2429     }
2430   return 0;
2431 }
2432
2433 /* Try calculating ctz(x) as K - clz(x & -x) ,
2434    where K is GET_MODE_PRECISION(mode) - 1.
2435
2436    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2437    don't have to worry about what the hardware does in that case.  (If
2438    the clz instruction produces the usual value at 0, which is K, the
2439    result of this code sequence will be -1; expand_ffs, below, relies
2440    on this.  It might be nice to have it be K instead, for consistency
2441    with the (very few) processors that provide a ctz with a defined
2442    value, but that would take one more instruction, and it would be
2443    less convenient for expand_ffs anyway.  */
2444
2445 static rtx
2446 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2447 {
2448   rtx_insn *seq;
2449   rtx temp;
2450
2451   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2452     return 0;
2453
2454   start_sequence ();
2455
2456   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2457   if (temp)
2458     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2459                          true, OPTAB_DIRECT);
2460   if (temp)
2461     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2462   if (temp)
2463     temp = expand_binop (mode, sub_optab,
2464                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2465                          temp, target,
2466                          true, OPTAB_DIRECT);
2467   if (temp == 0)
2468     {
2469       end_sequence ();
2470       return 0;
2471     }
2472
2473   seq = get_insns ();
2474   end_sequence ();
2475
2476   add_equal_note (seq, temp, CTZ, op0, 0);
2477   emit_insn (seq);
2478   return temp;
2479 }
2480
2481
2482 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2483    else with the sequence used by expand_clz.
2484
2485    The ffs builtin promises to return zero for a zero value and ctz/clz
2486    may have an undefined value in that case.  If they do not give us a
2487    convenient value, we have to generate a test and branch.  */
2488 static rtx
2489 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2490 {
2491   HOST_WIDE_INT val = 0;
2492   bool defined_at_zero = false;
2493   rtx temp;
2494   rtx_insn *seq;
2495
2496   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2497     {
2498       start_sequence ();
2499
2500       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2501       if (!temp)
2502         goto fail;
2503
2504       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2505     }
2506   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2507     {
2508       start_sequence ();
2509       temp = expand_ctz (mode, op0, 0);
2510       if (!temp)
2511         goto fail;
2512
2513       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2514         {
2515           defined_at_zero = true;
2516           val = (GET_MODE_PRECISION (mode) - 1) - val;
2517         }
2518     }
2519   else
2520     return 0;
2521
2522   if (defined_at_zero && val == -1)
2523     /* No correction needed at zero.  */;
2524   else
2525     {
2526       /* We don't try to do anything clever with the situation found
2527          on some processors (eg Alpha) where ctz(0:mode) ==
2528          bitsize(mode).  If someone can think of a way to send N to -1
2529          and leave alone all values in the range 0..N-1 (where N is a
2530          power of two), cheaper than this test-and-branch, please add it.
2531
2532          The test-and-branch is done after the operation itself, in case
2533          the operation sets condition codes that can be recycled for this.
2534          (This is true on i386, for instance.)  */
2535
2536       rtx_code_label *nonzero_label = gen_label_rtx ();
2537       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2538                                mode, true, nonzero_label);
2539
2540       convert_move (temp, GEN_INT (-1), false);
2541       emit_label (nonzero_label);
2542     }
2543
2544   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2545      to produce a value in the range 0..bitsize.  */
2546   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2547                        target, false, OPTAB_DIRECT);
2548   if (!temp)
2549     goto fail;
2550
2551   seq = get_insns ();
2552   end_sequence ();
2553
2554   add_equal_note (seq, temp, FFS, op0, 0);
2555   emit_insn (seq);
2556   return temp;
2557
2558  fail:
2559   end_sequence ();
2560   return 0;
2561 }
2562
2563 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2564    conditions, VAL may already be a SUBREG against which we cannot generate
2565    a further SUBREG.  In this case, we expect forcing the value into a
2566    register will work around the situation.  */
2567
2568 static rtx
2569 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2570                            machine_mode imode)
2571 {
2572   rtx ret;
2573   ret = lowpart_subreg (omode, val, imode);
2574   if (ret == NULL)
2575     {
2576       val = force_reg (imode, val);
2577       ret = lowpart_subreg (omode, val, imode);
2578       gcc_assert (ret != NULL);
2579     }
2580   return ret;
2581 }
2582
2583 /* Expand a floating point absolute value or negation operation via a
2584    logical operation on the sign bit.  */
2585
2586 static rtx
2587 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2588                    rtx op0, rtx target)
2589 {
2590   const struct real_format *fmt;
2591   int bitpos, word, nwords, i;
2592   scalar_int_mode imode;
2593   rtx temp;
2594   rtx_insn *insns;
2595
2596   /* The format has to have a simple sign bit.  */
2597   fmt = REAL_MODE_FORMAT (mode);
2598   if (fmt == NULL)
2599     return NULL_RTX;
2600
2601   bitpos = fmt->signbit_rw;
2602   if (bitpos < 0)
2603     return NULL_RTX;
2604
2605   /* Don't create negative zeros if the format doesn't support them.  */
2606   if (code == NEG && !fmt->has_signed_zero)
2607     return NULL_RTX;
2608
2609   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2610     {
2611       if (!int_mode_for_mode (mode).exists (&imode))
2612         return NULL_RTX;
2613       word = 0;
2614       nwords = 1;
2615     }
2616   else
2617     {
2618       imode = word_mode;
2619
2620       if (FLOAT_WORDS_BIG_ENDIAN)
2621         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2622       else
2623         word = bitpos / BITS_PER_WORD;
2624       bitpos = bitpos % BITS_PER_WORD;
2625       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2626     }
2627
2628   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2629   if (code == ABS)
2630     mask = ~mask;
2631
2632   if (target == 0
2633       || target == op0
2634       || (nwords > 1 && !valid_multiword_target_p (target)))
2635     target = gen_reg_rtx (mode);
2636
2637   if (nwords > 1)
2638     {
2639       start_sequence ();
2640
2641       for (i = 0; i < nwords; ++i)
2642         {
2643           rtx targ_piece = operand_subword (target, i, 1, mode);
2644           rtx op0_piece = operand_subword_force (op0, i, mode);
2645
2646           if (i == word)
2647             {
2648               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2649                                    op0_piece,
2650                                    immed_wide_int_const (mask, imode),
2651                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2652               if (temp != targ_piece)
2653                 emit_move_insn (targ_piece, temp);
2654             }
2655           else
2656             emit_move_insn (targ_piece, op0_piece);
2657         }
2658
2659       insns = get_insns ();
2660       end_sequence ();
2661
2662       emit_insn (insns);
2663     }
2664   else
2665     {
2666       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2667                            gen_lowpart (imode, op0),
2668                            immed_wide_int_const (mask, imode),
2669                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2670       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2671
2672       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2673                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2674                         target);
2675     }
2676
2677   return target;
2678 }
2679
2680 /* As expand_unop, but will fail rather than attempt the operation in a
2681    different mode or with a libcall.  */
2682 static rtx
2683 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2684                     int unsignedp)
2685 {
2686   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2687     {
2688       struct expand_operand ops[2];
2689       enum insn_code icode = optab_handler (unoptab, mode);
2690       rtx_insn *last = get_last_insn ();
2691       rtx_insn *pat;
2692
2693       create_output_operand (&ops[0], target, mode);
2694       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2695       pat = maybe_gen_insn (icode, 2, ops);
2696       if (pat)
2697         {
2698           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2699               && ! add_equal_note (pat, ops[0].value,
2700                                    optab_to_code (unoptab),
2701                                    ops[1].value, NULL_RTX))
2702             {
2703               delete_insns_since (last);
2704               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2705             }
2706
2707           emit_insn (pat);
2708
2709           return ops[0].value;
2710         }
2711     }
2712   return 0;
2713 }
2714
2715 /* Generate code to perform an operation specified by UNOPTAB
2716    on operand OP0, with result having machine-mode MODE.
2717
2718    UNSIGNEDP is for the case where we have to widen the operands
2719    to perform the operation.  It says to use zero-extension.
2720
2721    If TARGET is nonzero, the value
2722    is generated there, if it is convenient to do so.
2723    In all cases an rtx is returned for the locus of the value;
2724    this may or may not be TARGET.  */
2725
2726 rtx
2727 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2728              int unsignedp)
2729 {
2730   enum mode_class mclass = GET_MODE_CLASS (mode);
2731   machine_mode wider_mode;
2732   scalar_int_mode int_mode;
2733   scalar_float_mode float_mode;
2734   rtx temp;
2735   rtx libfunc;
2736
2737   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2738   if (temp)
2739     return temp;
2740
2741   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
2742
2743   /* Widening (or narrowing) clz needs special treatment.  */
2744   if (unoptab == clz_optab)
2745     {
2746       if (is_a <scalar_int_mode> (mode, &int_mode))
2747         {
2748           temp = widen_leading (int_mode, op0, target, unoptab);
2749           if (temp)
2750             return temp;
2751
2752           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2753               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2754             {
2755               temp = expand_doubleword_clz (int_mode, op0, target);
2756               if (temp)
2757                 return temp;
2758             }
2759         }
2760
2761       goto try_libcall;
2762     }
2763
2764   if (unoptab == clrsb_optab)
2765     {
2766       if (is_a <scalar_int_mode> (mode, &int_mode))
2767         {
2768           temp = widen_leading (int_mode, op0, target, unoptab);
2769           if (temp)
2770             return temp;
2771         }
2772       goto try_libcall;
2773     }
2774
2775   if (unoptab == popcount_optab
2776       && is_a <scalar_int_mode> (mode, &int_mode)
2777       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2778       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2779       && optimize_insn_for_speed_p ())
2780     {
2781       temp = expand_doubleword_popcount (int_mode, op0, target);
2782       if (temp)
2783         return temp;
2784     }
2785
2786   if (unoptab == parity_optab
2787       && is_a <scalar_int_mode> (mode, &int_mode)
2788       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2789       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2790           || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2791       && optimize_insn_for_speed_p ())
2792     {
2793       temp = expand_doubleword_parity (int_mode, op0, target);
2794       if (temp)
2795         return temp;
2796     }
2797
2798   /* Widening (or narrowing) bswap needs special treatment.  */
2799   if (unoptab == bswap_optab)
2800     {
2801       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2802          or ROTATERT.  First try these directly; if this fails, then try the
2803          obvious pair of shifts with allowed widening, as this will probably
2804          be always more efficient than the other fallback methods.  */
2805       if (mode == HImode)
2806         {
2807           rtx_insn *last;
2808           rtx temp1, temp2;
2809
2810           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2811             {
2812               temp = expand_binop (mode, rotl_optab, op0,
2813                                    gen_int_shift_amount (mode, 8),
2814                                    target, unsignedp, OPTAB_DIRECT);
2815               if (temp)
2816                 return temp;
2817              }
2818
2819           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2820             {
2821               temp = expand_binop (mode, rotr_optab, op0,
2822                                    gen_int_shift_amount (mode, 8),
2823                                    target, unsignedp, OPTAB_DIRECT);
2824               if (temp)
2825                 return temp;
2826             }
2827
2828           last = get_last_insn ();
2829
2830           temp1 = expand_binop (mode, ashl_optab, op0,
2831                                 gen_int_shift_amount (mode, 8), NULL_RTX,
2832                                 unsignedp, OPTAB_WIDEN);
2833           temp2 = expand_binop (mode, lshr_optab, op0,
2834                                 gen_int_shift_amount (mode, 8), NULL_RTX,
2835                                 unsignedp, OPTAB_WIDEN);
2836           if (temp1 && temp2)
2837             {
2838               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2839                                    unsignedp, OPTAB_WIDEN);
2840               if (temp)
2841                 return temp;
2842             }
2843
2844           delete_insns_since (last);
2845         }
2846
2847       if (is_a <scalar_int_mode> (mode, &int_mode))
2848         {
2849           temp = widen_bswap (int_mode, op0, target);
2850           if (temp)
2851             return temp;
2852
2853           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2854               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2855             {
2856               temp = expand_doubleword_bswap (mode, op0, target);
2857               if (temp)
2858                 return temp;
2859             }
2860         }
2861
2862       goto try_libcall;
2863     }
2864
2865   if (CLASS_HAS_WIDER_MODES_P (mclass))
2866     FOR_EACH_WIDER_MODE (wider_mode, mode)
2867       {
2868         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2869           {
2870             rtx xop0 = op0;
2871             rtx_insn *last = get_last_insn ();
2872
2873             /* For certain operations, we need not actually extend
2874                the narrow operand, as long as we will truncate the
2875                results to the same narrowness.  */
2876
2877             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2878                                   (unoptab == neg_optab
2879                                    || unoptab == one_cmpl_optab)
2880                                   && mclass == MODE_INT);
2881
2882             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2883                                 unsignedp);
2884
2885             if (temp)
2886               {
2887                 if (mclass != MODE_INT
2888                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2889                   {
2890                     if (target == 0)
2891                       target = gen_reg_rtx (mode);
2892                     convert_move (target, temp, 0);
2893                     return target;
2894                   }
2895                 else
2896                   return gen_lowpart (mode, temp);
2897               }
2898             else
2899               delete_insns_since (last);
2900           }
2901       }
2902
2903   /* These can be done a word at a time.  */
2904   if (unoptab == one_cmpl_optab
2905       && is_int_mode (mode, &int_mode)
2906       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2907       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2908     {
2909       int i;
2910       rtx_insn *insns;
2911
2912       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2913         target = gen_reg_rtx (int_mode);
2914
2915       start_sequence ();
2916
2917       /* Do the actual arithmetic.  */
2918       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2919         {
2920           rtx target_piece = operand_subword (target, i, 1, int_mode);
2921           rtx x = expand_unop (word_mode, unoptab,
2922                                operand_subword_force (op0, i, int_mode),
2923                                target_piece, unsignedp);
2924
2925           if (target_piece != x)
2926             emit_move_insn (target_piece, x);
2927         }
2928
2929       insns = get_insns ();
2930       end_sequence ();
2931
2932       emit_insn (insns);
2933       return target;
2934     }
2935
2936   if (optab_to_code (unoptab) == NEG)
2937     {
2938       /* Try negating floating point values by flipping the sign bit.  */
2939       if (is_a <scalar_float_mode> (mode, &float_mode))
2940         {
2941           temp = expand_absneg_bit (NEG, float_mode, op0, target);
2942           if (temp)
2943             return temp;
2944         }
2945
2946       /* If there is no negation pattern, and we have no negative zero,
2947          try subtracting from zero.  */
2948       if (!HONOR_SIGNED_ZEROS (mode))
2949         {
2950           temp = expand_binop (mode, (unoptab == negv_optab
2951                                       ? subv_optab : sub_optab),
2952                                CONST0_RTX (mode), op0, target,
2953                                unsignedp, OPTAB_DIRECT);
2954           if (temp)
2955             return temp;
2956         }
2957     }
2958
2959   /* Try calculating parity (x) as popcount (x) % 2.  */
2960   if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2961     {
2962       temp = expand_parity (int_mode, op0, target);
2963       if (temp)
2964         return temp;
2965     }
2966
2967   /* Try implementing ffs (x) in terms of clz (x).  */
2968   if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2969     {
2970       temp = expand_ffs (int_mode, op0, target);
2971       if (temp)
2972         return temp;
2973     }
2974
2975   /* Try implementing ctz (x) in terms of clz (x).  */
2976   if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2977     {
2978       temp = expand_ctz (int_mode, op0, target);
2979       if (temp)
2980         return temp;
2981     }
2982
2983  try_libcall:
2984   /* Now try a library call in this mode.  */
2985   libfunc = optab_libfunc (unoptab, mode);
2986   if (libfunc)
2987     {
2988       rtx_insn *insns;
2989       rtx value;
2990       rtx eq_value;
2991       machine_mode outmode = mode;
2992
2993       /* All of these functions return small values.  Thus we choose to
2994          have them return something that isn't a double-word.  */
2995       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
2996           || unoptab == clrsb_optab || unoptab == popcount_optab
2997           || unoptab == parity_optab)
2998         outmode
2999           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3000                                           optab_libfunc (unoptab, mode)));
3001
3002       start_sequence ();
3003
3004       /* Pass 1 for NO_QUEUE so we don't lose any increments
3005          if the libcall is cse'd or moved.  */
3006       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3007                                        op0, mode);
3008       insns = get_insns ();
3009       end_sequence ();
3010
3011       target = gen_reg_rtx (outmode);
3012       bool trapv = trapv_unoptab_p (unoptab);
3013       if (trapv)
3014         eq_value = NULL_RTX;
3015       else
3016         {
3017           eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3018           if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3019             eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3020           else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3021             eq_value = simplify_gen_unary (ZERO_EXTEND,
3022                                            outmode, eq_value, mode);
3023         }
3024       emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3025
3026       return target;
3027     }
3028
3029   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3030
3031   if (CLASS_HAS_WIDER_MODES_P (mclass))
3032     {
3033       FOR_EACH_WIDER_MODE (wider_mode, mode)
3034         {
3035           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3036               || optab_libfunc (unoptab, wider_mode))
3037             {
3038               rtx xop0 = op0;
3039               rtx_insn *last = get_last_insn ();
3040
3041               /* For certain operations, we need not actually extend
3042                  the narrow operand, as long as we will truncate the
3043                  results to the same narrowness.  */
3044               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3045                                     (unoptab == neg_optab
3046                                      || unoptab == one_cmpl_optab
3047                                      || unoptab == bswap_optab)
3048                                     && mclass == MODE_INT);
3049
3050               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3051                                   unsignedp);
3052
3053               /* If we are generating clz using wider mode, adjust the
3054                  result.  Similarly for clrsb.  */
3055               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3056                   && temp != 0)
3057                 {
3058                   scalar_int_mode wider_int_mode
3059                     = as_a <scalar_int_mode> (wider_mode);
3060                   int_mode = as_a <scalar_int_mode> (mode);
3061                   temp = expand_binop
3062                     (wider_mode, sub_optab, temp,
3063                      gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3064                                    - GET_MODE_PRECISION (int_mode),
3065                                    wider_int_mode),
3066                      target, true, OPTAB_DIRECT);
3067                 }
3068
3069               /* Likewise for bswap.  */
3070               if (unoptab == bswap_optab && temp != 0)
3071                 {
3072                   scalar_int_mode wider_int_mode
3073                     = as_a <scalar_int_mode> (wider_mode);
3074                   int_mode = as_a <scalar_int_mode> (mode);
3075                   gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3076                               == GET_MODE_BITSIZE (wider_int_mode)
3077                               && GET_MODE_PRECISION (int_mode)
3078                                  == GET_MODE_BITSIZE (int_mode));
3079
3080                   temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3081                                        GET_MODE_BITSIZE (wider_int_mode)
3082                                        - GET_MODE_BITSIZE (int_mode),
3083                                        NULL_RTX, true);
3084                 }
3085
3086               if (temp)
3087                 {
3088                   if (mclass != MODE_INT)
3089                     {
3090                       if (target == 0)
3091                         target = gen_reg_rtx (mode);
3092                       convert_move (target, temp, 0);
3093                       return target;
3094                     }
3095                   else
3096                     return gen_lowpart (mode, temp);
3097                 }
3098               else
3099                 delete_insns_since (last);
3100             }
3101         }
3102     }
3103
3104   /* One final attempt at implementing negation via subtraction,
3105      this time allowing widening of the operand.  */
3106   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3107     {
3108       rtx temp;
3109       temp = expand_binop (mode,
3110                            unoptab == negv_optab ? subv_optab : sub_optab,
3111                            CONST0_RTX (mode), op0,
3112                            target, unsignedp, OPTAB_LIB_WIDEN);
3113       if (temp)
3114         return temp;
3115     }
3116
3117   return 0;
3118 }
3119 \f
3120 /* Emit code to compute the absolute value of OP0, with result to
3121    TARGET if convenient.  (TARGET may be 0.)  The return value says
3122    where the result actually is to be found.
3123
3124    MODE is the mode of the operand; the mode of the result is
3125    different but can be deduced from MODE.
3126
3127  */
3128
3129 rtx
3130 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3131                    int result_unsignedp)
3132 {
3133   rtx temp;
3134
3135   if (GET_MODE_CLASS (mode) != MODE_INT
3136       || ! flag_trapv)
3137     result_unsignedp = 1;
3138
3139   /* First try to do it with a special abs instruction.  */
3140   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3141                       op0, target, 0);
3142   if (temp != 0)
3143     return temp;
3144
3145   /* For floating point modes, try clearing the sign bit.  */
3146   scalar_float_mode float_mode;
3147   if (is_a <scalar_float_mode> (mode, &float_mode))
3148     {
3149       temp = expand_absneg_bit (ABS, float_mode, op0, target);
3150       if (temp)
3151         return temp;
3152     }
3153
3154   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3155   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3156       && !HONOR_SIGNED_ZEROS (mode))
3157     {
3158       rtx_insn *last = get_last_insn ();
3159
3160       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3161                           op0, NULL_RTX, 0);
3162       if (temp != 0)
3163         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3164                              OPTAB_WIDEN);
3165
3166       if (temp != 0)
3167         return temp;
3168
3169       delete_insns_since (last);
3170     }
3171
3172   /* If this machine has expensive jumps, we can do integer absolute
3173      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3174      where W is the width of MODE.  */
3175
3176   scalar_int_mode int_mode;
3177   if (is_int_mode (mode, &int_mode)
3178       && BRANCH_COST (optimize_insn_for_speed_p (),
3179                       false) >= 2)
3180     {
3181       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3182                                    GET_MODE_PRECISION (int_mode) - 1,
3183                                    NULL_RTX, 0);
3184
3185       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3186                            OPTAB_LIB_WIDEN);
3187       if (temp != 0)
3188         temp = expand_binop (int_mode,
3189                              result_unsignedp ? sub_optab : subv_optab,
3190                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3191
3192       if (temp != 0)
3193         return temp;
3194     }
3195
3196   return NULL_RTX;
3197 }
3198
3199 rtx
3200 expand_abs (machine_mode mode, rtx op0, rtx target,
3201             int result_unsignedp, int safe)
3202 {
3203   rtx temp;
3204   rtx_code_label *op1;
3205
3206   if (GET_MODE_CLASS (mode) != MODE_INT
3207       || ! flag_trapv)
3208     result_unsignedp = 1;
3209
3210   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3211   if (temp != 0)
3212     return temp;
3213
3214   /* If that does not win, use conditional jump and negate.  */
3215
3216   /* It is safe to use the target if it is the same
3217      as the source if this is also a pseudo register */
3218   if (op0 == target && REG_P (op0)
3219       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3220     safe = 1;
3221
3222   op1 = gen_label_rtx ();
3223   if (target == 0 || ! safe
3224       || GET_MODE (target) != mode
3225       || (MEM_P (target) && MEM_VOLATILE_P (target))
3226       || (REG_P (target)
3227           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3228     target = gen_reg_rtx (mode);
3229
3230   emit_move_insn (target, op0);
3231   NO_DEFER_POP;
3232
3233   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3234                            NULL_RTX, NULL, op1,
3235                            profile_probability::uninitialized ());
3236
3237   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3238                      target, target, 0);
3239   if (op0 != target)
3240     emit_move_insn (target, op0);
3241   emit_label (op1);
3242   OK_DEFER_POP;
3243   return target;
3244 }
3245
3246 /* Emit code to compute the one's complement absolute value of OP0
3247    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3248    (TARGET may be NULL_RTX.)  The return value says where the result
3249    actually is to be found.
3250
3251    MODE is the mode of the operand; the mode of the result is
3252    different but can be deduced from MODE.  */
3253
3254 rtx
3255 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3256 {
3257   rtx temp;
3258
3259   /* Not applicable for floating point modes.  */
3260   if (FLOAT_MODE_P (mode))
3261     return NULL_RTX;
3262
3263   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3264   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3265     {
3266       rtx_insn *last = get_last_insn ();
3267
3268       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3269       if (temp != 0)
3270         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3271                              OPTAB_WIDEN);
3272
3273       if (temp != 0)
3274         return temp;
3275
3276       delete_insns_since (last);
3277     }
3278
3279   /* If this machine has expensive jumps, we can do one's complement
3280      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3281
3282   scalar_int_mode int_mode;
3283   if (is_int_mode (mode, &int_mode)
3284       && BRANCH_COST (optimize_insn_for_speed_p (),
3285                      false) >= 2)
3286     {
3287       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3288                                    GET_MODE_PRECISION (int_mode) - 1,
3289                                    NULL_RTX, 0);
3290
3291       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3292                            OPTAB_LIB_WIDEN);
3293
3294       if (temp != 0)
3295         return temp;
3296     }
3297
3298   return NULL_RTX;
3299 }
3300
3301 /* A subroutine of expand_copysign, perform the copysign operation using the
3302    abs and neg primitives advertised to exist on the target.  The assumption
3303    is that we have a split register file, and leaving op0 in fp registers,
3304    and not playing with subregs so much, will help the register allocator.  */
3305
3306 static rtx
3307 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3308                         int bitpos, bool op0_is_abs)
3309 {
3310   scalar_int_mode imode;
3311   enum insn_code icode;
3312   rtx sign;
3313   rtx_code_label *label;
3314
3315   if (target == op1)
3316     target = NULL_RTX;
3317
3318   /* Check if the back end provides an insn that handles signbit for the
3319      argument's mode. */
3320   icode = optab_handler (signbit_optab, mode);
3321   if (icode != CODE_FOR_nothing)
3322     {
3323       imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3324       sign = gen_reg_rtx (imode);
3325       emit_unop_insn (icode, sign, op1, UNKNOWN);
3326     }
3327   else
3328     {
3329       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3330         {
3331           if (!int_mode_for_mode (mode).exists (&imode))
3332             return NULL_RTX;
3333           op1 = gen_lowpart (imode, op1);
3334         }
3335       else
3336         {
3337           int word;
3338
3339           imode = word_mode;
3340           if (FLOAT_WORDS_BIG_ENDIAN)
3341             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3342           else
3343             word = bitpos / BITS_PER_WORD;
3344           bitpos = bitpos % BITS_PER_WORD;
3345           op1 = operand_subword_force (op1, word, mode);
3346         }
3347
3348       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3349       sign = expand_binop (imode, and_optab, op1,
3350                            immed_wide_int_const (mask, imode),
3351                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3352     }
3353
3354   if (!op0_is_abs)
3355     {
3356       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3357       if (op0 == NULL)
3358         return NULL_RTX;
3359       target = op0;
3360     }
3361   else
3362     {
3363       if (target == NULL_RTX)
3364         target = copy_to_reg (op0);
3365       else
3366         emit_move_insn (target, op0);
3367     }
3368
3369   label = gen_label_rtx ();
3370   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3371
3372   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3373     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3374   else
3375     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3376   if (op0 != target)
3377     emit_move_insn (target, op0);
3378
3379   emit_label (label);
3380
3381   return target;
3382 }
3383
3384
3385 /* A subroutine of expand_copysign, perform the entire copysign operation
3386    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3387    is true if op0 is known to have its sign bit clear.  */
3388
3389 static rtx
3390 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3391                      int bitpos, bool op0_is_abs)
3392 {
3393   scalar_int_mode imode;
3394   int word, nwords, i;
3395   rtx temp;
3396   rtx_insn *insns;
3397
3398   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3399     {
3400       if (!int_mode_for_mode (mode).exists (&imode))
3401         return NULL_RTX;
3402       word = 0;
3403       nwords = 1;
3404     }
3405   else
3406     {
3407       imode = word_mode;
3408
3409       if (FLOAT_WORDS_BIG_ENDIAN)
3410         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3411       else
3412         word = bitpos / BITS_PER_WORD;
3413       bitpos = bitpos % BITS_PER_WORD;
3414       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3415     }
3416
3417   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3418
3419   if (target == 0
3420       || target == op0
3421       || target == op1
3422       || (nwords > 1 && !valid_multiword_target_p (target)))
3423     target = gen_reg_rtx (mode);
3424
3425   if (nwords > 1)
3426     {
3427       start_sequence ();
3428
3429       for (i = 0; i < nwords; ++i)
3430         {
3431           rtx targ_piece = operand_subword (target, i, 1, mode);
3432           rtx op0_piece = operand_subword_force (op0, i, mode);
3433
3434           if (i == word)
3435             {
3436               if (!op0_is_abs)
3437                 op0_piece
3438                   = expand_binop (imode, and_optab, op0_piece,
3439                                   immed_wide_int_const (~mask, imode),
3440                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3441               op1 = expand_binop (imode, and_optab,
3442                                   operand_subword_force (op1, i, mode),
3443                                   immed_wide_int_const (mask, imode),
3444                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3445
3446               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3447                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3448               if (temp != targ_piece)
3449                 emit_move_insn (targ_piece, temp);
3450             }
3451           else
3452             emit_move_insn (targ_piece, op0_piece);
3453         }
3454
3455       insns = get_insns ();
3456       end_sequence ();
3457
3458       emit_insn (insns);
3459     }
3460   else
3461     {
3462       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3463                           immed_wide_int_const (mask, imode),
3464                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3465
3466       op0 = gen_lowpart (imode, op0);
3467       if (!op0_is_abs)
3468         op0 = expand_binop (imode, and_optab, op0,
3469                             immed_wide_int_const (~mask, imode),
3470                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3471
3472       temp = expand_binop (imode, ior_optab, op0, op1,
3473                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3474       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3475     }
3476
3477   return target;
3478 }
3479
3480 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3481    scalar floating point mode.  Return NULL if we do not know how to
3482    expand the operation inline.  */
3483
3484 rtx
3485 expand_copysign (rtx op0, rtx op1, rtx target)
3486 {
3487   scalar_float_mode mode;
3488   const struct real_format *fmt;
3489   bool op0_is_abs;
3490   rtx temp;
3491
3492   mode = as_a <scalar_float_mode> (GET_MODE (op0));
3493   gcc_assert (GET_MODE (op1) == mode);
3494
3495   /* First try to do it with a special instruction.  */
3496   temp = expand_binop (mode, copysign_optab, op0, op1,
3497                        target, 0, OPTAB_DIRECT);
3498   if (temp)
3499     return temp;
3500
3501   fmt = REAL_MODE_FORMAT (mode);
3502   if (fmt == NULL || !fmt->has_signed_zero)
3503     return NULL_RTX;
3504
3505   op0_is_abs = false;
3506   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3507     {
3508       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3509         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3510       op0_is_abs = true;
3511     }
3512
3513   if (fmt->signbit_ro >= 0
3514       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3515           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3516               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3517     {
3518       temp = expand_copysign_absneg (mode, op0, op1, target,
3519                                      fmt->signbit_ro, op0_is_abs);
3520       if (temp)
3521         return temp;
3522     }
3523
3524   if (fmt->signbit_rw < 0)
3525     return NULL_RTX;
3526   return expand_copysign_bit (mode, op0, op1, target,
3527                               fmt->signbit_rw, op0_is_abs);
3528 }
3529 \f
3530 /* Generate an instruction whose insn-code is INSN_CODE,
3531    with two operands: an output TARGET and an input OP0.
3532    TARGET *must* be nonzero, and the output is always stored there.
3533    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3534    the value that is stored into TARGET.
3535
3536    Return false if expansion failed.  */
3537
3538 bool
3539 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3540                       enum rtx_code code)
3541 {
3542   struct expand_operand ops[2];
3543   rtx_insn *pat;
3544
3545   create_output_operand (&ops[0], target, GET_MODE (target));
3546   create_input_operand (&ops[1], op0, GET_MODE (op0));
3547   pat = maybe_gen_insn (icode, 2, ops);
3548   if (!pat)
3549     return false;
3550
3551   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3552       && code != UNKNOWN)
3553     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3554
3555   emit_insn (pat);
3556
3557   if (ops[0].value != target)
3558     emit_move_insn (target, ops[0].value);
3559   return true;
3560 }
3561 /* Generate an instruction whose insn-code is INSN_CODE,
3562    with two operands: an output TARGET and an input OP0.
3563    TARGET *must* be nonzero, and the output is always stored there.
3564    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3565    the value that is stored into TARGET.  */
3566
3567 void
3568 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3569 {
3570   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3571   gcc_assert (ok);
3572 }
3573 \f
3574 struct no_conflict_data
3575 {
3576   rtx target;
3577   rtx_insn *first, *insn;
3578   bool must_stay;
3579 };
3580
3581 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3582    the currently examined clobber / store has to stay in the list of
3583    insns that constitute the actual libcall block.  */
3584 static void
3585 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3586 {
3587   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3588
3589   /* If this inns directly contributes to setting the target, it must stay.  */
3590   if (reg_overlap_mentioned_p (p->target, dest))
3591     p->must_stay = true;
3592   /* If we haven't committed to keeping any other insns in the list yet,
3593      there is nothing more to check.  */
3594   else if (p->insn == p->first)
3595     return;
3596   /* If this insn sets / clobbers a register that feeds one of the insns
3597      already in the list, this insn has to stay too.  */
3598   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3599            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3600            || reg_used_between_p (dest, p->first, p->insn)
3601            /* Likewise if this insn depends on a register set by a previous
3602               insn in the list, or if it sets a result (presumably a hard
3603               register) that is set or clobbered by a previous insn.
3604               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3605               SET_DEST perform the former check on the address, and the latter
3606               check on the MEM.  */
3607            || (GET_CODE (set) == SET
3608                && (modified_in_p (SET_SRC (set), p->first)
3609                    || modified_in_p (SET_DEST (set), p->first)
3610                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3611                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3612     p->must_stay = true;
3613 }
3614
3615 \f
3616 /* Emit code to make a call to a constant function or a library call.
3617
3618    INSNS is a list containing all insns emitted in the call.
3619    These insns leave the result in RESULT.  Our block is to copy RESULT
3620    to TARGET, which is logically equivalent to EQUIV.
3621
3622    We first emit any insns that set a pseudo on the assumption that these are
3623    loading constants into registers; doing so allows them to be safely cse'ed
3624    between blocks.  Then we emit all the other insns in the block, followed by
3625    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3626    note with an operand of EQUIV.  */
3627
3628 static void
3629 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3630                       bool equiv_may_trap)
3631 {
3632   rtx final_dest = target;
3633   rtx_insn *next, *last, *insn;
3634
3635   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3636      into a MEM later.  Protect the libcall block from this change.  */
3637   if (! REG_P (target) || REG_USERVAR_P (target))
3638     target = gen_reg_rtx (GET_MODE (target));
3639
3640   /* If we're using non-call exceptions, a libcall corresponding to an
3641      operation that may trap may also trap.  */
3642   /* ??? See the comment in front of make_reg_eh_region_note.  */
3643   if (cfun->can_throw_non_call_exceptions
3644       && (equiv_may_trap || may_trap_p (equiv)))
3645     {
3646       for (insn = insns; insn; insn = NEXT_INSN (insn))
3647         if (CALL_P (insn))
3648           {
3649             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3650             if (note)
3651               {
3652                 int lp_nr = INTVAL (XEXP (note, 0));
3653                 if (lp_nr == 0 || lp_nr == INT_MIN)
3654                   remove_note (insn, note);
3655               }
3656           }
3657     }
3658   else
3659     {
3660       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3661          reg note to indicate that this call cannot throw or execute a nonlocal
3662          goto (unless there is already a REG_EH_REGION note, in which case
3663          we update it).  */
3664       for (insn = insns; insn; insn = NEXT_INSN (insn))
3665         if (CALL_P (insn))
3666           make_reg_eh_region_note_nothrow_nononlocal (insn);
3667     }
3668
3669   /* First emit all insns that set pseudos.  Remove them from the list as
3670      we go.  Avoid insns that set pseudos which were referenced in previous
3671      insns.  These can be generated by move_by_pieces, for example,
3672      to update an address.  Similarly, avoid insns that reference things
3673      set in previous insns.  */
3674
3675   for (insn = insns; insn; insn = next)
3676     {
3677       rtx set = single_set (insn);
3678
3679       next = NEXT_INSN (insn);
3680
3681       if (set != 0 && REG_P (SET_DEST (set))
3682           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3683         {
3684           struct no_conflict_data data;
3685
3686           data.target = const0_rtx;
3687           data.first = insns;
3688           data.insn = insn;
3689           data.must_stay = 0;
3690           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3691           if (! data.must_stay)
3692             {
3693               if (PREV_INSN (insn))
3694                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3695               else
3696                 insns = next;
3697
3698               if (next)
3699                 SET_PREV_INSN (next) = PREV_INSN (insn);
3700
3701               add_insn (insn);
3702             }
3703         }
3704
3705       /* Some ports use a loop to copy large arguments onto the stack.
3706          Don't move anything outside such a loop.  */
3707       if (LABEL_P (insn))
3708         break;
3709     }
3710
3711   /* Write the remaining insns followed by the final copy.  */
3712   for (insn = insns; insn; insn = next)
3713     {
3714       next = NEXT_INSN (insn);
3715
3716       add_insn (insn);
3717     }
3718
3719   last = emit_move_insn (target, result);
3720   if (equiv)
3721     set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3722
3723   if (final_dest != target)
3724     emit_move_insn (final_dest, target);
3725 }
3726
3727 void
3728 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3729 {
3730   emit_libcall_block_1 (insns, target, result, equiv, false);
3731 }
3732 \f
3733 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3734    PURPOSE describes how this comparison will be used.  CODE is the rtx
3735    comparison code we will be using.
3736
3737    ??? Actually, CODE is slightly weaker than that.  A target is still
3738    required to implement all of the normal bcc operations, but not
3739    required to implement all (or any) of the unordered bcc operations.  */
3740
3741 int
3742 can_compare_p (enum rtx_code code, machine_mode mode,
3743                enum can_compare_purpose purpose)
3744 {
3745   rtx test;
3746   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3747   do
3748     {
3749       enum insn_code icode;
3750
3751       if (purpose == ccp_jump
3752           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3753           && insn_operand_matches (icode, 0, test))
3754         return 1;
3755       if (purpose == ccp_store_flag
3756           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3757           && insn_operand_matches (icode, 1, test))
3758         return 1;
3759       if (purpose == ccp_cmov
3760           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3761         return 1;
3762
3763       mode = GET_MODE_WIDER_MODE (mode).else_void ();
3764       PUT_MODE (test, mode);
3765     }
3766   while (mode != VOIDmode);
3767
3768   return 0;
3769 }
3770
3771 /* This function is called when we are going to emit a compare instruction that
3772    compares the values found in X and Y, using the rtl operator COMPARISON.
3773
3774    If they have mode BLKmode, then SIZE specifies the size of both operands.
3775
3776    UNSIGNEDP nonzero says that the operands are unsigned;
3777    this matters if they need to be widened (as given by METHODS).
3778
3779    *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3780    if we failed to produce one.
3781
3782    *PMODE is the mode of the inputs (in case they are const_int).
3783
3784    This function performs all the setup necessary so that the caller only has
3785    to emit a single comparison insn.  This setup can involve doing a BLKmode
3786    comparison or emitting a library call to perform the comparison if no insn
3787    is available to handle it.
3788    The values which are passed in through pointers can be modified; the caller
3789    should perform the comparison on the modified values.  Constant
3790    comparisons must have already been folded.  */
3791
3792 static void
3793 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3794                   int unsignedp, enum optab_methods methods,
3795                   rtx *ptest, machine_mode *pmode)
3796 {
3797   machine_mode mode = *pmode;
3798   rtx libfunc, test;
3799   machine_mode cmp_mode;
3800   enum mode_class mclass;
3801
3802   /* The other methods are not needed.  */
3803   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3804               || methods == OPTAB_LIB_WIDEN);
3805
3806   /* If we are optimizing, force expensive constants into a register.  */
3807   if (CONSTANT_P (x) && optimize
3808       && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3809           > COSTS_N_INSNS (1)))
3810     x = force_reg (mode, x);
3811
3812   if (CONSTANT_P (y) && optimize
3813       && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3814           > COSTS_N_INSNS (1)))
3815     y = force_reg (mode, y);
3816
3817 #if HAVE_cc0
3818   /* Make sure if we have a canonical comparison.  The RTL
3819      documentation states that canonical comparisons are required only
3820      for targets which have cc0.  */
3821   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3822 #endif
3823
3824   /* Don't let both operands fail to indicate the mode.  */
3825   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3826     x = force_reg (mode, x);
3827   if (mode == VOIDmode)
3828     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3829
3830   /* Handle all BLKmode compares.  */
3831
3832   if (mode == BLKmode)
3833     {
3834       machine_mode result_mode;
3835       enum insn_code cmp_code;
3836       rtx result;
3837       rtx opalign
3838         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3839
3840       gcc_assert (size);
3841
3842       /* Try to use a memory block compare insn - either cmpstr
3843          or cmpmem will do.  */
3844       opt_scalar_int_mode cmp_mode_iter;
3845       FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3846         {
3847           scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3848           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3849           if (cmp_code == CODE_FOR_nothing)
3850             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3851           if (cmp_code == CODE_FOR_nothing)
3852             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3853           if (cmp_code == CODE_FOR_nothing)
3854             continue;
3855
3856           /* Must make sure the size fits the insn's mode.  */
3857           if (CONST_INT_P (size)
3858               ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3859               : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3860                  > GET_MODE_BITSIZE (cmp_mode)))
3861             continue;
3862
3863           result_mode = insn_data[cmp_code].operand[0].mode;
3864           result = gen_reg_rtx (result_mode);
3865           size = convert_to_mode (cmp_mode, size, 1);
3866           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3867
3868           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3869           *pmode = result_mode;
3870           return;
3871         }
3872
3873       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3874         goto fail;
3875
3876       /* Otherwise call a library function.  */
3877       result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3878
3879       x = result;
3880       y = const0_rtx;
3881       mode = TYPE_MODE (integer_type_node);
3882       methods = OPTAB_LIB_WIDEN;
3883       unsignedp = false;
3884     }
3885
3886   /* Don't allow operands to the compare to trap, as that can put the
3887      compare and branch in different basic blocks.  */
3888   if (cfun->can_throw_non_call_exceptions)
3889     {
3890       if (may_trap_p (x))
3891         x = copy_to_reg (x);
3892       if (may_trap_p (y))
3893         y = copy_to_reg (y);
3894     }
3895
3896   if (GET_MODE_CLASS (mode) == MODE_CC)
3897     {
3898       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3899       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3900       gcc_assert (icode != CODE_FOR_nothing
3901                   && insn_operand_matches (icode, 0, test));
3902       *ptest = test;
3903       return;
3904     }
3905
3906   mclass = GET_MODE_CLASS (mode);
3907   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3908   FOR_EACH_MODE_FROM (cmp_mode, mode)
3909     {
3910       enum insn_code icode;
3911       icode = optab_handler (cbranch_optab, cmp_mode);
3912       if (icode != CODE_FOR_nothing
3913           && insn_operand_matches (icode, 0, test))
3914         {
3915           rtx_insn *last = get_last_insn ();
3916           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3917           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3918           if (op0 && op1
3919               && insn_operand_matches (icode, 1, op0)
3920               && insn_operand_matches (icode, 2, op1))
3921             {
3922               XEXP (test, 0) = op0;
3923               XEXP (test, 1) = op1;
3924               *ptest = test;
3925               *pmode = cmp_mode;
3926               return;
3927             }
3928           delete_insns_since (last);
3929         }
3930
3931       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3932         break;
3933     }
3934
3935   if (methods != OPTAB_LIB_WIDEN)
3936     goto fail;
3937
3938   if (!SCALAR_FLOAT_MODE_P (mode))
3939     {
3940       rtx result;
3941       machine_mode ret_mode;
3942
3943       /* Handle a libcall just for the mode we are using.  */
3944       libfunc = optab_libfunc (cmp_optab, mode);
3945       gcc_assert (libfunc);
3946
3947       /* If we want unsigned, and this mode has a distinct unsigned
3948          comparison routine, use that.  */
3949       if (unsignedp)
3950         {
3951           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3952           if (ulibfunc)
3953             libfunc = ulibfunc;
3954         }
3955
3956       ret_mode = targetm.libgcc_cmp_return_mode ();
3957       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3958                                         ret_mode, x, mode, y, mode);
3959
3960       /* There are two kinds of comparison routines. Biased routines
3961          return 0/1/2, and unbiased routines return -1/0/1. Other parts
3962          of gcc expect that the comparison operation is equivalent
3963          to the modified comparison. For signed comparisons compare the
3964          result against 1 in the biased case, and zero in the unbiased
3965          case. For unsigned comparisons always compare against 1 after
3966          biasing the unbiased result by adding 1. This gives us a way to
3967          represent LTU.
3968          The comparisons in the fixed-point helper library are always
3969          biased.  */
3970       x = result;
3971       y = const1_rtx;
3972
3973       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3974         {
3975           if (unsignedp)
3976             x = plus_constant (ret_mode, result, 1);
3977           else
3978             y = const0_rtx;
3979         }
3980
3981       *pmode = ret_mode;
3982       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
3983                         ptest, pmode);
3984     }
3985   else
3986     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3987
3988   return;
3989
3990  fail:
3991   *ptest = NULL_RTX;
3992 }
3993
3994 /* Before emitting an insn with code ICODE, make sure that X, which is going
3995    to be used for operand OPNUM of the insn, is converted from mode MODE to
3996    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
3997    that it is accepted by the operand predicate.  Return the new value.  */
3998
3999 rtx
4000 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4001                  machine_mode wider_mode, int unsignedp)
4002 {
4003   if (mode != wider_mode)
4004     x = convert_modes (wider_mode, mode, x, unsignedp);
4005
4006   if (!insn_operand_matches (icode, opnum, x))
4007     {
4008       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4009       if (reload_completed)
4010         return NULL_RTX;
4011       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4012         return NULL_RTX;
4013       x = copy_to_mode_reg (op_mode, x);
4014     }
4015
4016   return x;
4017 }
4018
4019 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4020    we can do the branch.  */
4021
4022 static void
4023 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4024                           profile_probability prob)
4025 {
4026   machine_mode optab_mode;
4027   enum mode_class mclass;
4028   enum insn_code icode;
4029   rtx_insn *insn;
4030
4031   mclass = GET_MODE_CLASS (mode);
4032   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4033   icode = optab_handler (cbranch_optab, optab_mode);
4034
4035   gcc_assert (icode != CODE_FOR_nothing);
4036   gcc_assert (insn_operand_matches (icode, 0, test));
4037   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4038                                           XEXP (test, 1), label));
4039   if (prob.initialized_p ()
4040       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4041       && insn
4042       && JUMP_P (insn)
4043       && any_condjump_p (insn)
4044       && !find_reg_note (insn, REG_BR_PROB, 0))
4045     add_reg_br_prob_note (insn, prob);
4046 }
4047
4048 /* Generate code to compare X with Y so that the condition codes are
4049    set and to jump to LABEL if the condition is true.  If X is a
4050    constant and Y is not a constant, then the comparison is swapped to
4051    ensure that the comparison RTL has the canonical form.
4052
4053    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4054    need to be widened.  UNSIGNEDP is also used to select the proper
4055    branch condition code.
4056
4057    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4058
4059    MODE is the mode of the inputs (in case they are const_int).
4060
4061    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4062    It will be potentially converted into an unsigned variant based on
4063    UNSIGNEDP to select a proper jump instruction.
4064
4065    PROB is the probability of jumping to LABEL.  */
4066
4067 void
4068 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4069                          machine_mode mode, int unsignedp, rtx label,
4070                          profile_probability prob)
4071 {
4072   rtx op0 = x, op1 = y;
4073   rtx test;
4074
4075   /* Swap operands and condition to ensure canonical RTL.  */
4076   if (swap_commutative_operands_p (x, y)
4077       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4078     {
4079       op0 = y, op1 = x;
4080       comparison = swap_condition (comparison);
4081     }
4082
4083   /* If OP0 is still a constant, then both X and Y must be constants
4084      or the opposite comparison is not supported.  Force X into a register
4085      to create canonical RTL.  */
4086   if (CONSTANT_P (op0))
4087     op0 = force_reg (mode, op0);
4088
4089   if (unsignedp)
4090     comparison = unsigned_condition (comparison);
4091
4092   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4093                     &test, &mode);
4094   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4095 }
4096
4097 \f
4098 /* Emit a library call comparison between floating point X and Y.
4099    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4100
4101 static void
4102 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4103                        rtx *ptest, machine_mode *pmode)
4104 {
4105   enum rtx_code swapped = swap_condition (comparison);
4106   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4107   machine_mode orig_mode = GET_MODE (x);
4108   machine_mode mode;
4109   rtx true_rtx, false_rtx;
4110   rtx value, target, equiv;
4111   rtx_insn *insns;
4112   rtx libfunc = 0;
4113   bool reversed_p = false;
4114   scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4115
4116   FOR_EACH_MODE_FROM (mode, orig_mode)
4117     {
4118       if (code_to_optab (comparison)
4119           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4120         break;
4121
4122       if (code_to_optab (swapped)
4123           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4124         {
4125           std::swap (x, y);
4126           comparison = swapped;
4127           break;
4128         }
4129
4130       if (code_to_optab (reversed)
4131           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4132         {
4133           comparison = reversed;
4134           reversed_p = true;
4135           break;
4136         }
4137     }
4138
4139   gcc_assert (mode != VOIDmode);
4140
4141   if (mode != orig_mode)
4142     {
4143       x = convert_to_mode (mode, x, 0);
4144       y = convert_to_mode (mode, y, 0);
4145     }
4146
4147   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4148      the RTL.  The allows the RTL optimizers to delete the libcall if the
4149      condition can be determined at compile-time.  */
4150   if (comparison == UNORDERED
4151       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4152     {
4153       true_rtx = const_true_rtx;
4154       false_rtx = const0_rtx;
4155     }
4156   else
4157     {
4158       switch (comparison)
4159         {
4160         case EQ:
4161           true_rtx = const0_rtx;
4162           false_rtx = const_true_rtx;
4163           break;
4164
4165         case NE:
4166           true_rtx = const_true_rtx;
4167           false_rtx = const0_rtx;
4168           break;
4169
4170         case GT:
4171           true_rtx = const1_rtx;
4172           false_rtx = const0_rtx;
4173           break;
4174
4175         case GE:
4176           true_rtx = const0_rtx;
4177           false_rtx = constm1_rtx;
4178           break;
4179
4180         case LT:
4181           true_rtx = constm1_rtx;
4182           false_rtx = const0_rtx;
4183           break;
4184
4185         case LE:
4186           true_rtx = const0_rtx;
4187           false_rtx = const1_rtx;
4188           break;
4189
4190         default:
4191           gcc_unreachable ();
4192         }
4193     }
4194
4195   if (comparison == UNORDERED)
4196     {
4197       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4198       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4199       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4200                                     temp, const_true_rtx, equiv);
4201     }
4202   else
4203     {
4204       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4205       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4206         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4207                                       equiv, true_rtx, false_rtx);
4208     }
4209
4210   start_sequence ();
4211   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4212                                    cmp_mode, x, mode, y, mode);
4213   insns = get_insns ();
4214   end_sequence ();
4215
4216   target = gen_reg_rtx (cmp_mode);
4217   emit_libcall_block (insns, target, value, equiv);
4218
4219   if (comparison == UNORDERED
4220       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4221       || reversed_p)
4222     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4223   else
4224     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4225
4226   *pmode = cmp_mode;
4227 }
4228 \f
4229 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4230
4231 void
4232 emit_indirect_jump (rtx loc)
4233 {
4234   if (!targetm.have_indirect_jump ())
4235     sorry ("indirect jumps are not available on this target");
4236   else
4237     {
4238       struct expand_operand ops[1];
4239       create_address_operand (&ops[0], loc);
4240       expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4241       emit_barrier ();
4242     }
4243 }
4244 \f
4245
4246 /* Emit a conditional move instruction if the machine supports one for that
4247    condition and machine mode.
4248
4249    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4250    the mode to use should they be constants.  If it is VOIDmode, they cannot
4251    both be constants.
4252
4253    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4254    should be stored there.  MODE is the mode to use should they be constants.
4255    If it is VOIDmode, they cannot both be constants.
4256
4257    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4258    is not supported.  */
4259
4260 rtx
4261 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4262                        machine_mode cmode, rtx op2, rtx op3,
4263                        machine_mode mode, int unsignedp)
4264 {
4265   rtx comparison;
4266   rtx_insn *last;
4267   enum insn_code icode;
4268   enum rtx_code reversed;
4269
4270   /* If the two source operands are identical, that's just a move.  */
4271
4272   if (rtx_equal_p (op2, op3))
4273     {
4274       if (!target)
4275         target = gen_reg_rtx (mode);
4276
4277       emit_move_insn (target, op3);
4278       return target;
4279     }
4280
4281   /* If one operand is constant, make it the second one.  Only do this
4282      if the other operand is not constant as well.  */
4283
4284   if (swap_commutative_operands_p (op0, op1))
4285     {
4286       std::swap (op0, op1);
4287       code = swap_condition (code);
4288     }
4289
4290   /* get_condition will prefer to generate LT and GT even if the old
4291      comparison was against zero, so undo that canonicalization here since
4292      comparisons against zero are cheaper.  */
4293   if (code == LT && op1 == const1_rtx)
4294     code = LE, op1 = const0_rtx;
4295   else if (code == GT && op1 == constm1_rtx)
4296     code = GE, op1 = const0_rtx;
4297
4298   if (cmode == VOIDmode)
4299     cmode = GET_MODE (op0);
4300
4301   enum rtx_code orig_code = code;
4302   bool swapped = false;
4303   if (swap_commutative_operands_p (op2, op3)
4304       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4305           != UNKNOWN))
4306     {
4307       std::swap (op2, op3);
4308       code = reversed;
4309       swapped = true;
4310     }
4311
4312   if (mode == VOIDmode)
4313     mode = GET_MODE (op2);
4314
4315   icode = direct_optab_handler (movcc_optab, mode);
4316
4317   if (icode == CODE_FOR_nothing)
4318     return NULL_RTX;
4319
4320   if (!target)
4321     target = gen_reg_rtx (mode);
4322
4323   for (int pass = 0; ; pass++)
4324     {
4325       code = unsignedp ? unsigned_condition (code) : code;
4326       comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4327
4328       /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4329          punt and let the caller figure out how best to deal with this
4330          situation.  */
4331       if (COMPARISON_P (comparison))
4332         {
4333           saved_pending_stack_adjust save;
4334           save_pending_stack_adjust (&save);
4335           last = get_last_insn ();
4336           do_pending_stack_adjust ();
4337           prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4338                             GET_CODE (comparison), NULL_RTX, unsignedp,
4339                             OPTAB_WIDEN, &comparison, &cmode);
4340           if (comparison)
4341             {
4342               struct expand_operand ops[4];
4343
4344               create_output_operand (&ops[0], target, mode);
4345               create_fixed_operand (&ops[1], comparison);
4346               create_input_operand (&ops[2], op2, mode);
4347               create_input_operand (&ops[3], op3, mode);
4348               if (maybe_expand_insn (icode, 4, ops))
4349                 {
4350                   if (ops[0].value != target)
4351                     convert_move (target, ops[0].value, false);
4352                   return target;
4353                 }
4354             }
4355           delete_insns_since (last);
4356           restore_pending_stack_adjust (&save);
4357         }
4358
4359       if (pass == 1)
4360         return NULL_RTX;
4361
4362       /* If the preferred op2/op3 order is not usable, retry with other
4363          operand order, perhaps it will expand successfully.  */
4364       if (swapped)
4365         code = orig_code;
4366       else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4367                                                            NULL))
4368                != UNKNOWN)
4369         code = reversed;
4370       else
4371         return NULL_RTX;
4372       std::swap (op2, op3);
4373     }
4374 }
4375
4376
4377 /* Emit a conditional negate or bitwise complement using the
4378    negcc or notcc optabs if available.  Return NULL_RTX if such operations
4379    are not available.  Otherwise return the RTX holding the result.
4380    TARGET is the desired destination of the result.  COMP is the comparison
4381    on which to negate.  If COND is true move into TARGET the negation
4382    or bitwise complement of OP1.  Otherwise move OP2 into TARGET.
4383    CODE is either NEG or NOT.  MODE is the machine mode in which the
4384    operation is performed.  */
4385
4386 rtx
4387 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4388                                      machine_mode mode, rtx cond, rtx op1,
4389                                      rtx op2)
4390 {
4391   optab op = unknown_optab;
4392   if (code == NEG)
4393     op = negcc_optab;
4394   else if (code == NOT)
4395     op = notcc_optab;
4396   else
4397     gcc_unreachable ();
4398
4399   insn_code icode = direct_optab_handler (op, mode);
4400
4401   if (icode == CODE_FOR_nothing)
4402     return NULL_RTX;
4403
4404   if (!target)
4405     target = gen_reg_rtx (mode);
4406
4407   rtx_insn *last = get_last_insn ();
4408   struct expand_operand ops[4];
4409
4410   create_output_operand (&ops[0], target, mode);
4411   create_fixed_operand (&ops[1], cond);
4412   create_input_operand (&ops[2], op1, mode);
4413   create_input_operand (&ops[3], op2, mode);
4414
4415   if (maybe_expand_insn (icode, 4, ops))
4416     {
4417       if (ops[0].value != target)
4418         convert_move (target, ops[0].value, false);
4419
4420       return target;
4421     }
4422   delete_insns_since (last);
4423   return NULL_RTX;
4424 }
4425
4426 /* Emit a conditional addition instruction if the machine supports one for that
4427    condition and machine mode.
4428
4429    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4430    the mode to use should they be constants.  If it is VOIDmode, they cannot
4431    both be constants.
4432
4433    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4434    should be stored there.  MODE is the mode to use should they be constants.
4435    If it is VOIDmode, they cannot both be constants.
4436
4437    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4438    is not supported.  */
4439
4440 rtx
4441 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4442                       machine_mode cmode, rtx op2, rtx op3,
4443                       machine_mode mode, int unsignedp)
4444 {
4445   rtx comparison;
4446   rtx_insn *last;
4447   enum insn_code icode;
4448
4449   /* If one operand is constant, make it the second one.  Only do this
4450      if the other operand is not constant as well.  */
4451
4452   if (swap_commutative_operands_p (op0, op1))
4453     {
4454       std::swap (op0, op1);
4455       code = swap_condition (code);
4456     }
4457
4458   /* get_condition will prefer to generate LT and GT even if the old
4459      comparison was against zero, so undo that canonicalization here since
4460      comparisons against zero are cheaper.  */
4461   if (code == LT && op1 == const1_rtx)
4462     code = LE, op1 = const0_rtx;
4463   else if (code == GT && op1 == constm1_rtx)
4464     code = GE, op1 = const0_rtx;
4465
4466   if (cmode == VOIDmode)
4467     cmode = GET_MODE (op0);
4468
4469   if (mode == VOIDmode)
4470     mode = GET_MODE (op2);
4471
4472   icode = optab_handler (addcc_optab, mode);
4473
4474   if (icode == CODE_FOR_nothing)
4475     return 0;
4476
4477   if (!target)
4478     target = gen_reg_rtx (mode);
4479
4480   code = unsignedp ? unsigned_condition (code) : code;
4481   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4482
4483   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4484      return NULL and let the caller figure out how best to deal with this
4485      situation.  */
4486   if (!COMPARISON_P (comparison))
4487     return NULL_RTX;
4488
4489   do_pending_stack_adjust ();
4490   last = get_last_insn ();
4491   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4492                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4493                     &comparison, &cmode);
4494   if (comparison)
4495     {
4496       struct expand_operand ops[4];
4497
4498       create_output_operand (&ops[0], target, mode);
4499       create_fixed_operand (&ops[1], comparison);
4500       create_input_operand (&ops[2], op2, mode);
4501       create_input_operand (&ops[3], op3, mode);
4502       if (maybe_expand_insn (icode, 4, ops))
4503         {
4504           if (ops[0].value != target)
4505             convert_move (target, ops[0].value, false);
4506           return target;
4507         }
4508     }
4509   delete_insns_since (last);
4510   return NULL_RTX;
4511 }
4512 \f
4513 /* These functions attempt to generate an insn body, rather than
4514    emitting the insn, but if the gen function already emits them, we
4515    make no attempt to turn them back into naked patterns.  */
4516
4517 /* Generate and return an insn body to add Y to X.  */
4518
4519 rtx_insn *
4520 gen_add2_insn (rtx x, rtx y)
4521 {
4522   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4523
4524   gcc_assert (insn_operand_matches (icode, 0, x));
4525   gcc_assert (insn_operand_matches (icode, 1, x));
4526   gcc_assert (insn_operand_matches (icode, 2, y));
4527
4528   return GEN_FCN (icode) (x, x, y);
4529 }
4530
4531 /* Generate and return an insn body to add r1 and c,
4532    storing the result in r0.  */
4533
4534 rtx_insn *
4535 gen_add3_insn (rtx r0, rtx r1, rtx c)
4536 {
4537   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4538
4539   if (icode == CODE_FOR_nothing
4540       || !insn_operand_matches (icode, 0, r0)
4541       || !insn_operand_matches (icode, 1, r1)
4542       || !insn_operand_matches (icode, 2, c))
4543     return NULL;
4544
4545   return GEN_FCN (icode) (r0, r1, c);
4546 }
4547
4548 int
4549 have_add2_insn (rtx x, rtx y)
4550 {
4551   enum insn_code icode;
4552
4553   gcc_assert (GET_MODE (x) != VOIDmode);
4554
4555   icode = optab_handler (add_optab, GET_MODE (x));
4556
4557   if (icode == CODE_FOR_nothing)
4558     return 0;
4559
4560   if (!insn_operand_matches (icode, 0, x)
4561       || !insn_operand_matches (icode, 1, x)
4562       || !insn_operand_matches (icode, 2, y))
4563     return 0;
4564
4565   return 1;
4566 }
4567
4568 /* Generate and return an insn body to add Y to X.  */
4569
4570 rtx_insn *
4571 gen_addptr3_insn (rtx x, rtx y, rtx z)
4572 {
4573   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4574
4575   gcc_assert (insn_operand_matches (icode, 0, x));
4576   gcc_assert (insn_operand_matches (icode, 1, y));
4577   gcc_assert (insn_operand_matches (icode, 2, z));
4578
4579   return GEN_FCN (icode) (x, y, z);
4580 }
4581
4582 /* Return true if the target implements an addptr pattern and X, Y,
4583    and Z are valid for the pattern predicates.  */
4584
4585 int
4586 have_addptr3_insn (rtx x, rtx y, rtx z)
4587 {
4588   enum insn_code icode;
4589
4590   gcc_assert (GET_MODE (x) != VOIDmode);
4591
4592   icode = optab_handler (addptr3_optab, GET_MODE (x));
4593
4594   if (icode == CODE_FOR_nothing)
4595     return 0;
4596
4597   if (!insn_operand_matches (icode, 0, x)
4598       || !insn_operand_matches (icode, 1, y)
4599       || !insn_operand_matches (icode, 2, z))
4600     return 0;
4601
4602   return 1;
4603 }
4604
4605 /* Generate and return an insn body to subtract Y from X.  */
4606
4607 rtx_insn *
4608 gen_sub2_insn (rtx x, rtx y)
4609 {
4610   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4611
4612   gcc_assert (insn_operand_matches (icode, 0, x));
4613   gcc_assert (insn_operand_matches (icode, 1, x));
4614   gcc_assert (insn_operand_matches (icode, 2, y));
4615
4616   return GEN_FCN (icode) (x, x, y);
4617 }
4618
4619 /* Generate and return an insn body to subtract r1 and c,
4620    storing the result in r0.  */
4621
4622 rtx_insn *
4623 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4624 {
4625   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4626
4627   if (icode == CODE_FOR_nothing
4628       || !insn_operand_matches (icode, 0, r0)
4629       || !insn_operand_matches (icode, 1, r1)
4630       || !insn_operand_matches (icode, 2, c))
4631     return NULL;
4632
4633   return GEN_FCN (icode) (r0, r1, c);
4634 }
4635
4636 int
4637 have_sub2_insn (rtx x, rtx y)
4638 {
4639   enum insn_code icode;
4640
4641   gcc_assert (GET_MODE (x) != VOIDmode);
4642
4643   icode = optab_handler (sub_optab, GET_MODE (x));
4644
4645   if (icode == CODE_FOR_nothing)
4646     return 0;
4647
4648   if (!insn_operand_matches (icode, 0, x)
4649       || !insn_operand_matches (icode, 1, x)
4650       || !insn_operand_matches (icode, 2, y))
4651     return 0;
4652
4653   return 1;
4654 }
4655 \f
4656 /* Generate the body of an insn to extend Y (with mode MFROM)
4657    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4658
4659 rtx_insn *
4660 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4661                  machine_mode mfrom, int unsignedp)
4662 {
4663   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4664   return GEN_FCN (icode) (x, y);
4665 }
4666 \f
4667 /* Generate code to convert FROM to floating point
4668    and store in TO.  FROM must be fixed point and not VOIDmode.
4669    UNSIGNEDP nonzero means regard FROM as unsigned.
4670    Normally this is done by correcting the final value
4671    if it is negative.  */
4672
4673 void
4674 expand_float (rtx to, rtx from, int unsignedp)
4675 {
4676   enum insn_code icode;
4677   rtx target = to;
4678   scalar_mode from_mode, to_mode;
4679   machine_mode fmode, imode;
4680   bool can_do_signed = false;
4681
4682   /* Crash now, because we won't be able to decide which mode to use.  */
4683   gcc_assert (GET_MODE (from) != VOIDmode);
4684
4685   /* Look for an insn to do the conversion.  Do it in the specified
4686      modes if possible; otherwise convert either input, output or both to
4687      wider mode.  If the integer mode is wider than the mode of FROM,
4688      we can do the conversion signed even if the input is unsigned.  */
4689
4690   FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4691     FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4692       {
4693         int doing_unsigned = unsignedp;
4694
4695         if (fmode != GET_MODE (to)
4696             && (significand_size (fmode)
4697                 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
4698           continue;
4699
4700         icode = can_float_p (fmode, imode, unsignedp);
4701         if (icode == CODE_FOR_nothing && unsignedp)
4702           {
4703             enum insn_code scode = can_float_p (fmode, imode, 0);
4704             if (scode != CODE_FOR_nothing)
4705               can_do_signed = true;
4706             if (imode != GET_MODE (from))
4707               icode = scode, doing_unsigned = 0;
4708           }
4709
4710         if (icode != CODE_FOR_nothing)
4711           {
4712             if (imode != GET_MODE (from))
4713               from = convert_to_mode (imode, from, unsignedp);
4714
4715             if (fmode != GET_MODE (to))
4716               target = gen_reg_rtx (fmode);
4717
4718             emit_unop_insn (icode, target, from,
4719                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4720
4721             if (target != to)
4722               convert_move (to, target, 0);
4723             return;
4724           }
4725       }
4726
4727   /* Unsigned integer, and no way to convert directly.  Convert as signed,
4728      then unconditionally adjust the result.  */
4729   if (unsignedp
4730       && can_do_signed
4731       && is_a <scalar_mode> (GET_MODE (to), &to_mode)
4732       && is_a <scalar_mode> (GET_MODE (from), &from_mode))
4733     {
4734       opt_scalar_mode fmode_iter;
4735       rtx_code_label *label = gen_label_rtx ();
4736       rtx temp;
4737       REAL_VALUE_TYPE offset;
4738
4739       /* Look for a usable floating mode FMODE wider than the source and at
4740          least as wide as the target.  Using FMODE will avoid rounding woes
4741          with unsigned values greater than the signed maximum value.  */
4742
4743       FOR_EACH_MODE_FROM (fmode_iter, to_mode)
4744         {
4745           scalar_mode fmode = fmode_iter.require ();
4746           if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
4747               && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
4748             break;
4749         }
4750
4751       if (!fmode_iter.exists (&fmode))
4752         {
4753           /* There is no such mode.  Pretend the target is wide enough.  */
4754           fmode = to_mode;
4755
4756           /* Avoid double-rounding when TO is narrower than FROM.  */
4757           if ((significand_size (fmode) + 1)
4758               < GET_MODE_PRECISION (from_mode))
4759             {
4760               rtx temp1;
4761               rtx_code_label *neglabel = gen_label_rtx ();
4762
4763               /* Don't use TARGET if it isn't a register, is a hard register,
4764                  or is the wrong mode.  */
4765               if (!REG_P (target)
4766                   || REGNO (target) < FIRST_PSEUDO_REGISTER
4767                   || GET_MODE (target) != fmode)
4768                 target = gen_reg_rtx (fmode);
4769
4770               imode = from_mode;
4771               do_pending_stack_adjust ();
4772
4773               /* Test whether the sign bit is set.  */
4774               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4775                                        0, neglabel);
4776
4777               /* The sign bit is not set.  Convert as signed.  */
4778               expand_float (target, from, 0);
4779               emit_jump_insn (targetm.gen_jump (label));
4780               emit_barrier ();
4781
4782               /* The sign bit is set.
4783                  Convert to a usable (positive signed) value by shifting right
4784                  one bit, while remembering if a nonzero bit was shifted
4785                  out; i.e., compute  (from & 1) | (from >> 1).  */
4786
4787               emit_label (neglabel);
4788               temp = expand_binop (imode, and_optab, from, const1_rtx,
4789                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
4790               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4791               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4792                                    OPTAB_LIB_WIDEN);
4793               expand_float (target, temp, 0);
4794
4795               /* Multiply by 2 to undo the shift above.  */
4796               temp = expand_binop (fmode, add_optab, target, target,
4797                                    target, 0, OPTAB_LIB_WIDEN);
4798               if (temp != target)
4799                 emit_move_insn (target, temp);
4800
4801               do_pending_stack_adjust ();
4802               emit_label (label);
4803               goto done;
4804             }
4805         }
4806
4807       /* If we are about to do some arithmetic to correct for an
4808          unsigned operand, do it in a pseudo-register.  */
4809
4810       if (to_mode != fmode
4811           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4812         target = gen_reg_rtx (fmode);
4813
4814       /* Convert as signed integer to floating.  */
4815       expand_float (target, from, 0);
4816
4817       /* If FROM is negative (and therefore TO is negative),
4818          correct its value by 2**bitwidth.  */
4819
4820       do_pending_stack_adjust ();
4821       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
4822                                0, label);
4823
4824
4825       real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
4826       temp = expand_binop (fmode, add_optab, target,
4827                            const_double_from_real_value (offset, fmode),
4828                            target, 0, OPTAB_LIB_WIDEN);
4829       if (temp != target)
4830         emit_move_insn (target, temp);
4831
4832       do_pending_stack_adjust ();
4833       emit_label (label);
4834       goto done;
4835     }
4836
4837   /* No hardware instruction available; call a library routine.  */
4838     {
4839       rtx libfunc;
4840       rtx_insn *insns;
4841       rtx value;
4842       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4843
4844       if (is_narrower_int_mode (GET_MODE (from), SImode))
4845         from = convert_to_mode (SImode, from, unsignedp);
4846
4847       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4848       gcc_assert (libfunc);
4849
4850       start_sequence ();
4851
4852       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4853                                        GET_MODE (to), from, GET_MODE (from));
4854       insns = get_insns ();
4855       end_sequence ();
4856
4857       emit_libcall_block (insns, target, value,
4858                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4859                                          GET_MODE (to), from));
4860     }
4861
4862  done:
4863
4864   /* Copy result to requested destination
4865      if we have been computing in a temp location.  */
4866
4867   if (target != to)
4868     {
4869       if (GET_MODE (target) == GET_MODE (to))
4870         emit_move_insn (to, target);
4871       else
4872         convert_move (to, target, 0);
4873     }
4874 }
4875 \f
4876 /* Generate code to convert FROM to fixed point and store in TO.  FROM
4877    must be floating point.  */
4878
4879 void
4880 expand_fix (rtx to, rtx from, int unsignedp)
4881 {
4882   enum insn_code icode;
4883   rtx target = to;
4884   machine_mode fmode, imode;
4885   opt_scalar_mode fmode_iter;
4886   bool must_trunc = false;
4887
4888   /* We first try to find a pair of modes, one real and one integer, at
4889      least as wide as FROM and TO, respectively, in which we can open-code
4890      this conversion.  If the integer mode is wider than the mode of TO,
4891      we can do the conversion either signed or unsigned.  */
4892
4893   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4894     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4895       {
4896         int doing_unsigned = unsignedp;
4897
4898         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4899         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4900           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4901
4902         if (icode != CODE_FOR_nothing)
4903           {
4904             rtx_insn *last = get_last_insn ();
4905             if (fmode != GET_MODE (from))
4906               from = convert_to_mode (fmode, from, 0);
4907
4908             if (must_trunc)
4909               {
4910                 rtx temp = gen_reg_rtx (GET_MODE (from));
4911                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4912                                     temp, 0);
4913               }
4914
4915             if (imode != GET_MODE (to))
4916               target = gen_reg_rtx (imode);
4917
4918             if (maybe_emit_unop_insn (icode, target, from,
4919                                       doing_unsigned ? UNSIGNED_FIX : FIX))
4920               {
4921                 if (target != to)
4922                   convert_move (to, target, unsignedp);
4923                 return;
4924               }
4925             delete_insns_since (last);
4926           }
4927       }
4928
4929   /* For an unsigned conversion, there is one more way to do it.
4930      If we have a signed conversion, we generate code that compares
4931      the real value to the largest representable positive number.  If if
4932      is smaller, the conversion is done normally.  Otherwise, subtract
4933      one plus the highest signed number, convert, and add it back.
4934
4935      We only need to check all real modes, since we know we didn't find
4936      anything with a wider integer mode.
4937
4938      This code used to extend FP value into mode wider than the destination.
4939      This is needed for decimal float modes which cannot accurately
4940      represent one plus the highest signed number of the same size, but
4941      not for binary modes.  Consider, for instance conversion from SFmode
4942      into DImode.
4943
4944      The hot path through the code is dealing with inputs smaller than 2^63
4945      and doing just the conversion, so there is no bits to lose.
4946
4947      In the other path we know the value is positive in the range 2^63..2^64-1
4948      inclusive.  (as for other input overflow happens and result is undefined)
4949      So we know that the most important bit set in mantissa corresponds to
4950      2^63.  The subtraction of 2^63 should not generate any rounding as it
4951      simply clears out that bit.  The rest is trivial.  */
4952
4953   scalar_int_mode to_mode;
4954   if (unsignedp
4955       && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
4956       && HWI_COMPUTABLE_MODE_P (to_mode))
4957     FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
4958       {
4959         scalar_mode fmode = fmode_iter.require ();
4960         if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
4961                                            0, &must_trunc)
4962             && (!DECIMAL_FLOAT_MODE_P (fmode)
4963                 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
4964           {
4965             int bitsize;
4966             REAL_VALUE_TYPE offset;
4967             rtx limit;
4968             rtx_code_label *lab1, *lab2;
4969             rtx_insn *insn;
4970
4971             bitsize = GET_MODE_PRECISION (to_mode);
4972             real_2expN (&offset, bitsize - 1, fmode);
4973             limit = const_double_from_real_value (offset, fmode);
4974             lab1 = gen_label_rtx ();
4975             lab2 = gen_label_rtx ();
4976
4977             if (fmode != GET_MODE (from))
4978               from = convert_to_mode (fmode, from, 0);
4979
4980             /* See if we need to do the subtraction.  */
4981             do_pending_stack_adjust ();
4982             emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
4983                                      GET_MODE (from), 0, lab1);
4984
4985             /* If not, do the signed "fix" and branch around fixup code.  */
4986             expand_fix (to, from, 0);
4987             emit_jump_insn (targetm.gen_jump (lab2));
4988             emit_barrier ();
4989
4990             /* Otherwise, subtract 2**(N-1), convert to signed number,
4991                then add 2**(N-1).  Do the addition using XOR since this
4992                will often generate better code.  */
4993             emit_label (lab1);
4994             target = expand_binop (GET_MODE (from), sub_optab, from, limit,
4995                                    NULL_RTX, 0, OPTAB_LIB_WIDEN);
4996             expand_fix (to, target, 0);
4997             target = expand_binop (to_mode, xor_optab, to,
4998                                    gen_int_mode
4999                                    (HOST_WIDE_INT_1 << (bitsize - 1),
5000                                     to_mode),
5001                                    to, 1, OPTAB_LIB_WIDEN);
5002
5003             if (target != to)
5004               emit_move_insn (to, target);
5005
5006             emit_label (lab2);
5007
5008             if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5009               {
5010                 /* Make a place for a REG_NOTE and add it.  */
5011                 insn = emit_move_insn (to, to);
5012                 set_dst_reg_note (insn, REG_EQUAL,
5013                                   gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5014                                                  copy_rtx (from)),
5015                                   to);
5016               }
5017
5018             return;
5019           }
5020       }
5021
5022   /* We can't do it with an insn, so use a library call.  But first ensure
5023      that the mode of TO is at least as wide as SImode, since those are the
5024      only library calls we know about.  */
5025
5026   if (is_narrower_int_mode (GET_MODE (to), SImode))
5027     {
5028       target = gen_reg_rtx (SImode);
5029
5030       expand_fix (target, from, unsignedp);
5031     }
5032   else
5033     {
5034       rtx_insn *insns;
5035       rtx value;
5036       rtx libfunc;
5037
5038       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5039       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5040       gcc_assert (libfunc);
5041
5042       start_sequence ();
5043
5044       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5045                                        GET_MODE (to), from, GET_MODE (from));
5046       insns = get_insns ();
5047       end_sequence ();
5048
5049       emit_libcall_block (insns, target, value,
5050                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5051                                          GET_MODE (to), from));
5052     }
5053
5054   if (target != to)
5055     {
5056       if (GET_MODE (to) == GET_MODE (target))
5057         emit_move_insn (to, target);
5058       else
5059         convert_move (to, target, 0);
5060     }
5061 }
5062
5063
5064 /* Promote integer arguments for a libcall if necessary.
5065    emit_library_call_value cannot do the promotion because it does not
5066    know if it should do a signed or unsigned promotion.  This is because
5067    there are no tree types defined for libcalls.  */
5068
5069 static rtx
5070 prepare_libcall_arg (rtx arg, int uintp)
5071 {
5072   scalar_int_mode mode;
5073   machine_mode arg_mode;
5074   if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5075     {
5076       /*  If we need to promote the integer function argument we need to do
5077           it here instead of inside emit_library_call_value because in
5078           emit_library_call_value we don't know if we should do a signed or
5079           unsigned promotion.  */
5080
5081       int unsigned_p = 0;
5082       arg_mode = promote_function_mode (NULL_TREE, mode,
5083                                         &unsigned_p, NULL_TREE, 0);
5084       if (arg_mode != mode)
5085         return convert_to_mode (arg_mode, arg, uintp);
5086     }
5087     return arg;
5088 }
5089
5090 /* Generate code to convert FROM or TO a fixed-point.
5091    If UINTP is true, either TO or FROM is an unsigned integer.
5092    If SATP is true, we need to saturate the result.  */
5093
5094 void
5095 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5096 {
5097   machine_mode to_mode = GET_MODE (to);
5098   machine_mode from_mode = GET_MODE (from);
5099   convert_optab tab;
5100   enum rtx_code this_code;
5101   enum insn_code code;
5102   rtx_insn *insns;
5103   rtx value;
5104   rtx libfunc;
5105
5106   if (to_mode == from_mode)
5107     {
5108       emit_move_insn (to, from);
5109       return;
5110     }
5111
5112   if (uintp)
5113     {
5114       tab = satp ? satfractuns_optab : fractuns_optab;
5115       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5116     }
5117   else
5118     {
5119       tab = satp ? satfract_optab : fract_optab;
5120       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5121     }
5122   code = convert_optab_handler (tab, to_mode, from_mode);
5123   if (code != CODE_FOR_nothing)
5124     {
5125       emit_unop_insn (code, to, from, this_code);
5126       return;
5127     }
5128
5129   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5130   gcc_assert (libfunc);
5131
5132   from = prepare_libcall_arg (from, uintp);
5133   from_mode = GET_MODE (from);
5134
5135   start_sequence ();
5136   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5137                                    from, from_mode);
5138   insns = get_insns ();
5139   end_sequence ();
5140
5141   emit_libcall_block (insns, to, value,
5142                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5143 }
5144
5145 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5146    must be floating point, TO must be signed.  Use the conversion optab
5147    TAB to do the conversion.  */
5148
5149 bool
5150 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5151 {
5152   enum insn_code icode;
5153   rtx target = to;
5154   machine_mode fmode, imode;
5155
5156   /* We first try to find a pair of modes, one real and one integer, at
5157      least as wide as FROM and TO, respectively, in which we can open-code
5158      this conversion.  If the integer mode is wider than the mode of TO,
5159      we can do the conversion either signed or unsigned.  */
5160
5161   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5162     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5163       {
5164         icode = convert_optab_handler (tab, imode, fmode);
5165         if (icode != CODE_FOR_nothing)
5166           {
5167             rtx_insn *last = get_last_insn ();
5168             if (fmode != GET_MODE (from))
5169               from = convert_to_mode (fmode, from, 0);
5170
5171             if (imode != GET_MODE (to))
5172               target = gen_reg_rtx (imode);
5173
5174             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5175               {
5176                 delete_insns_since (last);
5177                 continue;
5178               }
5179             if (target != to)
5180               convert_move (to, target, 0);
5181             return true;
5182           }
5183       }
5184
5185   return false;
5186 }
5187 \f
5188 /* Report whether we have an instruction to perform the operation
5189    specified by CODE on operands of mode MODE.  */
5190 int
5191 have_insn_for (enum rtx_code code, machine_mode mode)
5192 {
5193   return (code_to_optab (code)
5194           && (optab_handler (code_to_optab (code), mode)
5195               != CODE_FOR_nothing));
5196 }
5197
5198 /* Print information about the current contents of the optabs on
5199    STDERR.  */
5200
5201 DEBUG_FUNCTION void
5202 debug_optab_libfuncs (void)
5203 {
5204   int i, j, k;
5205
5206   /* Dump the arithmetic optabs.  */
5207   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5208     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5209       {
5210         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5211         if (l)
5212           {
5213             gcc_assert (GET_CODE (l) == SYMBOL_REF);
5214             fprintf (stderr, "%s\t%s:\t%s\n",
5215                      GET_RTX_NAME (optab_to_code ((optab) i)),
5216                      GET_MODE_NAME (j),
5217                      XSTR (l, 0));
5218           }
5219       }
5220
5221   /* Dump the conversion optabs.  */
5222   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5223     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5224       for (k = 0; k < NUM_MACHINE_MODES; ++k)
5225         {
5226           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5227                                          (machine_mode) k);
5228           if (l)
5229             {
5230               gcc_assert (GET_CODE (l) == SYMBOL_REF);
5231               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5232                        GET_RTX_NAME (optab_to_code ((optab) i)),
5233                        GET_MODE_NAME (j),
5234                        GET_MODE_NAME (k),
5235                        XSTR (l, 0));
5236             }
5237         }
5238 }
5239
5240 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5241    CODE.  Return 0 on failure.  */
5242
5243 rtx_insn *
5244 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5245 {
5246   machine_mode mode = GET_MODE (op1);
5247   enum insn_code icode;
5248   rtx_insn *insn;
5249   rtx trap_rtx;
5250
5251   if (mode == VOIDmode)
5252     return 0;
5253
5254   icode = optab_handler (ctrap_optab, mode);
5255   if (icode == CODE_FOR_nothing)
5256     return 0;
5257
5258   /* Some targets only accept a zero trap code.  */
5259   if (!insn_operand_matches (icode, 3, tcode))
5260     return 0;
5261
5262   do_pending_stack_adjust ();
5263   start_sequence ();
5264   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5265                     &trap_rtx, &mode);
5266   if (!trap_rtx)
5267     insn = NULL;
5268   else
5269     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5270                             tcode);
5271
5272   /* If that failed, then give up.  */
5273   if (insn == 0)
5274     {
5275       end_sequence ();
5276       return 0;
5277     }
5278
5279   emit_insn (insn);
5280   insn = get_insns ();
5281   end_sequence ();
5282   return insn;
5283 }
5284
5285 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5286    or unsigned operation code.  */
5287
5288 enum rtx_code
5289 get_rtx_code (enum tree_code tcode, bool unsignedp)
5290 {
5291   enum rtx_code code;
5292   switch (tcode)
5293     {
5294     case EQ_EXPR:
5295       code = EQ;
5296       break;
5297     case NE_EXPR:
5298       code = NE;
5299       break;
5300     case LT_EXPR:
5301       code = unsignedp ? LTU : LT;
5302       break;
5303     case LE_EXPR:
5304       code = unsignedp ? LEU : LE;
5305       break;
5306     case GT_EXPR:
5307       code = unsignedp ? GTU : GT;
5308       break;
5309     case GE_EXPR:
5310       code = unsignedp ? GEU : GE;
5311       break;
5312
5313     case UNORDERED_EXPR:
5314       code = UNORDERED;
5315       break;
5316     case ORDERED_EXPR:
5317       code = ORDERED;
5318       break;
5319     case UNLT_EXPR:
5320       code = UNLT;
5321       break;
5322     case UNLE_EXPR:
5323       code = UNLE;
5324       break;
5325     case UNGT_EXPR:
5326       code = UNGT;
5327       break;
5328     case UNGE_EXPR:
5329       code = UNGE;
5330       break;
5331     case UNEQ_EXPR:
5332       code = UNEQ;
5333       break;
5334     case LTGT_EXPR:
5335       code = LTGT;
5336       break;
5337
5338     case BIT_AND_EXPR:
5339       code = AND;
5340       break;
5341
5342     case BIT_IOR_EXPR:
5343       code = IOR;
5344       break;
5345
5346     default:
5347       gcc_unreachable ();
5348     }
5349   return code;
5350 }
5351
5352 /* Return a comparison rtx of mode CMP_MODE for COND.  Use UNSIGNEDP to
5353    select signed or unsigned operators.  OPNO holds the index of the
5354    first comparison operand for insn ICODE.  Do not generate the
5355    compare instruction itself.  */
5356
5357 static rtx
5358 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5359                     tree t_op0, tree t_op1, bool unsignedp,
5360                     enum insn_code icode, unsigned int opno)
5361 {
5362   struct expand_operand ops[2];
5363   rtx rtx_op0, rtx_op1;
5364   machine_mode m0, m1;
5365   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5366
5367   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5368
5369   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
5370      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5371      cases, use the original mode.  */
5372   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5373                          EXPAND_STACK_PARM);
5374   m0 = GET_MODE (rtx_op0);
5375   if (m0 == VOIDmode)
5376     m0 = TYPE_MODE (TREE_TYPE (t_op0));
5377
5378   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5379                          EXPAND_STACK_PARM);
5380   m1 = GET_MODE (rtx_op1);
5381   if (m1 == VOIDmode)
5382     m1 = TYPE_MODE (TREE_TYPE (t_op1));
5383
5384   create_input_operand (&ops[0], rtx_op0, m0);
5385   create_input_operand (&ops[1], rtx_op1, m1);
5386   if (!maybe_legitimize_operands (icode, opno, 2, ops))
5387     gcc_unreachable ();
5388   return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5389 }
5390
5391 /* Check if vec_perm mask SEL is a constant equivalent to a shift of
5392    the first vec_perm operand, assuming the second operand is a constant
5393    vector of zeros.  Return the shift distance in bits if so, or NULL_RTX
5394    if the vec_perm is not a shift.  MODE is the mode of the value being
5395    shifted.  */
5396 static rtx
5397 shift_amt_for_vec_perm_mask (machine_mode mode, const vec_perm_indices &sel)
5398 {
5399   unsigned int bitsize = GET_MODE_UNIT_BITSIZE (mode);
5400   poly_int64 first = sel[0];
5401   if (maybe_ge (sel[0], GET_MODE_NUNITS (mode)))
5402     return NULL_RTX;
5403
5404   if (!sel.series_p (0, 1, first, 1))
5405     {
5406       unsigned int nelt;
5407       if (!GET_MODE_NUNITS (mode).is_constant (&nelt))
5408         return NULL_RTX;
5409       for (unsigned int i = 1; i < nelt; i++)
5410         {
5411           poly_int64 expected = i + first;
5412           /* Indices into the second vector are all equivalent.  */
5413           if (maybe_lt (sel[i], nelt)
5414               ? maybe_ne (sel[i], expected)
5415               : maybe_lt (expected, nelt))
5416             return NULL_RTX;
5417         }
5418     }
5419
5420   return gen_int_shift_amount (mode, first * bitsize);
5421 }
5422
5423 /* A subroutine of expand_vec_perm_var for expanding one vec_perm insn.  */
5424
5425 static rtx
5426 expand_vec_perm_1 (enum insn_code icode, rtx target,
5427                    rtx v0, rtx v1, rtx sel)
5428 {
5429   machine_mode tmode = GET_MODE (target);
5430   machine_mode smode = GET_MODE (sel);
5431   struct expand_operand ops[4];
5432
5433   gcc_assert (GET_MODE_CLASS (smode) == MODE_VECTOR_INT
5434               || mode_for_int_vector (tmode).require () == smode);
5435   create_output_operand (&ops[0], target, tmode);
5436   create_input_operand (&ops[3], sel, smode);
5437
5438   /* Make an effort to preserve v0 == v1.  The target expander is able to
5439      rely on this to determine if we're permuting a single input operand.  */
5440   if (rtx_equal_p (v0, v1))
5441     {
5442       if (!insn_operand_matches (icode, 1, v0))
5443         v0 = force_reg (tmode, v0);
5444       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5445       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5446
5447       create_fixed_operand (&ops[1], v0);
5448       create_fixed_operand (&ops[2], v0);
5449     }
5450   else
5451     {
5452       create_input_operand (&ops[1], v0, tmode);
5453       create_input_operand (&ops[2], v1, tmode);
5454     }
5455
5456   if (maybe_expand_insn (icode, 4, ops))
5457     return ops[0].value;
5458   return NULL_RTX;
5459 }
5460
5461 /* Implement a permutation of vectors v0 and v1 using the permutation
5462    vector in SEL and return the result.  Use TARGET to hold the result
5463    if nonnull and convenient.
5464
5465    MODE is the mode of the vectors being permuted (V0 and V1).  SEL_MODE
5466    is the TYPE_MODE associated with SEL, or BLKmode if SEL isn't known
5467    to have a particular mode.  */
5468
5469 rtx
5470 expand_vec_perm_const (machine_mode mode, rtx v0, rtx v1,
5471                        const vec_perm_builder &sel, machine_mode sel_mode,
5472                        rtx target)
5473 {
5474   if (!target || !register_operand (target, mode))
5475     target = gen_reg_rtx (mode);
5476
5477   /* Set QIMODE to a different vector mode with byte elements.
5478      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
5479   machine_mode qimode;
5480   if (!qimode_for_vec_perm (mode).exists (&qimode))
5481     qimode = VOIDmode;
5482
5483   rtx_insn *last = get_last_insn ();
5484
5485   bool single_arg_p = rtx_equal_p (v0, v1);
5486   /* Always specify two input vectors here and leave the target to handle
5487      cases in which the inputs are equal.  Not all backends can cope with
5488      the single-input representation when testing for a double-input
5489      target instruction.  */
5490   vec_perm_indices indices (sel, 2, GET_MODE_NUNITS (mode));
5491
5492   /* See if this can be handled with a vec_shr.  We only do this if the
5493      second vector is all zeroes.  */
5494   insn_code shift_code = optab_handler (vec_shr_optab, mode);
5495   insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5496                              ? optab_handler (vec_shr_optab, qimode)
5497                              : CODE_FOR_nothing);
5498
5499   if (v1 == CONST0_RTX (GET_MODE (v1))
5500       && (shift_code != CODE_FOR_nothing
5501           || shift_code_qi != CODE_FOR_nothing))
5502     {
5503       rtx shift_amt = shift_amt_for_vec_perm_mask (mode, indices);
5504       if (shift_amt)
5505         {
5506           struct expand_operand ops[3];
5507           if (shift_code != CODE_FOR_nothing)
5508             {
5509               create_output_operand (&ops[0], target, mode);
5510               create_input_operand (&ops[1], v0, mode);
5511               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5512               if (maybe_expand_insn (shift_code, 3, ops))
5513                 return ops[0].value;
5514             }
5515           if (shift_code_qi != CODE_FOR_nothing)
5516             {
5517               rtx tmp = gen_reg_rtx (qimode);
5518               create_output_operand (&ops[0], tmp, qimode);
5519               create_input_operand (&ops[1], gen_lowpart (qimode, v0), qimode);
5520               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5521               if (maybe_expand_insn (shift_code_qi, 3, ops))
5522                 return gen_lowpart (mode, ops[0].value);
5523             }
5524         }
5525     }
5526
5527   if (targetm.vectorize.vec_perm_const != NULL)
5528     {
5529       v0 = force_reg (mode, v0);
5530       if (single_arg_p)
5531         v1 = v0;
5532       else
5533         v1 = force_reg (mode, v1);
5534
5535       if (targetm.vectorize.vec_perm_const (mode, target, v0, v1, indices))
5536         return target;
5537     }
5538
5539   /* Fall back to a constant byte-based permutation.  */
5540   vec_perm_indices qimode_indices;
5541   rtx target_qi = NULL_RTX, v0_qi = NULL_RTX, v1_qi = NULL_RTX;
5542   if (qimode != VOIDmode)
5543     {
5544       qimode_indices.new_expanded_vector (indices, GET_MODE_UNIT_SIZE (mode));
5545       target_qi = gen_reg_rtx (qimode);
5546       v0_qi = gen_lowpart (qimode, v0);
5547       v1_qi = gen_lowpart (qimode, v1);
5548       if (targetm.vectorize.vec_perm_const != NULL
5549           && targetm.vectorize.vec_perm_const (qimode, target_qi, v0_qi,
5550                                                v1_qi, qimode_indices))
5551         return gen_lowpart (mode, target_qi);
5552     }
5553
5554   /* Otherwise expand as a fully variable permuation.  */
5555
5556   /* The optabs are only defined for selectors with the same width
5557      as the values being permuted.  */
5558   machine_mode required_sel_mode;
5559   if (!mode_for_int_vector (mode).exists (&required_sel_mode)
5560       || !VECTOR_MODE_P (required_sel_mode))
5561     {
5562       delete_insns_since (last);
5563       return NULL_RTX;
5564     }
5565
5566   /* We know that it is semantically valid to treat SEL as having SEL_MODE.
5567      If that isn't the mode we want then we need to prove that using
5568      REQUIRED_SEL_MODE is OK.  */
5569   if (sel_mode != required_sel_mode)
5570     {
5571       if (!selector_fits_mode_p (required_sel_mode, indices))
5572         {
5573           delete_insns_since (last);
5574           return NULL_RTX;
5575         }
5576       sel_mode = required_sel_mode;
5577     }
5578
5579   insn_code icode = direct_optab_handler (vec_perm_optab, mode);
5580   if (icode != CODE_FOR_nothing)
5581     {
5582       rtx sel_rtx = vec_perm_indices_to_rtx (sel_mode, indices);
5583       rtx tmp = expand_vec_perm_1 (icode, target, v0, v1, sel_rtx);
5584       if (tmp)
5585         return tmp;
5586     }
5587
5588   if (qimode != VOIDmode
5589       && selector_fits_mode_p (qimode, qimode_indices))
5590     {
5591       icode = direct_optab_handler (vec_perm_optab, qimode);
5592       if (icode != CODE_FOR_nothing)
5593         {
5594           rtx sel_qi = vec_perm_indices_to_rtx (qimode, qimode_indices);
5595           rtx tmp = expand_vec_perm_1 (icode, target_qi, v0_qi, v1_qi, sel_qi);
5596           if (tmp)
5597             return gen_lowpart (mode, tmp);
5598         }
5599     }
5600
5601   delete_insns_since (last);
5602   return NULL_RTX;
5603 }
5604
5605 /* Implement a permutation of vectors v0 and v1 using the permutation
5606    vector in SEL and return the result.  Use TARGET to hold the result
5607    if nonnull and convenient.
5608
5609    MODE is the mode of the vectors being permuted (V0 and V1).
5610    SEL must have the integer equivalent of MODE and is known to be
5611    unsuitable for permutes with a constant permutation vector.  */
5612
5613 rtx
5614 expand_vec_perm_var (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5615 {
5616   enum insn_code icode;
5617   unsigned int i, w, u;
5618   rtx tmp, sel_qi;
5619
5620   w = GET_MODE_SIZE (mode);
5621   u = GET_MODE_UNIT_SIZE (mode);
5622
5623   if (!target || GET_MODE (target) != mode)
5624     target = gen_reg_rtx (mode);
5625
5626   icode = direct_optab_handler (vec_perm_optab, mode);
5627   if (icode != CODE_FOR_nothing)
5628     {
5629       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5630       if (tmp)
5631         return tmp;
5632     }
5633
5634   /* As a special case to aid several targets, lower the element-based
5635      permutation to a byte-based permutation and try again.  */
5636   machine_mode qimode;
5637   if (!qimode_for_vec_perm (mode).exists (&qimode)
5638       || maybe_gt (GET_MODE_NUNITS (qimode), GET_MODE_MASK (QImode) + 1))
5639     return NULL_RTX;
5640   icode = direct_optab_handler (vec_perm_optab, qimode);
5641   if (icode == CODE_FOR_nothing)
5642     return NULL_RTX;
5643
5644   /* Multiply each element by its byte size.  */
5645   machine_mode selmode = GET_MODE (sel);
5646   if (u == 2)
5647     sel = expand_simple_binop (selmode, PLUS, sel, sel,
5648                                NULL, 0, OPTAB_DIRECT);
5649   else
5650     sel = expand_simple_binop (selmode, ASHIFT, sel,
5651                                gen_int_shift_amount (selmode, exact_log2 (u)),
5652                                NULL, 0, OPTAB_DIRECT);
5653   gcc_assert (sel != NULL);
5654
5655   /* Broadcast the low byte each element into each of its bytes.
5656      The encoding has U interleaved stepped patterns, one for each
5657      byte of an element.  */
5658   vec_perm_builder const_sel (w, u, 3);
5659   unsigned int low_byte_in_u = BYTES_BIG_ENDIAN ? u - 1 : 0;
5660   for (i = 0; i < 3; ++i)
5661     for (unsigned int j = 0; j < u; ++j)
5662       const_sel.quick_push (i * u + low_byte_in_u);
5663   sel = gen_lowpart (qimode, sel);
5664   sel = expand_vec_perm_const (qimode, sel, sel, const_sel, qimode, NULL);
5665   gcc_assert (sel != NULL);
5666
5667   /* Add the byte offset to each byte element.  */
5668   /* Note that the definition of the indicies here is memory ordering,
5669      so there should be no difference between big and little endian.  */
5670   rtx_vector_builder byte_indices (qimode, u, 1);
5671   for (i = 0; i < u; ++i)
5672     byte_indices.quick_push (GEN_INT (i));
5673   tmp = byte_indices.build ();
5674   sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5675                                 sel, 0, OPTAB_DIRECT);
5676   gcc_assert (sel_qi != NULL);
5677
5678   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5679   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5680                            gen_lowpart (qimode, v1), sel_qi);
5681   if (tmp)
5682     tmp = gen_lowpart (mode, tmp);
5683   return tmp;
5684 }
5685
5686 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5687    three operands.  */
5688
5689 rtx
5690 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5691                            rtx target)
5692 {
5693   struct expand_operand ops[4];
5694   machine_mode mode = TYPE_MODE (vec_cond_type);
5695   machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5696   enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5697   rtx mask, rtx_op1, rtx_op2;
5698
5699   if (icode == CODE_FOR_nothing)
5700     return 0;
5701
5702   mask = expand_normal (op0);
5703   rtx_op1 = expand_normal (op1);
5704   rtx_op2 = expand_normal (op2);
5705
5706   mask = force_reg (mask_mode, mask);
5707   rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5708
5709   create_output_operand (&ops[0], target, mode);
5710   create_input_operand (&ops[1], rtx_op1, mode);
5711   create_input_operand (&ops[2], rtx_op2, mode);
5712   create_input_operand (&ops[3], mask, mask_mode);
5713   expand_insn (icode, 4, ops);
5714
5715   return ops[0].value;
5716 }
5717
5718 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5719    three operands.  */
5720
5721 rtx
5722 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5723                       rtx target)
5724 {
5725   struct expand_operand ops[6];
5726   enum insn_code icode;
5727   rtx comparison, rtx_op1, rtx_op2;
5728   machine_mode mode = TYPE_MODE (vec_cond_type);
5729   machine_mode cmp_op_mode;
5730   bool unsignedp;
5731   tree op0a, op0b;
5732   enum tree_code tcode;
5733
5734   if (COMPARISON_CLASS_P (op0))
5735     {
5736       op0a = TREE_OPERAND (op0, 0);
5737       op0b = TREE_OPERAND (op0, 1);
5738       tcode = TREE_CODE (op0);
5739     }
5740   else
5741     {
5742       gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5743       if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5744           != CODE_FOR_nothing)
5745         return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5746                                           op2, target);
5747       /* Fake op0 < 0.  */
5748       else
5749         {
5750           gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5751                       == MODE_VECTOR_INT);
5752           op0a = op0;
5753           op0b = build_zero_cst (TREE_TYPE (op0));
5754           tcode = LT_EXPR;
5755         }
5756     }
5757   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5758   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5759
5760
5761   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
5762               && known_eq (GET_MODE_NUNITS (mode),
5763                            GET_MODE_NUNITS (cmp_op_mode)));
5764
5765   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5766   if (icode == CODE_FOR_nothing)
5767     {
5768       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5769         icode = get_vcond_eq_icode (mode, cmp_op_mode);
5770       if (icode == CODE_FOR_nothing)
5771         return 0;
5772     }
5773
5774   comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5775                                    icode, 4);
5776   rtx_op1 = expand_normal (op1);
5777   rtx_op2 = expand_normal (op2);
5778
5779   create_output_operand (&ops[0], target, mode);
5780   create_input_operand (&ops[1], rtx_op1, mode);
5781   create_input_operand (&ops[2], rtx_op2, mode);
5782   create_fixed_operand (&ops[3], comparison);
5783   create_fixed_operand (&ops[4], XEXP (comparison, 0));
5784   create_fixed_operand (&ops[5], XEXP (comparison, 1));
5785   expand_insn (icode, 6, ops);
5786   return ops[0].value;
5787 }
5788
5789 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
5790    Use TARGET for the result if nonnull and convenient.  */
5791
5792 rtx
5793 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
5794 {
5795   struct expand_operand ops[3];
5796   enum insn_code icode;
5797   machine_mode emode = GET_MODE_INNER (vmode);
5798
5799   icode = direct_optab_handler (vec_series_optab, vmode);
5800   gcc_assert (icode != CODE_FOR_nothing);
5801
5802   create_output_operand (&ops[0], target, vmode);
5803   create_input_operand (&ops[1], op0, emode);
5804   create_input_operand (&ops[2], op1, emode);
5805
5806   expand_insn (icode, 3, ops);
5807   return ops[0].value;
5808 }
5809
5810 /* Generate insns for a vector comparison into a mask.  */
5811
5812 rtx
5813 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5814 {
5815   struct expand_operand ops[4];
5816   enum insn_code icode;
5817   rtx comparison;
5818   machine_mode mask_mode = TYPE_MODE (type);
5819   machine_mode vmode;
5820   bool unsignedp;
5821   tree op0a, op0b;
5822   enum tree_code tcode;
5823
5824   op0a = TREE_OPERAND (exp, 0);
5825   op0b = TREE_OPERAND (exp, 1);
5826   tcode = TREE_CODE (exp);
5827
5828   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5829   vmode = TYPE_MODE (TREE_TYPE (op0a));
5830
5831   icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5832   if (icode == CODE_FOR_nothing)
5833     {
5834       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5835         icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5836       if (icode == CODE_FOR_nothing)
5837         return 0;
5838     }
5839
5840   comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5841                                    unsignedp, icode, 2);
5842   create_output_operand (&ops[0], target, mask_mode);
5843   create_fixed_operand (&ops[1], comparison);
5844   create_fixed_operand (&ops[2], XEXP (comparison, 0));
5845   create_fixed_operand (&ops[3], XEXP (comparison, 1));
5846   expand_insn (icode, 4, ops);
5847   return ops[0].value;
5848 }
5849
5850 /* Expand a highpart multiply.  */
5851
5852 rtx
5853 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5854                       rtx target, bool uns_p)
5855 {
5856   struct expand_operand eops[3];
5857   enum insn_code icode;
5858   int method, i;
5859   machine_mode wmode;
5860   rtx m1, m2;
5861   optab tab1, tab2;
5862
5863   method = can_mult_highpart_p (mode, uns_p);
5864   switch (method)
5865     {
5866     case 0:
5867       return NULL_RTX;
5868     case 1:
5869       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5870       return expand_binop (mode, tab1, op0, op1, target, uns_p,
5871                            OPTAB_LIB_WIDEN);
5872     case 2:
5873       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5874       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5875       break;
5876     case 3:
5877       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5878       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5879       if (BYTES_BIG_ENDIAN)
5880         std::swap (tab1, tab2);
5881       break;
5882     default:
5883       gcc_unreachable ();
5884     }
5885
5886   icode = optab_handler (tab1, mode);
5887   wmode = insn_data[icode].operand[0].mode;
5888   gcc_checking_assert (known_eq (2 * GET_MODE_NUNITS (wmode),
5889                                  GET_MODE_NUNITS (mode)));
5890   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
5891
5892   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5893   create_input_operand (&eops[1], op0, mode);
5894   create_input_operand (&eops[2], op1, mode);
5895   expand_insn (icode, 3, eops);
5896   m1 = gen_lowpart (mode, eops[0].value);
5897
5898   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5899   create_input_operand (&eops[1], op0, mode);
5900   create_input_operand (&eops[2], op1, mode);
5901   expand_insn (optab_handler (tab2, mode), 3, eops);
5902   m2 = gen_lowpart (mode, eops[0].value);
5903
5904   vec_perm_builder sel;
5905   if (method == 2)
5906     {
5907       /* The encoding has 2 interleaved stepped patterns.  */
5908       sel.new_vector (GET_MODE_NUNITS (mode), 2, 3);
5909       for (i = 0; i < 6; ++i)
5910         sel.quick_push (!BYTES_BIG_ENDIAN + (i & ~1)
5911                         + ((i & 1) ? GET_MODE_NUNITS (mode) : 0));
5912     }
5913   else
5914     {
5915       /* The encoding has a single interleaved stepped pattern.  */
5916       sel.new_vector (GET_MODE_NUNITS (mode), 1, 3);
5917       for (i = 0; i < 3; ++i)
5918         sel.quick_push (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
5919     }
5920
5921   return expand_vec_perm_const (mode, m1, m2, sel, BLKmode, target);
5922 }
5923 \f
5924 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5925    pattern.  */
5926
5927 static void
5928 find_cc_set (rtx x, const_rtx pat, void *data)
5929 {
5930   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5931       && GET_CODE (pat) == SET)
5932     {
5933       rtx *p_cc_reg = (rtx *) data;
5934       gcc_assert (!*p_cc_reg);
5935       *p_cc_reg = x;
5936     }
5937 }
5938
5939 /* This is a helper function for the other atomic operations.  This function
5940    emits a loop that contains SEQ that iterates until a compare-and-swap
5941    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
5942    a set of instructions that takes a value from OLD_REG as an input and
5943    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
5944    set to the current contents of MEM.  After SEQ, a compare-and-swap will
5945    attempt to update MEM with NEW_REG.  The function returns true when the
5946    loop was generated successfully.  */
5947
5948 static bool
5949 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5950 {
5951   machine_mode mode = GET_MODE (mem);
5952   rtx_code_label *label;
5953   rtx cmp_reg, success, oldval;
5954
5955   /* The loop we want to generate looks like
5956
5957         cmp_reg = mem;
5958       label:
5959         old_reg = cmp_reg;
5960         seq;
5961         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5962         if (success)
5963           goto label;
5964
5965      Note that we only do the plain load from memory once.  Subsequent
5966      iterations use the value loaded by the compare-and-swap pattern.  */
5967
5968   label = gen_label_rtx ();
5969   cmp_reg = gen_reg_rtx (mode);
5970
5971   emit_move_insn (cmp_reg, mem);
5972   emit_label (label);
5973   emit_move_insn (old_reg, cmp_reg);
5974   if (seq)
5975     emit_insn (seq);
5976
5977   success = NULL_RTX;
5978   oldval = cmp_reg;
5979   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
5980                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
5981                                        MEMMODEL_RELAXED))
5982     return false;
5983
5984   if (oldval != cmp_reg)
5985     emit_move_insn (cmp_reg, oldval);
5986
5987   /* Mark this jump predicted not taken.  */
5988   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
5989                            GET_MODE (success), 1, label,
5990                            profile_probability::guessed_never ());
5991   return true;
5992 }
5993
5994
5995 /* This function tries to emit an atomic_exchange intruction.  VAL is written
5996    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
5997    using TARGET if possible.  */
5998
5999 static rtx
6000 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6001 {
6002   machine_mode mode = GET_MODE (mem);
6003   enum insn_code icode;
6004
6005   /* If the target supports the exchange directly, great.  */
6006   icode = direct_optab_handler (atomic_exchange_optab, mode);
6007   if (icode != CODE_FOR_nothing)
6008     {
6009       struct expand_operand ops[4];
6010
6011       create_output_operand (&ops[0], target, mode);
6012       create_fixed_operand (&ops[1], mem);
6013       create_input_operand (&ops[2], val, mode);
6014       create_integer_operand (&ops[3], model);
6015       if (maybe_expand_insn (icode, 4, ops))
6016         return ops[0].value;
6017     }
6018
6019   return NULL_RTX;
6020 }
6021
6022 /* This function tries to implement an atomic exchange operation using
6023    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
6024    The previous contents of *MEM are returned, using TARGET if possible.
6025    Since this instructionn is an acquire barrier only, stronger memory
6026    models may require additional barriers to be emitted.  */
6027
6028 static rtx
6029 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
6030                                    enum memmodel model)
6031 {
6032   machine_mode mode = GET_MODE (mem);
6033   enum insn_code icode;
6034   rtx_insn *last_insn = get_last_insn ();
6035
6036   icode = optab_handler (sync_lock_test_and_set_optab, mode);
6037
6038   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
6039      exists, and the memory model is stronger than acquire, add a release
6040      barrier before the instruction.  */
6041
6042   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
6043     expand_mem_thread_fence (model);
6044
6045   if (icode != CODE_FOR_nothing)
6046     {
6047       struct expand_operand ops[3];
6048       create_output_operand (&ops[0], target, mode);
6049       create_fixed_operand (&ops[1], mem);
6050       create_input_operand (&ops[2], val, mode);
6051       if (maybe_expand_insn (icode, 3, ops))
6052         return ops[0].value;
6053     }
6054
6055   /* If an external test-and-set libcall is provided, use that instead of
6056      any external compare-and-swap that we might get from the compare-and-
6057      swap-loop expansion later.  */
6058   if (!can_compare_and_swap_p (mode, false))
6059     {
6060       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
6061       if (libfunc != NULL)
6062         {
6063           rtx addr;
6064
6065           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6066           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6067                                           mode, addr, ptr_mode,
6068                                           val, mode);
6069         }
6070     }
6071
6072   /* If the test_and_set can't be emitted, eliminate any barrier that might
6073      have been emitted.  */
6074   delete_insns_since (last_insn);
6075   return NULL_RTX;
6076 }
6077
6078 /* This function tries to implement an atomic exchange operation using a
6079    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
6080    *MEM are returned, using TARGET if possible.  No memory model is required
6081    since a compare_and_swap loop is seq-cst.  */
6082
6083 static rtx
6084 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6085 {
6086   machine_mode mode = GET_MODE (mem);
6087
6088   if (can_compare_and_swap_p (mode, true))
6089     {
6090       if (!target || !register_operand (target, mode))
6091         target = gen_reg_rtx (mode);
6092       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6093         return target;
6094     }
6095
6096   return NULL_RTX;
6097 }
6098
6099 /* This function tries to implement an atomic test-and-set operation
6100    using the atomic_test_and_set instruction pattern.  A boolean value
6101    is returned from the operation, using TARGET if possible.  */
6102
6103 static rtx
6104 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6105 {
6106   machine_mode pat_bool_mode;
6107   struct expand_operand ops[3];
6108
6109   if (!targetm.have_atomic_test_and_set ())
6110     return NULL_RTX;
6111
6112   /* While we always get QImode from __atomic_test_and_set, we get
6113      other memory modes from __sync_lock_test_and_set.  Note that we
6114      use no endian adjustment here.  This matches the 4.6 behavior
6115      in the Sparc backend.  */
6116   enum insn_code icode = targetm.code_for_atomic_test_and_set;
6117   gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6118   if (GET_MODE (mem) != QImode)
6119     mem = adjust_address_nv (mem, QImode, 0);
6120
6121   pat_bool_mode = insn_data[icode].operand[0].mode;
6122   create_output_operand (&ops[0], target, pat_bool_mode);
6123   create_fixed_operand (&ops[1], mem);
6124   create_integer_operand (&ops[2], model);
6125
6126   if (maybe_expand_insn (icode, 3, ops))
6127     return ops[0].value;
6128   return NULL_RTX;
6129 }
6130
6131 /* This function expands the legacy _sync_lock test_and_set operation which is
6132    generally an atomic exchange.  Some limited targets only allow the
6133    constant 1 to be stored.  This is an ACQUIRE operation.
6134
6135    TARGET is an optional place to stick the return value.
6136    MEM is where VAL is stored.  */
6137
6138 rtx
6139 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6140 {
6141   rtx ret;
6142
6143   /* Try an atomic_exchange first.  */
6144   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6145   if (ret)
6146     return ret;
6147
6148   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6149                                            MEMMODEL_SYNC_ACQUIRE);
6150   if (ret)
6151     return ret;
6152
6153   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6154   if (ret)
6155     return ret;
6156
6157   /* If there are no other options, try atomic_test_and_set if the value
6158      being stored is 1.  */
6159   if (val == const1_rtx)
6160     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6161
6162   return ret;
6163 }
6164
6165 /* This function expands the atomic test_and_set operation:
6166    atomically store a boolean TRUE into MEM and return the previous value.
6167
6168    MEMMODEL is the memory model variant to use.
6169    TARGET is an optional place to stick the return value.  */
6170
6171 rtx
6172 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6173 {
6174   machine_mode mode = GET_MODE (mem);
6175   rtx ret, trueval, subtarget;
6176
6177   ret = maybe_emit_atomic_test_and_set (target, mem, model);
6178   if (ret)
6179     return ret;
6180
6181   /* Be binary compatible with non-default settings of trueval, and different
6182      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
6183      another only has atomic-exchange.  */
6184   if (targetm.atomic_test_and_set_trueval == 1)
6185     {
6186       trueval = const1_rtx;
6187       subtarget = target ? target : gen_reg_rtx (mode);
6188     }
6189   else
6190     {
6191       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6192       subtarget = gen_reg_rtx (mode);
6193     }
6194
6195   /* Try the atomic-exchange optab...  */
6196   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6197
6198   /* ... then an atomic-compare-and-swap loop ... */
6199   if (!ret)
6200     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6201
6202   /* ... before trying the vaguely defined legacy lock_test_and_set. */
6203   if (!ret)
6204     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6205
6206   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6207      things with the value 1.  Thus we try again without trueval.  */
6208   if (!ret && targetm.atomic_test_and_set_trueval != 1)
6209     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6210
6211   /* Failing all else, assume a single threaded environment and simply
6212      perform the operation.  */
6213   if (!ret)
6214     {
6215       /* If the result is ignored skip the move to target.  */
6216       if (subtarget != const0_rtx)
6217         emit_move_insn (subtarget, mem);
6218
6219       emit_move_insn (mem, trueval);
6220       ret = subtarget;
6221     }
6222
6223   /* Recall that have to return a boolean value; rectify if trueval
6224      is not exactly one.  */
6225   if (targetm.atomic_test_and_set_trueval != 1)
6226     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6227
6228   return ret;
6229 }
6230
6231 /* This function expands the atomic exchange operation:
6232    atomically store VAL in MEM and return the previous value in MEM.
6233
6234    MEMMODEL is the memory model variant to use.
6235    TARGET is an optional place to stick the return value.  */
6236
6237 rtx
6238 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6239 {
6240   machine_mode mode = GET_MODE (mem);
6241   rtx ret;
6242
6243   /* If loads are not atomic for the required size and we are not called to
6244      provide a __sync builtin, do not do anything so that we stay consistent
6245      with atomic loads of the same size.  */
6246   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6247     return NULL_RTX;
6248
6249   ret = maybe_emit_atomic_exchange (target, mem, val, model);
6250
6251   /* Next try a compare-and-swap loop for the exchange.  */
6252   if (!ret)
6253     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6254
6255   return ret;
6256 }
6257
6258 /* This function expands the atomic compare exchange operation:
6259
6260    *PTARGET_BOOL is an optional place to store the boolean success/failure.
6261    *PTARGET_OVAL is an optional place to store the old value from memory.
6262    Both target parameters may be NULL or const0_rtx to indicate that we do
6263    not care about that return value.  Both target parameters are updated on
6264    success to the actual location of the corresponding result.
6265
6266    MEMMODEL is the memory model variant to use.
6267
6268    The return value of the function is true for success.  */
6269
6270 bool
6271 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6272                                 rtx mem, rtx expected, rtx desired,
6273                                 bool is_weak, enum memmodel succ_model,
6274                                 enum memmodel fail_model)
6275 {
6276   machine_mode mode = GET_MODE (mem);
6277   struct expand_operand ops[8];
6278   enum insn_code icode;
6279   rtx target_oval, target_bool = NULL_RTX;
6280   rtx libfunc;
6281
6282   /* If loads are not atomic for the required size and we are not called to
6283      provide a __sync builtin, do not do anything so that we stay consistent
6284      with atomic loads of the same size.  */
6285   if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6286     return false;
6287
6288   /* Load expected into a register for the compare and swap.  */
6289   if (MEM_P (expected))
6290     expected = copy_to_reg (expected);
6291
6292   /* Make sure we always have some place to put the return oldval.
6293      Further, make sure that place is distinct from the input expected,
6294      just in case we need that path down below.  */
6295   if (ptarget_oval && *ptarget_oval == const0_rtx)
6296     ptarget_oval = NULL;
6297
6298   if (ptarget_oval == NULL
6299       || (target_oval = *ptarget_oval) == NULL
6300       || reg_overlap_mentioned_p (expected, target_oval))
6301     target_oval = gen_reg_rtx (mode);
6302
6303   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6304   if (icode != CODE_FOR_nothing)
6305     {
6306       machine_mode bool_mode = insn_data[icode].operand[0].mode;
6307
6308       if (ptarget_bool && *ptarget_bool == const0_rtx)
6309         ptarget_bool = NULL;
6310
6311       /* Make sure we always have a place for the bool operand.  */
6312       if (ptarget_bool == NULL
6313           || (target_bool = *ptarget_bool) == NULL
6314           || GET_MODE (target_bool) != bool_mode)
6315         target_bool = gen_reg_rtx (bool_mode);
6316
6317       /* Emit the compare_and_swap.  */
6318       create_output_operand (&ops[0], target_bool, bool_mode);
6319       create_output_operand (&ops[1], target_oval, mode);
6320       create_fixed_operand (&ops[2], mem);
6321       create_input_operand (&ops[3], expected, mode);
6322       create_input_operand (&ops[4], desired, mode);
6323       create_integer_operand (&ops[5], is_weak);
6324       create_integer_operand (&ops[6], succ_model);
6325       create_integer_operand (&ops[7], fail_model);
6326       if (maybe_expand_insn (icode, 8, ops))
6327         {
6328           /* Return success/failure.  */
6329           target_bool = ops[0].value;
6330           target_oval = ops[1].value;
6331           goto success;
6332         }
6333     }
6334
6335   /* Otherwise fall back to the original __sync_val_compare_and_swap
6336      which is always seq-cst.  */
6337   icode = optab_handler (sync_compare_and_swap_optab, mode);
6338   if (icode != CODE_FOR_nothing)
6339     {
6340       rtx cc_reg;
6341
6342       create_output_operand (&ops[0], target_oval, mode);
6343       create_fixed_operand (&ops[1], mem);
6344       create_input_operand (&ops[2], expected, mode);
6345       create_input_operand (&ops[3], desired, mode);
6346       if (!maybe_expand_insn (icode, 4, ops))
6347         return false;
6348
6349       target_oval = ops[0].value;
6350
6351       /* If the caller isn't interested in the boolean return value,
6352          skip the computation of it.  */
6353       if (ptarget_bool == NULL)
6354         goto success;
6355
6356       /* Otherwise, work out if the compare-and-swap succeeded.  */
6357       cc_reg = NULL_RTX;
6358       if (have_insn_for (COMPARE, CCmode))
6359         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6360       if (cc_reg)
6361         {
6362           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6363                                                const0_rtx, VOIDmode, 0, 1);
6364           goto success;
6365         }
6366       goto success_bool_from_val;
6367     }
6368
6369   /* Also check for library support for __sync_val_compare_and_swap.  */
6370   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6371   if (libfunc != NULL)
6372     {
6373       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6374       rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6375                                             mode, addr, ptr_mode,
6376                                             expected, mode, desired, mode);
6377       emit_move_insn (target_oval, target);
6378
6379       /* Compute the boolean return value only if requested.  */
6380       if (ptarget_bool)
6381         goto success_bool_from_val;
6382       else
6383         goto success;
6384     }
6385
6386   /* Failure.  */
6387   return false;
6388
6389  success_bool_from_val:
6390    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6391                                         expected, VOIDmode, 1, 1);
6392  success:
6393   /* Make sure that the oval output winds up where the caller asked.  */
6394   if (ptarget_oval)
6395     *ptarget_oval = target_oval;
6396   if (ptarget_bool)
6397     *ptarget_bool = target_bool;
6398   return true;
6399 }
6400
6401 /* Generate asm volatile("" : : : "memory") as the memory blockage.  */
6402
6403 static void
6404 expand_asm_memory_blockage (void)
6405 {
6406   rtx asm_op, clob;
6407
6408   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6409                                  rtvec_alloc (0), rtvec_alloc (0),
6410                                  rtvec_alloc (0), UNKNOWN_LOCATION);
6411   MEM_VOLATILE_P (asm_op) = 1;
6412
6413   clob = gen_rtx_SCRATCH (VOIDmode);
6414   clob = gen_rtx_MEM (BLKmode, clob);
6415   clob = gen_rtx_CLOBBER (VOIDmode, clob);
6416
6417   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6418 }
6419
6420 /* Do not propagate memory accesses across this point.  */
6421
6422 static void
6423 expand_memory_blockage (void)
6424 {
6425   if (targetm.have_memory_blockage ())
6426     emit_insn (targetm.gen_memory_blockage ());
6427   else
6428     expand_asm_memory_blockage ();
6429 }
6430
6431 /* This routine will either emit the mem_thread_fence pattern or issue a
6432    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6433
6434 void
6435 expand_mem_thread_fence (enum memmodel model)
6436 {
6437   if (is_mm_relaxed (model))
6438     return;
6439   if (targetm.have_mem_thread_fence ())
6440     {
6441       emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6442       expand_memory_blockage ();
6443     }
6444   else if (targetm.have_memory_barrier ())
6445     emit_insn (targetm.gen_memory_barrier ());
6446   else if (synchronize_libfunc != NULL_RTX)
6447     emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
6448   else
6449     expand_memory_blockage ();
6450 }
6451
6452 /* Emit a signal fence with given memory model.  */
6453
6454 void
6455 expand_mem_signal_fence (enum memmodel model)
6456 {
6457   /* No machine barrier is required to implement a signal fence, but
6458      a compiler memory barrier must be issued, except for relaxed MM.  */
6459   if (!is_mm_relaxed (model))
6460     expand_memory_blockage ();
6461 }
6462
6463 /* This function expands the atomic load operation:
6464    return the atomically loaded value in MEM.
6465
6466    MEMMODEL is the memory model variant to use.
6467    TARGET is an option place to stick the return value.  */
6468
6469 rtx
6470 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6471 {
6472   machine_mode mode = GET_MODE (mem);
6473   enum insn_code icode;
6474
6475   /* If the target supports the load directly, great.  */
6476   icode = direct_optab_handler (atomic_load_optab, mode);
6477   if (icode != CODE_FOR_nothing)
6478     {
6479       struct expand_operand ops[3];
6480       rtx_insn *last = get_last_insn ();
6481       if (is_mm_seq_cst (model))
6482         expand_memory_blockage ();
6483
6484       create_output_operand (&ops[0], target, mode);
6485       create_fixed_operand (&ops[1], mem);
6486       create_integer_operand (&ops[2], model);
6487       if (maybe_expand_insn (icode, 3, ops))
6488         {
6489           if (!is_mm_relaxed (model))
6490             expand_memory_blockage ();
6491           return ops[0].value;
6492         }
6493       delete_insns_since (last);
6494     }
6495
6496   /* If the size of the object is greater than word size on this target,
6497      then we assume that a load will not be atomic.  We could try to
6498      emulate a load with a compare-and-swap operation, but the store that
6499      doing this could result in would be incorrect if this is a volatile
6500      atomic load or targetting read-only-mapped memory.  */
6501   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6502     /* If there is no atomic load, leave the library call.  */
6503     return NULL_RTX;
6504
6505   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
6506   if (!target || target == const0_rtx)
6507     target = gen_reg_rtx (mode);
6508
6509   /* For SEQ_CST, emit a barrier before the load.  */
6510   if (is_mm_seq_cst (model))
6511     expand_mem_thread_fence (model);
6512
6513   emit_move_insn (target, mem);
6514
6515   /* Emit the appropriate barrier after the load.  */
6516   expand_mem_thread_fence (model);
6517
6518   return target;
6519 }
6520
6521 /* This function expands the atomic store operation:
6522    Atomically store VAL in MEM.
6523    MEMMODEL is the memory model variant to use.
6524    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
6525    function returns const0_rtx if a pattern was emitted.  */
6526
6527 rtx
6528 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6529 {
6530   machine_mode mode = GET_MODE (mem);
6531   enum insn_code icode;
6532   struct expand_operand ops[3];
6533
6534   /* If the target supports the store directly, great.  */
6535   icode = direct_optab_handler (atomic_store_optab, mode);
6536   if (icode != CODE_FOR_nothing)
6537     {
6538       rtx_insn *last = get_last_insn ();
6539       if (!is_mm_relaxed (model))
6540         expand_memory_blockage ();
6541       create_fixed_operand (&ops[0], mem);
6542       create_input_operand (&ops[1], val, mode);
6543       create_integer_operand (&ops[2], model);
6544       if (maybe_expand_insn (icode, 3, ops))
6545         {
6546           if (is_mm_seq_cst (model))
6547             expand_memory_blockage ();
6548           return const0_rtx;
6549         }
6550       delete_insns_since (last);
6551     }
6552
6553   /* If using __sync_lock_release is a viable alternative, try it.
6554      Note that this will not be set to true if we are expanding a generic
6555      __atomic_store_n.  */
6556   if (use_release)
6557     {
6558       icode = direct_optab_handler (sync_lock_release_optab, mode);
6559       if (icode != CODE_FOR_nothing)
6560         {
6561           create_fixed_operand (&ops[0], mem);
6562           create_input_operand (&ops[1], const0_rtx, mode);
6563           if (maybe_expand_insn (icode, 2, ops))
6564             {
6565               /* lock_release is only a release barrier.  */
6566               if (is_mm_seq_cst (model))
6567                 expand_mem_thread_fence (model);
6568               return const0_rtx;
6569             }
6570         }
6571     }
6572
6573   /* If the size of the object is greater than word size on this target,
6574      a default store will not be atomic.  */
6575   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6576     {
6577       /* If loads are atomic or we are called to provide a __sync builtin,
6578          we can try a atomic_exchange and throw away the result.  Otherwise,
6579          don't do anything so that we do not create an inconsistency between
6580          loads and stores.  */
6581       if (can_atomic_load_p (mode) || is_mm_sync (model))
6582         {
6583           rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6584           if (!target)
6585             target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6586                                                                 val);
6587           if (target)
6588             return const0_rtx;
6589         }
6590         return NULL_RTX;
6591     }
6592
6593   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
6594   expand_mem_thread_fence (model);
6595
6596   emit_move_insn (mem, val);
6597
6598   /* For SEQ_CST, also emit a barrier after the store.  */
6599   if (is_mm_seq_cst (model))
6600     expand_mem_thread_fence (model);
6601
6602   return const0_rtx;
6603 }
6604
6605
6606 /* Structure containing the pointers and values required to process the
6607    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
6608
6609 struct atomic_op_functions
6610 {
6611   direct_optab mem_fetch_before;
6612   direct_optab mem_fetch_after;
6613   direct_optab mem_no_result;
6614   optab fetch_before;
6615   optab fetch_after;
6616   direct_optab no_result;
6617   enum rtx_code reverse_code;
6618 };
6619
6620
6621 /* Fill in structure pointed to by OP with the various optab entries for an
6622    operation of type CODE.  */
6623
6624 static void
6625 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6626 {
6627   gcc_assert (op!= NULL);
6628
6629   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6630      in the source code during compilation, and the optab entries are not
6631      computable until runtime.  Fill in the values at runtime.  */
6632   switch (code)
6633     {
6634     case PLUS:
6635       op->mem_fetch_before = atomic_fetch_add_optab;
6636       op->mem_fetch_after = atomic_add_fetch_optab;
6637       op->mem_no_result = atomic_add_optab;
6638       op->fetch_before = sync_old_add_optab;
6639       op->fetch_after = sync_new_add_optab;
6640       op->no_result = sync_add_optab;
6641       op->reverse_code = MINUS;
6642       break;
6643     case MINUS:
6644       op->mem_fetch_before = atomic_fetch_sub_optab;
6645       op->mem_fetch_after = atomic_sub_fetch_optab;
6646       op->mem_no_result = atomic_sub_optab;
6647       op->fetch_before = sync_old_sub_optab;
6648       op->fetch_after = sync_new_sub_optab;
6649       op->no_result = sync_sub_optab;
6650       op->reverse_code = PLUS;
6651       break;
6652     case XOR:
6653       op->mem_fetch_before = atomic_fetch_xor_optab;
6654       op->mem_fetch_after = atomic_xor_fetch_optab;
6655       op->mem_no_result = atomic_xor_optab;
6656       op->fetch_before = sync_old_xor_optab;
6657       op->fetch_after = sync_new_xor_optab;
6658       op->no_result = sync_xor_optab;
6659       op->reverse_code = XOR;
6660       break;
6661     case AND:
6662       op->mem_fetch_before = atomic_fetch_and_optab;
6663       op->mem_fetch_after = atomic_and_fetch_optab;
6664       op->mem_no_result = atomic_and_optab;
6665       op->fetch_before = sync_old_and_optab;
6666       op->fetch_after = sync_new_and_optab;
6667       op->no_result = sync_and_optab;
6668       op->reverse_code = UNKNOWN;
6669       break;
6670     case IOR:
6671       op->mem_fetch_before = atomic_fetch_or_optab;
6672       op->mem_fetch_after = atomic_or_fetch_optab;
6673       op->mem_no_result = atomic_or_optab;
6674       op->fetch_before = sync_old_ior_optab;
6675       op->fetch_after = sync_new_ior_optab;
6676       op->no_result = sync_ior_optab;
6677       op->reverse_code = UNKNOWN;
6678       break;
6679     case NOT:
6680       op->mem_fetch_before = atomic_fetch_nand_optab;
6681       op->mem_fetch_after = atomic_nand_fetch_optab;
6682       op->mem_no_result = atomic_nand_optab;
6683       op->fetch_before = sync_old_nand_optab;
6684       op->fetch_after = sync_new_nand_optab;
6685       op->no_result = sync_nand_optab;
6686       op->reverse_code = UNKNOWN;
6687       break;
6688     default:
6689       gcc_unreachable ();
6690     }
6691 }
6692
6693 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
6694    using memory order MODEL.  If AFTER is true the operation needs to return
6695    the value of *MEM after the operation, otherwise the previous value.
6696    TARGET is an optional place to place the result.  The result is unused if
6697    it is const0_rtx.
6698    Return the result if there is a better sequence, otherwise NULL_RTX.  */
6699
6700 static rtx
6701 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6702                          enum memmodel model, bool after)
6703 {
6704   /* If the value is prefetched, or not used, it may be possible to replace
6705      the sequence with a native exchange operation.  */
6706   if (!after || target == const0_rtx)
6707     {
6708       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
6709       if (code == AND && val == const0_rtx)
6710         {
6711           if (target == const0_rtx)
6712             target = gen_reg_rtx (GET_MODE (mem));
6713           return maybe_emit_atomic_exchange (target, mem, val, model);
6714         }
6715
6716       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
6717       if (code == IOR && val == constm1_rtx)
6718         {
6719           if (target == const0_rtx)
6720             target = gen_reg_rtx (GET_MODE (mem));
6721           return maybe_emit_atomic_exchange (target, mem, val, model);
6722         }
6723     }
6724
6725   return NULL_RTX;
6726 }
6727
6728 /* Try to emit an instruction for a specific operation varaition.
6729    OPTAB contains the OP functions.
6730    TARGET is an optional place to return the result. const0_rtx means unused.
6731    MEM is the memory location to operate on.
6732    VAL is the value to use in the operation.
6733    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6734    MODEL is the memory model, if used.
6735    AFTER is true if the returned result is the value after the operation.  */
6736
6737 static rtx
6738 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6739                rtx val, bool use_memmodel, enum memmodel model, bool after)
6740 {
6741   machine_mode mode = GET_MODE (mem);
6742   struct expand_operand ops[4];
6743   enum insn_code icode;
6744   int op_counter = 0;
6745   int num_ops;
6746
6747   /* Check to see if there is a result returned.  */
6748   if (target == const0_rtx)
6749     {
6750       if (use_memmodel)
6751         {
6752           icode = direct_optab_handler (optab->mem_no_result, mode);
6753           create_integer_operand (&ops[2], model);
6754           num_ops = 3;
6755         }
6756       else
6757         {
6758           icode = direct_optab_handler (optab->no_result, mode);
6759           num_ops = 2;
6760         }
6761     }
6762   /* Otherwise, we need to generate a result.  */
6763   else
6764     {
6765       if (use_memmodel)
6766         {
6767           icode = direct_optab_handler (after ? optab->mem_fetch_after
6768                                         : optab->mem_fetch_before, mode);
6769           create_integer_operand (&ops[3], model);
6770           num_ops = 4;
6771         }
6772       else
6773         {
6774           icode = optab_handler (after ? optab->fetch_after
6775                                  : optab->fetch_before, mode);
6776           num_ops = 3;
6777         }
6778       create_output_operand (&ops[op_counter++], target, mode);
6779     }
6780   if (icode == CODE_FOR_nothing)
6781     return NULL_RTX;
6782
6783   create_fixed_operand (&ops[op_counter++], mem);
6784   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
6785   create_convert_operand_to (&ops[op_counter++], val, mode, true);
6786
6787   if (maybe_expand_insn (icode, num_ops, ops))
6788     return (target == const0_rtx ? const0_rtx : ops[0].value);
6789
6790   return NULL_RTX;
6791 }
6792
6793
6794 /* This function expands an atomic fetch_OP or OP_fetch operation:
6795    TARGET is an option place to stick the return value.  const0_rtx indicates
6796    the result is unused.
6797    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6798    CODE is the operation being performed (OP)
6799    MEMMODEL is the memory model variant to use.
6800    AFTER is true to return the result of the operation (OP_fetch).
6801    AFTER is false to return the value before the operation (fetch_OP).
6802
6803    This function will *only* generate instructions if there is a direct
6804    optab. No compare and swap loops or libcalls will be generated. */
6805
6806 static rtx
6807 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6808                                     enum rtx_code code, enum memmodel model,
6809                                     bool after)
6810 {
6811   machine_mode mode = GET_MODE (mem);
6812   struct atomic_op_functions optab;
6813   rtx result;
6814   bool unused_result = (target == const0_rtx);
6815
6816   get_atomic_op_for_code (&optab, code);
6817
6818   /* Check to see if there are any better instructions.  */
6819   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6820   if (result)
6821     return result;
6822
6823   /* Check for the case where the result isn't used and try those patterns.  */
6824   if (unused_result)
6825     {
6826       /* Try the memory model variant first.  */
6827       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6828       if (result)
6829         return result;
6830
6831       /* Next try the old style withuot a memory model.  */
6832       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6833       if (result)
6834         return result;
6835
6836       /* There is no no-result pattern, so try patterns with a result.  */
6837       target = NULL_RTX;
6838     }
6839
6840   /* Try the __atomic version.  */
6841   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6842   if (result)
6843     return result;
6844
6845   /* Try the older __sync version.  */
6846   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6847   if (result)
6848     return result;
6849
6850   /* If the fetch value can be calculated from the other variation of fetch,
6851      try that operation.  */
6852   if (after || unused_result || optab.reverse_code != UNKNOWN)
6853     {
6854       /* Try the __atomic version, then the older __sync version.  */
6855       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6856       if (!result)
6857         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6858
6859       if (result)
6860         {
6861           /* If the result isn't used, no need to do compensation code.  */
6862           if (unused_result)
6863             return result;
6864
6865           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
6866              Fetch_before == after REVERSE_OP val.  */
6867           if (!after)
6868             code = optab.reverse_code;
6869           if (code == NOT)
6870             {
6871               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6872                                             true, OPTAB_LIB_WIDEN);
6873               result = expand_simple_unop (mode, NOT, result, target, true);
6874             }
6875           else
6876             result = expand_simple_binop (mode, code, result, val, target,
6877                                           true, OPTAB_LIB_WIDEN);
6878           return result;
6879         }
6880     }
6881
6882   /* No direct opcode can be generated.  */
6883   return NULL_RTX;
6884 }
6885
6886
6887
6888 /* This function expands an atomic fetch_OP or OP_fetch operation:
6889    TARGET is an option place to stick the return value.  const0_rtx indicates
6890    the result is unused.
6891    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6892    CODE is the operation being performed (OP)
6893    MEMMODEL is the memory model variant to use.
6894    AFTER is true to return the result of the operation (OP_fetch).
6895    AFTER is false to return the value before the operation (fetch_OP).  */
6896 rtx
6897 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6898                         enum memmodel model, bool after)
6899 {
6900   machine_mode mode = GET_MODE (mem);
6901   rtx result;
6902   bool unused_result = (target == const0_rtx);
6903
6904   /* If loads are not atomic for the required size and we are not called to
6905      provide a __sync builtin, do not do anything so that we stay consistent
6906      with atomic loads of the same size.  */
6907   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6908     return NULL_RTX;
6909
6910   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6911                                                after);
6912
6913   if (result)
6914     return result;
6915
6916   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
6917   if (code == PLUS || code == MINUS)
6918     {
6919       rtx tmp;
6920       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6921
6922       start_sequence ();
6923       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6924       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6925                                                    model, after);
6926       if (result)
6927         {
6928           /* PLUS worked so emit the insns and return.  */
6929           tmp = get_insns ();
6930           end_sequence ();
6931           emit_insn (tmp);
6932           return result;
6933         }
6934
6935       /* PLUS did not work, so throw away the negation code and continue.  */
6936       end_sequence ();
6937     }
6938
6939   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
6940   if (!can_compare_and_swap_p (mode, false))
6941     {
6942       rtx libfunc;
6943       bool fixup = false;
6944       enum rtx_code orig_code = code;
6945       struct atomic_op_functions optab;
6946
6947       get_atomic_op_for_code (&optab, code);
6948       libfunc = optab_libfunc (after ? optab.fetch_after
6949                                : optab.fetch_before, mode);
6950       if (libfunc == NULL
6951           && (after || unused_result || optab.reverse_code != UNKNOWN))
6952         {
6953           fixup = true;
6954           if (!after)
6955             code = optab.reverse_code;
6956           libfunc = optab_libfunc (after ? optab.fetch_before
6957                                    : optab.fetch_after, mode);
6958         }
6959       if (libfunc != NULL)
6960         {
6961           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6962           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6963                                             addr, ptr_mode, val, mode);
6964
6965           if (!unused_result && fixup)
6966             result = expand_simple_binop (mode, code, result, val, target,
6967                                           true, OPTAB_LIB_WIDEN);
6968           return result;
6969         }
6970
6971       /* We need the original code for any further attempts.  */
6972       code = orig_code;
6973     }
6974
6975   /* If nothing else has succeeded, default to a compare and swap loop.  */
6976   if (can_compare_and_swap_p (mode, true))
6977     {
6978       rtx_insn *insn;
6979       rtx t0 = gen_reg_rtx (mode), t1;
6980
6981       start_sequence ();
6982
6983       /* If the result is used, get a register for it.  */
6984       if (!unused_result)
6985         {
6986           if (!target || !register_operand (target, mode))
6987             target = gen_reg_rtx (mode);
6988           /* If fetch_before, copy the value now.  */
6989           if (!after)
6990             emit_move_insn (target, t0);
6991         }
6992       else
6993         target = const0_rtx;
6994
6995       t1 = t0;
6996       if (code == NOT)
6997         {
6998           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
6999                                     true, OPTAB_LIB_WIDEN);
7000           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
7001         }
7002       else
7003         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
7004                                   OPTAB_LIB_WIDEN);
7005
7006       /* For after, copy the value now.  */
7007       if (!unused_result && after)
7008         emit_move_insn (target, t1);
7009       insn = get_insns ();
7010       end_sequence ();
7011
7012       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
7013         return target;
7014     }
7015
7016   return NULL_RTX;
7017 }
7018 \f
7019 /* Return true if OPERAND is suitable for operand number OPNO of
7020    instruction ICODE.  */
7021
7022 bool
7023 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
7024 {
7025   return (!insn_data[(int) icode].operand[opno].predicate
7026           || (insn_data[(int) icode].operand[opno].predicate
7027               (operand, insn_data[(int) icode].operand[opno].mode)));
7028 }
7029 \f
7030 /* TARGET is a target of a multiword operation that we are going to
7031    implement as a series of word-mode operations.  Return true if
7032    TARGET is suitable for this purpose.  */
7033
7034 bool
7035 valid_multiword_target_p (rtx target)
7036 {
7037   machine_mode mode;
7038   int i;
7039
7040   mode = GET_MODE (target);
7041   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
7042     if (!validate_subreg (word_mode, mode, target, i))
7043       return false;
7044   return true;
7045 }
7046
7047 /* Make OP describe an input operand that has value INTVAL and that has
7048    no inherent mode.  This function should only be used for operands that
7049    are always expand-time constants.  The backend may request that INTVAL
7050    be copied into a different kind of rtx, but it must specify the mode
7051    of that rtx if so.  */
7052
7053 void
7054 create_integer_operand (struct expand_operand *op, poly_int64 intval)
7055 {
7056   create_expand_operand (op, EXPAND_INTEGER,
7057                          gen_int_mode (intval, MAX_MODE_INT),
7058                          VOIDmode, false, intval);
7059 }
7060
7061 /* Like maybe_legitimize_operand, but do not change the code of the
7062    current rtx value.  */
7063
7064 static bool
7065 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7066                                     struct expand_operand *op)
7067 {
7068   /* See if the operand matches in its current form.  */
7069   if (insn_operand_matches (icode, opno, op->value))
7070     return true;
7071
7072   /* If the operand is a memory whose address has no side effects,
7073      try forcing the address into a non-virtual pseudo register.
7074      The check for side effects is important because copy_to_mode_reg
7075      cannot handle things like auto-modified addresses.  */
7076   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7077     {
7078       rtx addr, mem;
7079
7080       mem = op->value;
7081       addr = XEXP (mem, 0);
7082       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7083           && !side_effects_p (addr))
7084         {
7085           rtx_insn *last;
7086           machine_mode mode;
7087
7088           last = get_last_insn ();
7089           mode = get_address_mode (mem);
7090           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
7091           if (insn_operand_matches (icode, opno, mem))
7092             {
7093               op->value = mem;
7094               return true;
7095             }
7096           delete_insns_since (last);
7097         }
7098     }
7099
7100   return false;
7101 }
7102
7103 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
7104    on success, storing the new operand value back in OP.  */
7105
7106 static bool
7107 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
7108                           struct expand_operand *op)
7109 {
7110   machine_mode mode, imode;
7111   bool old_volatile_ok, result;
7112
7113   mode = op->mode;
7114   switch (op->type)
7115     {
7116     case EXPAND_FIXED:
7117       old_volatile_ok = volatile_ok;
7118       volatile_ok = true;
7119       result = maybe_legitimize_operand_same_code (icode, opno, op);
7120       volatile_ok = old_volatile_ok;
7121       return result;
7122
7123     case EXPAND_OUTPUT:
7124       gcc_assert (mode != VOIDmode);
7125       if (op->value
7126           && op->value != const0_rtx
7127           && GET_MODE (op->value) == mode
7128           && maybe_legitimize_operand_same_code (icode, opno, op))
7129         return true;
7130
7131       op->value = gen_reg_rtx (mode);
7132       op->target = 0;
7133       break;
7134
7135     case EXPAND_INPUT:
7136     input:
7137       gcc_assert (mode != VOIDmode);
7138       gcc_assert (GET_MODE (op->value) == VOIDmode
7139                   || GET_MODE (op->value) == mode);
7140       if (maybe_legitimize_operand_same_code (icode, opno, op))
7141         return true;
7142
7143       op->value = copy_to_mode_reg (mode, op->value);
7144       break;
7145
7146     case EXPAND_CONVERT_TO:
7147       gcc_assert (mode != VOIDmode);
7148       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
7149       goto input;
7150
7151     case EXPAND_CONVERT_FROM:
7152       if (GET_MODE (op->value) != VOIDmode)
7153         mode = GET_MODE (op->value);
7154       else
7155         /* The caller must tell us what mode this value has.  */
7156         gcc_assert (mode != VOIDmode);
7157
7158       imode = insn_data[(int) icode].operand[opno].mode;
7159       if (imode != VOIDmode && imode != mode)
7160         {
7161           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
7162           mode = imode;
7163         }
7164       goto input;
7165
7166     case EXPAND_ADDRESS:
7167       op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
7168                                           op->value);
7169       goto input;
7170
7171     case EXPAND_INTEGER:
7172       mode = insn_data[(int) icode].operand[opno].mode;
7173       if (mode != VOIDmode
7174           && known_eq (trunc_int_for_mode (op->int_value, mode),
7175                        op->int_value))
7176         {
7177           op->value = gen_int_mode (op->int_value, mode);
7178           goto input;
7179         }
7180       break;
7181     }
7182   return insn_operand_matches (icode, opno, op->value);
7183 }
7184
7185 /* Make OP describe an input operand that should have the same value
7186    as VALUE, after any mode conversion that the target might request.
7187    TYPE is the type of VALUE.  */
7188
7189 void
7190 create_convert_operand_from_type (struct expand_operand *op,
7191                                   rtx value, tree type)
7192 {
7193   create_convert_operand_from (op, value, TYPE_MODE (type),
7194                                TYPE_UNSIGNED (type));
7195 }
7196
7197 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
7198    of instruction ICODE.  Return true on success, leaving the new operand
7199    values in the OPS themselves.  Emit no code on failure.  */
7200
7201 bool
7202 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7203                            unsigned int nops, struct expand_operand *ops)
7204 {
7205   rtx_insn *last;
7206   unsigned int i;
7207
7208   last = get_last_insn ();
7209   for (i = 0; i < nops; i++)
7210     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
7211       {
7212         delete_insns_since (last);
7213         return false;
7214       }
7215   return true;
7216 }
7217
7218 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7219    as its operands.  Return the instruction pattern on success,
7220    and emit any necessary set-up code.  Return null and emit no
7221    code on failure.  */
7222
7223 rtx_insn *
7224 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7225                 struct expand_operand *ops)
7226 {
7227   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7228   if (!maybe_legitimize_operands (icode, 0, nops, ops))
7229     return NULL;
7230
7231   switch (nops)
7232     {
7233     case 1:
7234       return GEN_FCN (icode) (ops[0].value);
7235     case 2:
7236       return GEN_FCN (icode) (ops[0].value, ops[1].value);
7237     case 3:
7238       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7239     case 4:
7240       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7241                               ops[3].value);
7242     case 5:
7243       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7244                               ops[3].value, ops[4].value);
7245     case 6:
7246       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7247                               ops[3].value, ops[4].value, ops[5].value);
7248     case 7:
7249       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7250                               ops[3].value, ops[4].value, ops[5].value,
7251                               ops[6].value);
7252     case 8:
7253       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7254                               ops[3].value, ops[4].value, ops[5].value,
7255                               ops[6].value, ops[7].value);
7256     case 9:
7257       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7258                               ops[3].value, ops[4].value, ops[5].value,
7259                               ops[6].value, ops[7].value, ops[8].value);
7260     }
7261   gcc_unreachable ();
7262 }
7263
7264 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7265    as its operands.  Return true on success and emit no code on failure.  */
7266
7267 bool
7268 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7269                    struct expand_operand *ops)
7270 {
7271   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7272   if (pat)
7273     {
7274       emit_insn (pat);
7275       return true;
7276     }
7277   return false;
7278 }
7279
7280 /* Like maybe_expand_insn, but for jumps.  */
7281
7282 bool
7283 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7284                         struct expand_operand *ops)
7285 {
7286   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7287   if (pat)
7288     {
7289       emit_jump_insn (pat);
7290       return true;
7291     }
7292   return false;
7293 }
7294
7295 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7296    as its operands.  */
7297
7298 void
7299 expand_insn (enum insn_code icode, unsigned int nops,
7300              struct expand_operand *ops)
7301 {
7302   if (!maybe_expand_insn (icode, nops, ops))
7303     gcc_unreachable ();
7304 }
7305
7306 /* Like expand_insn, but for jumps.  */
7307
7308 void
7309 expand_jump_insn (enum insn_code icode, unsigned int nops,
7310                   struct expand_operand *ops)
7311 {
7312   if (!maybe_expand_jump_insn (icode, nops, ops))
7313     gcc_unreachable ();
7314 }