/* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   Copyright (C) 1987-2017 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "target.h"
#include "rtl.h"
#include "tree.h"
#include "memmodel.h"
#include "predict.h"
#include "tm_p.h"
#include "expmed.h"
#include "optabs.h"
#include "emit-rtl.h"
#include "recog.h"
#include "diagnostic-core.h"

/* Include insn-config.h before expr.h so that HAVE_conditional_move
   is properly defined.  */
#include "stor-layout.h"
#include "except.h"
#include "dojump.h"
#include "explow.h"
#include "expr.h"
#include "optabs-tree.h"
#include "libfuncs.h"
static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
                                   machine_mode *);
static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);

/* Debug facility for use in GDB.  */
void debug_optab_libfuncs (void);
/* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
   the result of operation CODE applied to OP0 (and OP1 if it is a binary
   operation).

   If the last insn does not set TARGET, don't do anything, but return 1.

   If the last insn or a previous insn sets TARGET and TARGET is one of OP0
   or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
   try again, ensuring that TARGET is not one of the operands.  */

static int
add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0,
                rtx op1)
{
  rtx_insn *last_insn;
  rtx set;
  rtx note;

  gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));

  if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
      && GET_RTX_CLASS (code) != RTX_BIN_ARITH
      && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
      && GET_RTX_CLASS (code) != RTX_COMPARE
      && GET_RTX_CLASS (code) != RTX_UNARY)
    return 1;

  if (GET_CODE (target) == ZERO_EXTRACT)
    return 1;

  for (last_insn = insns;
       NEXT_INSN (last_insn) != NULL_RTX;
       last_insn = NEXT_INSN (last_insn))
    ;

  /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
     a value changing in the insn, so the note would be invalid for CSE.  */
  if (reg_overlap_mentioned_p (target, op0)
      || (op1 && reg_overlap_mentioned_p (target, op1)))
    {
      if (MEM_P (target)
          && (rtx_equal_p (target, op0)
              || (op1 && rtx_equal_p (target, op1))))
        {
          /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
             over expanding it as temp = MEM op X, MEM = temp.  If the target
             supports MEM = MEM op X instructions, it is sometimes too hard
             to reconstruct that form later, especially if X is also a memory,
             and due to multiple occurrences of addresses the address might
             be forced into register unnecessarily.
             Note that not emitting the REG_EQUAL note might inhibit
             CSE in some cases.  */
          set = single_set (last_insn);
          if (set
              && GET_CODE (SET_SRC (set)) == code
              && MEM_P (SET_DEST (set))
              && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
                  || (op1 && rtx_equal_p (SET_DEST (set),
                                          XEXP (SET_SRC (set), 1)))))
            return 1;
        }
      return 0;
    }

  set = set_for_reg_notes (last_insn);
  if (set == NULL_RTX)
    return 1;

  if (! rtx_equal_p (SET_DEST (set), target)
      /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
      && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
          || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
    return 1;

  if (GET_RTX_CLASS (code) == RTX_UNARY)
    switch (code)
      {
      case FFS:
      case CLZ:
      case CTZ:
      case CLRSB:
      case POPCOUNT:
      case PARITY:
      case BSWAP:
        if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
          {
            note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
            if (GET_MODE_UNIT_SIZE (GET_MODE (op0))
                > GET_MODE_UNIT_SIZE (GET_MODE (target)))
              note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
                                         note, GET_MODE (op0));
            else
              note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
                                         note, GET_MODE (op0));
            break;
          }
        /* FALLTHRU */
      default:
        note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
        break;
      }
  else
    note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0),
                           copy_rtx (op1));

  set_unique_reg_note (last_insn, REG_EQUAL, note);

  return 1;
}
/* Given two input operands, OP0 and OP1, determine what the correct from_mode
   for a widening operation would be.  In most cases this would be OP0, but if
   that's a constant it'll be VOIDmode, which isn't useful.  */

static machine_mode
widened_mode (machine_mode to_mode, rtx op0, rtx op1)
{
  machine_mode m0 = GET_MODE (op0);
  machine_mode m1 = GET_MODE (op1);
  machine_mode result;

  if (m0 == VOIDmode && m1 == VOIDmode)
    return to_mode;
  else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
    result = m1;
  else
    result = m0;

  if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
    return to_mode;

  return result;
}
/* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
   says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
   not actually do a sign-extend or zero-extend, but can leave the
   higher-order bits of the result rtx undefined, for example, in the case
   of logical operations, but not right shifts.  */
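/* For instance, the low-order part of a widened bitwise AND is unaffected
   by whatever the undefined high-order bits contain, whereas a right shift
   would move those undefined bits down into the low-order result.  */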
static rtx
widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
               int unsignedp, int no_extend)
{
  rtx result;
  scalar_int_mode int_mode;

  /* If we don't have to extend and this is a constant, return it.  */
  if (no_extend && GET_MODE (op) == VOIDmode)
    return op;

  /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
     extend since it will be more efficient to do so unless the signedness of
     a promoted object differs from our extension.  */
  if (! no_extend
      || !is_a <scalar_int_mode> (mode, &int_mode)
      || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
          && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
    return convert_modes (mode, oldmode, op, unsignedp);

  /* If MODE is no wider than a single word, we return a lowpart or paradoxical
     SUBREG.  */
  if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
    return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));

  /* Otherwise, get an object of MODE, clobber it, and set the low-order
     part to OP.  */

  result = gen_reg_rtx (int_mode);
  emit_clobber (result);
  emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
  return result;
}
/* Expand vector widening operations.

   There are two different classes of operations handled here:
   1) Operations whose result is wider than all the arguments to the operation.
      Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
      In this case OP0 and optionally OP1 would be initialized,
      but WIDE_OP wouldn't (not relevant for this case).
   2) Operations whose result is of the same size as the last argument to the
      operation, but wider than all the other arguments to the operation.
      Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
      In the case WIDE_OP, OP0 and optionally OP1 would be initialized.

   E.g., when called to expand the following operations, this is how
   the arguments will be initialized:
                                nops    OP0     OP1     WIDE_OP
   widening-sum                 2       oprnd0  -       oprnd1
   widening-dot-product         3       oprnd0  oprnd1  oprnd2
   widening-mult                2       oprnd0  oprnd1  -
   type-promotion (vec-unpack)  1       oprnd0  -       -  */

rtx
expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
                           rtx target, int unsignedp)
{
  struct expand_operand eops[4];
  tree oprnd0, oprnd1, oprnd2;
  machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
  optab widen_pattern_optab;
  enum insn_code icode;
  int nops = TREE_CODE_LENGTH (ops->code);
  int op;

  oprnd0 = ops->op0;
  tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
  widen_pattern_optab =
    optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
  if (ops->code == WIDEN_MULT_PLUS_EXPR
      || ops->code == WIDEN_MULT_MINUS_EXPR)
    icode = find_widening_optab_handler (widen_pattern_optab,
                                         TYPE_MODE (TREE_TYPE (ops->op2)),
                                         tmode0);
  else
    icode = optab_handler (widen_pattern_optab, tmode0);
  gcc_assert (icode != CODE_FOR_nothing);

  if (nops >= 2)
    {
      oprnd1 = ops->op1;
      tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
    }

  /* The last operand is of a wider mode than the rest of the operands.  */
  if (nops == 2)
    wmode = tmode1;
  else if (nops == 3)
    {
      gcc_assert (tmode1 == tmode0);
      gcc_assert (op1);
      oprnd2 = ops->op2;
      wmode = TYPE_MODE (TREE_TYPE (oprnd2));
    }

  op = 0;
  create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
  create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
  if (op1)
    create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
  if (wide_op)
    create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
  expand_insn (icode, op, eops);
  return eops[0].value;
}
/* Generate code to perform an operation specified by TERNARY_OPTAB
   on operands OP0, OP1 and OP2, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
                   rtx op1, rtx op2, rtx target, int unsignedp)
{
  struct expand_operand ops[4];
  enum insn_code icode = optab_handler (ternary_optab, mode);

  gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);

  create_output_operand (&ops[0], target, mode);
  create_convert_operand_from (&ops[1], op0, mode, unsignedp);
  create_convert_operand_from (&ops[2], op1, mode, unsignedp);
  create_convert_operand_from (&ops[3], op2, mode, unsignedp);
  expand_insn (icode, 4, ops);
  return ops[0].value;
}
/* Like expand_binop, but return a constant rtx if the result can be
   calculated at compile time.  The arguments and return value are
   otherwise the same as for expand_binop.  */

rtx
simplify_expand_binop (machine_mode mode, optab binoptab,
                       rtx op0, rtx op1, rtx target, int unsignedp,
                       enum optab_methods methods)
{
  if (CONSTANT_P (op0) && CONSTANT_P (op1))
    {
      rtx x = simplify_binary_operation (optab_to_code (binoptab),
                                         mode, op0, op1);
      if (x)
        return x;
    }

  return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
}
/* Like simplify_expand_binop, but always put the result in TARGET.
   Return true if the expansion succeeded.  */

bool
force_expand_binop (machine_mode mode, optab binoptab,
                    rtx op0, rtx op1, rtx target, int unsignedp,
                    enum optab_methods methods)
{
  rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
                                 target, unsignedp, methods);
  if (x == 0)
    return false;
  if (x != target)
    emit_move_insn (target, x);
  return true;
}
/* Create a new vector value in VMODE with all elements set to OP.  The
   mode of OP must be the element mode of VMODE.  If OP is a constant,
   then the return value will be a constant.  */

rtx
expand_vector_broadcast (machine_mode vmode, rtx op)
{
  enum insn_code icode;
  rtvec vec;
  rtx ret;
  int i, n;

  gcc_checking_assert (VECTOR_MODE_P (vmode));

  if (valid_for_const_vector_p (vmode, op))
    return gen_const_vec_duplicate (vmode, op);

  icode = optab_handler (vec_duplicate_optab, vmode);
  if (icode != CODE_FOR_nothing)
    {
      struct expand_operand ops[2];
      create_output_operand (&ops[0], NULL_RTX, vmode);
      create_input_operand (&ops[1], op, GET_MODE (op));
      expand_insn (icode, 2, ops);
      return ops[0].value;
    }

  /* ??? If the target doesn't have a vec_init, then we have no easy way
     of performing this operation.  Most of this sort of generic support
     is hidden away in the vector lowering support in gimple.  */
  icode = convert_optab_handler (vec_init_optab, vmode,
                                 GET_MODE_INNER (vmode));
  if (icode == CODE_FOR_nothing)
    return NULL;

  n = GET_MODE_NUNITS (vmode);
  vec = rtvec_alloc (n);
  for (i = 0; i < n; ++i)
    RTVEC_ELT (vec, i) = op;
  ret = gen_reg_rtx (vmode);
  emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));

  return ret;
}
/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is >= BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine, except that SUPERWORD_OP1
   is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
   INTO_TARGET may be null if the caller has decided to calculate it.  */
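/* For example, with 32-bit words, a left shift of the pair {HIGH, LOW}
   by a count N >= 32 yields HIGH' = LOW << (N - 32) and LOW' = 0.
   Here LOW is OUTOF_INPUT, HIGH' is INTO_TARGET, LOW' is OUTOF_TARGET
   and SUPERWORD_OP1 is N - 32.  */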
static bool
expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
                        rtx outof_target, rtx into_target,
                        int unsignedp, enum optab_methods methods)
{
  if (into_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
                             into_target, unsignedp, methods))
      return false;

  if (outof_target != 0)
    {
      /* For a signed right shift, we must fill OUTOF_TARGET with copies
         of the sign bit, otherwise we must fill it with zeros.  */
      if (binoptab != ashr_optab)
        emit_move_insn (outof_target, CONST0_RTX (word_mode));
      else
        if (!force_expand_binop (word_mode, binoptab, outof_input,
                                 gen_int_shift_amount (word_mode,
                                                       BITS_PER_WORD - 1),
                                 outof_target, unsignedp, methods))
          return false;
    }
  return true;
}
/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is < BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine.  */

static bool
expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
                      rtx outof_input, rtx into_input, rtx op1,
                      rtx outof_target, rtx into_target,
                      int unsignedp, enum optab_methods methods,
                      unsigned HOST_WIDE_INT shift_mask)
{
  optab reverse_unsigned_shift, unsigned_shift;
  rtx tmp, carries;

  reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
  unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);

  /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
     We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
     the opposite direction to BINOPTAB.  */
  if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
    {
      carries = outof_input;
      tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
                                            op1_mode), op1_mode);
      tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                   0, true, methods);
    }
  else
    {
      /* We must avoid shifting by BITS_PER_WORD bits since that is either
         the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
         has unknown behavior.  Do a single shift first, then shift by the
         remainder.  It's OK to use ~OP1 as the remainder if shift counts
         are truncated to the mode size.  */
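      /* Since BITS_PER_WORD is a power of two, the masked value of ~OP1
         equals (BITS_PER_WORD - 1) - OP1, so the single shift by 1
         followed by the shift by ~OP1 shifts by BITS_PER_WORD - OP1
         in total.  */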
      carries = expand_binop (word_mode, reverse_unsigned_shift,
                              outof_input, const1_rtx, 0, unsignedp, methods);
      if (shift_mask == BITS_PER_WORD - 1)
        {
          tmp = immed_wide_int_const
            (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
          tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
                                       0, true, methods);
        }
      else
        {
          tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
                                                op1_mode), op1_mode);
          tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                       0, true, methods);
        }
    }
  if (tmp == 0 || carries == 0)
    return false;
  carries = expand_binop (word_mode, reverse_unsigned_shift,
                          carries, tmp, 0, unsignedp, methods);
  if (carries == 0)
    return false;

  /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
     so the result can go directly into INTO_TARGET if convenient.  */
  tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
                      into_target, unsignedp, methods);
  if (tmp == 0)
    return false;

  /* Now OR in the bits carried over from OUTOF_INPUT.  */
  if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
                           into_target, unsignedp, methods))
    return false;

  /* Use a standard word_mode shift for the out-of half.  */
  if (outof_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                             outof_target, unsignedp, methods))
      return false;

  return true;
}
/* Try implementing expand_doubleword_shift using conditional moves.
   The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
   otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
   are the shift counts to use in the former and latter case.  All other
   arguments are the same as the parent routine.  */

static bool
expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
                                  enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
                                  rtx outof_input, rtx into_input,
                                  rtx subword_op1, rtx superword_op1,
                                  rtx outof_target, rtx into_target,
                                  int unsignedp, enum optab_methods methods,
                                  unsigned HOST_WIDE_INT shift_mask)
{
  rtx outof_superword, into_superword;

  /* Put the superword version of the output into OUTOF_SUPERWORD and
     INTO_SUPERWORD.  */
  outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
  if (outof_target != 0 && subword_op1 == superword_op1)
    {
      /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
         OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
      into_superword = outof_target;
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, 0, unsignedp, methods))
        return false;
    }
  else
    {
      into_superword = gen_reg_rtx (word_mode);
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, into_superword,
                                   unsignedp, methods))
        return false;
    }

  /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, subword_op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  /* Select between them.  Do the INTO half first because INTO_SUPERWORD
     might be the current value of OUTOF_TARGET.  */
  if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
                              into_target, into_superword, word_mode, false))
    return false;

  if (outof_target != 0)
    if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
                                outof_target, outof_superword,
                                word_mode, false))
      return false;

  return true;
}
/* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
   OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
   input operand; the shift moves bits in the direction OUTOF_INPUT->
   INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
   of the target.  OP1 is the shift count and OP1_MODE is its mode.
   If OP1 is constant, it will have been truncated as appropriate
   and is known to be nonzero.

   If SHIFT_MASK is zero, the result of word shifts is undefined when the
   shift count is outside the range [0, BITS_PER_WORD).  This routine must
   avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).

   If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
   masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
   fill with zeros or sign bits as appropriate.

   If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
   a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
   Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
   In all other cases, shifts by values outside [0, BITS_PER_WORD * 2)
   are undefined.

   BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
   may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
   OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
   function wants to calculate it itself.

   Return true if the shift could be successfully synthesized.  */
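/* For example, with 32-bit words, a left shift of {HIGH, LOW} by a count
   0 < N < 32 computes HIGH' = (HIGH << N) | (LOW >> (32 - N)) and
   LOW' = LOW << N, where LOW is the OUTOF half and HIGH the INTO half;
   counts of 32 or more are handled by expand_superword_shift.  */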
static bool
expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
                         rtx outof_input, rtx into_input, rtx op1,
                         rtx outof_target, rtx into_target,
                         int unsignedp, enum optab_methods methods,
                         unsigned HOST_WIDE_INT shift_mask)
{
  rtx superword_op1, tmp, cmp1, cmp2;
  enum rtx_code cmp_code;

  /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
     fill the result with sign or zero bits as appropriate.  If so, the value
     of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).  Recursively call
     this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
     and INTO_INPUT), then emit code to set up OUTOF_TARGET.

     This isn't worthwhile for constant shifts since the optimizers will
     cope better with in-range shift counts.  */
  if (shift_mask >= BITS_PER_WORD
      && outof_target != 0
      && !CONSTANT_P (op1))
    {
      if (!expand_doubleword_shift (op1_mode, binoptab,
                                    outof_input, into_input, op1,
                                    0, into_target,
                                    unsignedp, methods, shift_mask))
        return false;
      if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                               outof_target, unsignedp, methods))
        return false;
      return true;
    }

  /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
     is true when the effective shift value is less than BITS_PER_WORD.
     Set SUPERWORD_OP1 to the shift count that should be used to shift
     OUTOF_INPUT into INTO_TARGET when the condition is false.  */
  tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
  if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
    {
      /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
         is a subword shift count.  */
      cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = EQ;
      superword_op1 = op1;
    }
  else
    {
      /* Set CMP1 to OP1 - BITS_PER_WORD.  */
      cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = LT;
      superword_op1 = cmp1;
    }
  if (cmp1 == 0)
    return false;

  /* If we can compute the condition at compile time, pick the
     appropriate subroutine.  */
  tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
  if (tmp != 0 && CONST_INT_P (tmp))
    {
      if (tmp == const0_rtx)
        return expand_superword_shift (binoptab, outof_input, superword_op1,
                                       outof_target, into_target,
                                       unsignedp, methods);
      else
        return expand_subword_shift (op1_mode, binoptab,
                                     outof_input, into_input, op1,
                                     outof_target, into_target,
                                     unsignedp, methods, shift_mask);
    }

  /* Try using conditional moves to generate straight-line code.  */
  if (HAVE_conditional_move)
    {
      rtx_insn *start = get_last_insn ();
      if (expand_doubleword_shift_condmove (op1_mode, binoptab,
                                            cmp_code, cmp1, cmp2,
                                            outof_input, into_input,
                                            op1, superword_op1,
                                            outof_target, into_target,
                                            unsignedp, methods, shift_mask))
        return true;
      delete_insns_since (start);
    }

  /* As a last resort, use branches to select the correct alternative.  */
  rtx_code_label *subword_label = gen_label_rtx ();
  rtx_code_label *done_label = gen_label_rtx ();

  NO_DEFER_POP;
  do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
                           0, 0, subword_label,
                           profile_probability::uninitialized ());
  OK_DEFER_POP;

  if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                               outof_target, into_target,
                               unsignedp, methods))
    return false;

  emit_jump_insn (targetm.gen_jump (done_label));
  emit_barrier ();
  emit_label (subword_label);

  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  emit_label (done_label);
  return true;
}
/* Subroutine of expand_binop.  Perform a double word multiplication of
   operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
   as the target's word_mode.  This function returns NULL_RTX if anything
   goes wrong, in which case it may have already emitted instructions
   which need to be deleted.

   If we want to multiply two two-word values and have normal and widening
   multiplies of single-word values, we can do this with three smaller
   multiplications.

   The multiplication proceeds as follows:
                                 _______________________
                                [__op0_high_|__op0_low__]
                                 _______________________
        *                       [__op1_high_|__op1_low__]
        _________________________________________________

                                 _______________________
    (1)                         [__op0_low__*__op1_low__]
                     _______________________
    (2a)            [__op0_low__*__op1_high_]
                     _______________________
    (2b)            [__op0_high_*__op1_low__]
         _______________________
    (3) [__op0_high_*__op1_high_]

   This gives a 4-word result.  Since we are only interested in the
   lower 2 words, partial result (3) and the upper words of (2a) and
   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
   calculated using non-widening multiplication.

   (1), however, needs to be calculated with an unsigned widening
   multiplication.  If this operation is not directly supported we
   try using a signed widening multiplication and adjust the result.
   This adjustment works as follows:

   If both operands are positive then no adjustment is needed.

   If the operands have different signs, for example op0_low < 0 and
   op1_low >= 0, the instruction treats the most significant bit of
   op0_low as a sign bit instead of a bit with significance
   2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
   with 2**BITS_PER_WORD - op0_low, and two's complements the
   result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
   the result.

   Similarly, if both operands are negative, we need to add
   (op0_low + op1_low) * 2**BITS_PER_WORD.

   We use a trick to adjust quickly.  We logically shift op0_low right
   (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
   op0_high (op1_high) before it is used to calculate 2b (2a).  If no
   logical shift exists, we do an arithmetic right shift and subtract
   the 0 or -1.  */
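/* As a small worked example, take BITS_PER_WORD == 8, op0 = 0x0180 and
   op1 = 0x0002, whose true product is 0x0300.  A signed widening multiply
   of the low words treats 0x80 as -128 and yields -128 * 2 = 0xff00.
   The adjustment adds op0_low >> 7 == 1 to op0_high, so (2b) becomes
   (1 + 1) * 2 = 4 and (2a) is 0; adding 4 to the high word of the
   product gives 0xff00 + 0x0400 = 0x0300, as required.  */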
static rtx
expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
                        bool umulp, enum optab_methods methods)
{
  int low = (WORDS_BIG_ENDIAN ? 1 : 0);
  int high = (WORDS_BIG_ENDIAN ? 0 : 1);
  rtx wordm1 = (umulp ? NULL_RTX
                : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
  rtx product, adjust, product_high, temp;

  rtx op0_high = operand_subword_force (op0, high, mode);
  rtx op0_low = operand_subword_force (op0, low, mode);
  rtx op1_high = operand_subword_force (op1, high, mode);
  rtx op1_low = operand_subword_force (op1, low, mode);

  /* If we're using an unsigned multiply to directly compute the product
     of the low-order words of the operands and perform any required
     adjustments of the operands, we begin by trying two more multiplications
     and then computing the appropriate sum.

     We have checked above that the required addition is provided.
     Full-word addition will normally always succeed, especially if
     it is provided at all, so we don't worry about its failure.  The
     multiplication may well fail, however, so we do handle that.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op0_high)
        return NULL_RTX;
    }

  adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
                         NULL_RTX, 0, OPTAB_DIRECT);
  if (!adjust)
    return NULL_RTX;

  /* OP0_HIGH should now be dead.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op1_high)
        return NULL_RTX;
    }

  temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
                       NULL_RTX, 0, OPTAB_DIRECT);
  if (!temp)
    return NULL_RTX;

  /* OP1_HIGH should now be dead.  */

  adjust = expand_binop (word_mode, add_optab, adjust, temp,
                         NULL_RTX, 0, OPTAB_DIRECT);

  if (target && !REG_P (target))
    target = NULL_RTX;

  /* *_widen_optab needs to determine operand mode, make sure at least
     one operand has non-VOID mode.  */
  if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
    op0_low = force_reg (word_mode, op0_low);

  if (umulp)
    product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);
  else
    product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);

  if (!product)
    return NULL_RTX;

  product_high = operand_subword (product, high, 1, mode);
  adjust = expand_binop (word_mode, add_optab, product_high, adjust,
                         NULL_RTX, 0, OPTAB_DIRECT);
  emit_move_insn (product_high, adjust);
  return product;
}
/* Wrapper around expand_binop which takes an rtx code to specify
   the operation to perform, not an optab pointer.  All other
   arguments are the same.  */
rtx
expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
                     rtx op1, rtx target, int unsignedp,
                     enum optab_methods methods)
{
  optab binop = code_to_optab (code);
  gcc_assert (binop);

  return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
}
/* Return whether OP0 and OP1 should be swapped when expanding a commutative
   binop.  Order them according to commutative_operand_precedence and, if
   possible, try to put TARGET or a pseudo first.  */
static bool
swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
{
  int op0_prec = commutative_operand_precedence (op0);
  int op1_prec = commutative_operand_precedence (op1);

  if (op0_prec < op1_prec)
    return true;

  if (op0_prec > op1_prec)
    return false;

  /* With equal precedence, both orders are ok, but it is better if the
     first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
  if (target == 0 || REG_P (target))
    return (REG_P (op1) && !REG_P (op0)) || target == op1;
  else
    return rtx_equal_p (op1, target);
}
/* Return true if BINOPTAB implements a shift operation.  */

static bool
shift_optab_p (optab binoptab)
{
  switch (optab_to_code (binoptab))
    {
    case ASHIFT:
    case SS_ASHIFT:
    case US_ASHIFT:
    case ASHIFTRT:
    case LSHIFTRT:
    case ROTATE:
    case ROTATERT:
      return true;

    default:
      return false;
    }
}
/* Return true if BINOPTAB implements a commutative binary operation.  */

static bool
commutative_optab_p (optab binoptab)
{
  return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
          || binoptab == smul_widen_optab
          || binoptab == umul_widen_optab
          || binoptab == smul_highpart_optab
          || binoptab == umul_highpart_optab);
}
/* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
   optimizing, and if the operand is a constant that costs more than
   1 instruction, force the constant into a register and return that
   register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */

static rtx
avoid_expensive_constant (machine_mode mode, optab binoptab,
                          int opn, rtx x, bool unsignedp)
{
  bool speed = optimize_insn_for_speed_p ();

  if (mode != VOIDmode
      && optimize
      && CONSTANT_P (x)
      && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
          > set_src_cost (x, mode, speed)))
    {
      if (CONST_INT_P (x))
        {
          HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
          if (intval != INTVAL (x))
            x = GEN_INT (intval);
        }
      else
        x = convert_modes (mode, VOIDmode, x, unsignedp);
      x = force_reg (mode, x);
    }
  return x;
}
/* Helper function for expand_binop: handle the case where there
   is an insn ICODE that directly implements the indicated operation.
   Returns null if this is not possible.  */
static rtx
expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
                       rtx op0, rtx op1,
                       rtx target, int unsignedp, enum optab_methods methods,
                       rtx_insn *last)
{
  machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
  machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
  machine_mode mode0, mode1, tmp_mode;
  struct expand_operand ops[3];
  bool commutative_p;
  rtx_insn *pat;
  rtx xop0 = op0, xop1 = op1;
  bool canonicalize_op1 = false;

  /* If it is a commutative operator and the modes would match
     if we would swap the operands, we can save the conversions.  */
  commutative_p = commutative_optab_p (binoptab);
  if (commutative_p
      && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
      && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
    std::swap (xop0, xop1);

  /* If we are optimizing, force expensive constants into a register.  */
  xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
  if (!shift_optab_p (binoptab))
    xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
  else
    /* Shifts and rotates often use a different mode for op1 from op0;
       for VOIDmode constants we don't know the mode, so force it
       to be canonicalized using convert_modes.  */
    canonicalize_op1 = true;

  /* In case the insn wants input operands in modes different from
     those of the actual operands, convert the operands.  It would
     seem that we don't need to convert CONST_INTs, but we do, so
     that they're properly zero-extended, sign-extended or truncated
     for their mode.  */

  mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
  if (xmode0 != VOIDmode && xmode0 != mode0)
    {
      xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
      mode0 = xmode0;
    }

  mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
           ? GET_MODE (xop1) : mode);
  if (xmode1 != VOIDmode && xmode1 != mode1)
    {
      xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
      mode1 = xmode1;
    }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_p
      && swap_commutative_operands_with_target (target, xop0, xop1))
    std::swap (xop0, xop1);

  /* Now, if insn's predicates don't allow our operands, put them into
     pseudo regs.  */

  if (binoptab == vec_pack_trunc_optab
      || binoptab == vec_pack_usat_optab
      || binoptab == vec_pack_ssat_optab
      || binoptab == vec_pack_ufix_trunc_optab
      || binoptab == vec_pack_sfix_trunc_optab)
    {
      /* The mode of the result is different from the mode of the
         arguments.  */
      tmp_mode = insn_data[(int) icode].operand[0].mode;
      if (VECTOR_MODE_P (mode)
          && GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
        {
          delete_insns_since (last);
          return NULL_RTX;
        }
    }
  else
    tmp_mode = mode;

  create_output_operand (&ops[0], target, tmp_mode);
  create_input_operand (&ops[1], xop0, mode0);
  create_input_operand (&ops[2], xop1, mode1);
  pat = maybe_gen_insn (icode, 3, ops);
  if (pat)
    {
      /* If PAT is composed of more than one insn, try to add an appropriate
         REG_EQUAL note to it.  If we can't because TEMP conflicts with an
         operand, call expand_binop again, this time without a target.  */
      if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
          && ! add_equal_note (pat, ops[0].value,
                               optab_to_code (binoptab),
                               ops[1].value, ops[2].value))
        {
          delete_insns_since (last);
          return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
                               unsignedp, methods);
        }

      emit_insn (pat);
      return ops[0].value;
    }
  delete_insns_since (last);
  return NULL_RTX;
}
/* Generate code to perform an operation specified by BINOPTAB
   on operands OP0 and OP1, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
              rtx target, int unsignedp, enum optab_methods methods)
{
  enum optab_methods next_methods
    = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
       ? OPTAB_WIDEN : methods);
  enum mode_class mclass;
  enum insn_code icode;
  machine_mode wider_mode;
  scalar_int_mode int_mode;
  rtx libfunc;
  rtx temp;
  rtx_insn *entry_last = get_last_insn ();
  rtx_insn *last;

  mclass = GET_MODE_CLASS (mode);

  /* If subtracting an integer constant, convert this into an addition of
     the negated constant.  */

  if (binoptab == sub_optab && CONST_INT_P (op1))
    {
      op1 = negate_rtx (mode, op1);
      binoptab = add_optab;
    }
  /* For shifts, constant invalid op1 might be expanded from different
     mode than MODE.  As those are invalid, force them to a register
     to avoid further problems during expansion.  */
  else if (CONST_INT_P (op1)
           && shift_optab_p (binoptab)
           && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
    {
      op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
      op1 = force_reg (GET_MODE_INNER (mode), op1);
    }

  /* Record where to delete back to if we backtrack.  */
  last = get_last_insn ();

  /* If we can do it with a three-operand insn, do so.  */

  if (methods != OPTAB_MUST_WIDEN)
    {
      if (convert_optab_p (binoptab))
        {
          machine_mode from_mode = widened_mode (mode, op0, op1);
          icode = find_widening_optab_handler (binoptab, mode, from_mode);
        }
      else
        icode = optab_handler (binoptab, mode);
      if (icode != CODE_FOR_nothing)
        {
          temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
                                        target, unsignedp, methods, last);
          if (temp)
            return temp;
        }
    }

  /* If we were trying to rotate, and that didn't work, try rotating
     the other direction before falling back to shifts and bitwise-or.  */
  if (((binoptab == rotl_optab
        && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
       || (binoptab == rotr_optab
           && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
      && is_int_mode (mode, &int_mode))
    {
      optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
      rtx newop1;
      unsigned int bits = GET_MODE_PRECISION (int_mode);

      if (CONST_INT_P (op1))
        newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
      else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
        newop1 = negate_rtx (GET_MODE (op1), op1);
      else
        newop1 = expand_binop (GET_MODE (op1), sub_optab,
                               gen_int_mode (bits, GET_MODE (op1)), op1,
                               NULL_RTX, unsignedp, OPTAB_DIRECT);

      temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
                                    target, unsignedp, methods, last);
      if (temp)
        return temp;
    }

  /* If this is a multiply, see if we can do a widening operation that
     takes operands of this mode and makes a wider mode.  */

  if (binoptab == smul_optab
      && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
      && (convert_optab_handler ((unsignedp
                                  ? umul_widen_optab
                                  : smul_widen_optab),
                                 wider_mode, mode) != CODE_FOR_nothing))
    {
      /* *_widen_optab needs to determine operand mode, make sure at least
         one operand has non-VOID mode.  */
      if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
        op0 = force_reg (mode, op0);
      temp = expand_binop (wider_mode,
                           unsignedp ? umul_widen_optab : smul_widen_optab,
                           op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);

      if (temp != 0)
        {
          if (GET_MODE_CLASS (mode) == MODE_INT
              && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
            return gen_lowpart (mode, temp);
          else
            return convert_to_mode (mode, temp, unsignedp);
        }
    }

  /* If this is a vector shift by a scalar, see if we can do a vector
     shift by a vector.  If so, broadcast the scalar into a vector.  */
  if (mclass == MODE_VECTOR_INT)
    {
      optab otheroptab = unknown_optab;

      if (binoptab == ashl_optab)
        otheroptab = vashl_optab;
      else if (binoptab == ashr_optab)
        otheroptab = vashr_optab;
      else if (binoptab == lshr_optab)
        otheroptab = vlshr_optab;
      else if (binoptab == rotl_optab)
        otheroptab = vrotl_optab;
      else if (binoptab == rotr_optab)
        otheroptab = vrotr_optab;

      if (otheroptab
          && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
        {
          /* The scalar may have been extended to be too wide.  Truncate
             it back to the proper size to fit in the broadcast vector.  */
          scalar_mode inner_mode = GET_MODE_INNER (mode);
          if (!CONST_INT_P (op1)
              && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
                  > GET_MODE_BITSIZE (inner_mode)))
            op1 = force_reg (inner_mode,
                             simplify_gen_unary (TRUNCATE, inner_mode, op1,
                                                 GET_MODE (op1)));
          rtx vop1 = expand_vector_broadcast (mode, op1);
          if (vop1)
            {
              temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
                                            target, unsignedp, methods, last);
              if (temp)
                return temp;
            }
        }
    }

  /* Look for a wider mode of the same class for which we think we
     can open-code the operation.  Check for a widening multiply at the
     wider mode as well.  */

  if (CLASS_HAS_WIDER_MODES_P (mclass)
      && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
    FOR_EACH_WIDER_MODE (wider_mode, mode)
      {
        machine_mode next_mode;
        if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
            || (binoptab == smul_optab
                && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
                && (find_widening_optab_handler ((unsignedp
                                                  ? umul_widen_optab
                                                  : smul_widen_optab),
                                                 next_mode, mode)
                    != CODE_FOR_nothing)))
          {
            rtx xop0 = op0, xop1 = op1;
            int no_extend = 0;

            /* For certain integer operations, we need not actually extend
               the narrow operands, as long as we will truncate
               the results to the same narrowness.  */

            if ((binoptab == ior_optab || binoptab == and_optab
                 || binoptab == xor_optab
                 || binoptab == add_optab || binoptab == sub_optab
                 || binoptab == smul_optab || binoptab == ashl_optab)
                && mclass == MODE_INT)
              {
                no_extend = 1;
                xop0 = avoid_expensive_constant (mode, binoptab, 0,
                                                 xop0, unsignedp);
                if (binoptab != ashl_optab)
                  xop1 = avoid_expensive_constant (mode, binoptab, 1,
                                                   xop1, unsignedp);
              }

            xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);

            /* The second operand of a shift must always be extended.  */
            xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
                                  no_extend && binoptab != ashl_optab);

            temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
                                 unsignedp, OPTAB_DIRECT);
            if (temp)
              {
                if (mclass != MODE_INT
                    || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
                  {
                    if (target == 0)
                      target = gen_reg_rtx (mode);
                    convert_move (target, temp, 0);
                    return target;
                  }
                else
                  return gen_lowpart (mode, temp);
              }
            else
              delete_insns_since (last);
          }
      }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_optab_p (binoptab)
      && swap_commutative_operands_with_target (target, op0, op1))
    std::swap (op0, op1);

  /* These can be done a word at a time.  */
  if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
      && is_int_mode (mode, &int_mode)
      && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
    {
      int i;
      rtx_insn *insns;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  */
      if (target == 0
          || target == op0
          || target == op1
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      /* Do the actual arithmetic.  */
      for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
        {
          rtx target_piece = operand_subword (target, i, 1, int_mode);
          rtx x = expand_binop (word_mode, binoptab,
                                operand_subword_force (op0, i, int_mode),
                                operand_subword_force (op1, i, int_mode),
                                target_piece, unsignedp, next_methods);

          if (x == 0)
            break;

          if (target_piece != x)
            emit_move_insn (target_piece, x);
        }

      insns = get_insns ();
      end_sequence ();

      if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
        {
          emit_insn (insns);
          return target;
        }
    }

  /* Synthesize double word shifts from single word shifts.  */
  if ((binoptab == lshr_optab || binoptab == ashl_optab
       || binoptab == ashr_optab)
      && is_int_mode (mode, &int_mode)
      && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
      && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
      && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
      scalar_int_mode op1_mode;

      double_shift_mask = targetm.shift_truncation_mask (int_mode);
      shift_mask = targetm.shift_truncation_mask (word_mode);
      op1_mode = (GET_MODE (op1) != VOIDmode
                  ? as_a <scalar_int_mode> (GET_MODE (op1))
                  : word_mode);

      /* Apply the truncation to constant shifts.  */
      if (double_shift_mask > 0 && CONST_INT_P (op1))
        op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);

      if (op1 == CONST0_RTX (op1_mode))
        return op0;

      /* Make sure that this is a combination that expand_doubleword_shift
         can handle.  See the comments there for details.  */
      if (double_shift_mask == 0
          || (shift_mask == BITS_PER_WORD - 1
              && double_shift_mask == BITS_PER_WORD * 2 - 1))
        {
          rtx_insn *insns;
          rtx into_target, outof_target;
          rtx into_input, outof_input;
          int left_shift, outof_word;

          /* If TARGET is the same as one of the operands, the REG_EQUAL note
             won't be accurate, so use a new target.  */
          if (target == 0
              || target == op0
              || target == op1
              || !valid_multiword_target_p (target))
            target = gen_reg_rtx (int_mode);

          start_sequence ();

          /* OUTOF_* is the word we are shifting bits away from, and
             INTO_* is the word that we are shifting bits towards, thus
             they differ depending on the direction of the shift and
             WORDS_BIG_ENDIAN.  */

          left_shift = binoptab == ashl_optab;
          outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

          outof_target = operand_subword (target, outof_word, 1, int_mode);
          into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

          outof_input = operand_subword_force (op0, outof_word, int_mode);
          into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

          if (expand_doubleword_shift (op1_mode, binoptab,
                                       outof_input, into_input, op1,
                                       outof_target, into_target,
                                       unsignedp, next_methods, shift_mask))
            {
              insns = get_insns ();
              end_sequence ();

              emit_insn (insns);
              return target;
            }
          end_sequence ();
        }
    }

  /* Synthesize double word rotates from single word shifts.  */
  if ((binoptab == rotl_optab || binoptab == rotr_optab)
      && is_int_mode (mode, &int_mode)
      && CONST_INT_P (op1)
      && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      rtx_insn *insns;
      rtx into_target, outof_target;
      rtx into_input, outof_input;
      rtx inter;
      int shift_count, left_shift, outof_word;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  Do this also if target is not
         a REG, first because having a register instead may open optimization
         opportunities, and second because if target and op0 happen to be MEMs
         designating the same location, we would risk clobbering it too early
         in the code sequence we generate below.  */
      if (target == 0
          || target == op0
          || target == op1
          || !REG_P (target)
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      shift_count = INTVAL (op1);

      /* OUTOF_* is the word we are shifting bits away from, and
         INTO_* is the word that we are shifting bits towards, thus
         they differ depending on the direction of the shift and
         WORDS_BIG_ENDIAN.  */
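      /* For example, rotating {HIGH, LOW} left by 0 < N < BITS_PER_WORD
         computes HIGH' = (HIGH << N) | (LOW >> (BITS_PER_WORD - N)) and
         LOW' = (LOW << N) | (HIGH >> (BITS_PER_WORD - N)); each half below
         is built from such a pair of single-word shifts ORed together.  */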
      left_shift = (binoptab == rotl_optab);
      outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

      outof_target = operand_subword (target, outof_word, 1, int_mode);
      into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

      outof_input = operand_subword_force (op0, outof_word, int_mode);
      into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

      if (shift_count == BITS_PER_WORD)
        {
          /* This is just a word swap.  */
          emit_move_insn (outof_target, into_input);
          emit_move_insn (into_target, outof_input);
          inter = const0_rtx;
        }
      else
        {
          rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
          HOST_WIDE_INT first_shift_count, second_shift_count;
          optab reverse_unsigned_shift, unsigned_shift;

          reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                                    ? lshr_optab : ashl_optab);

          unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                            ? ashl_optab : lshr_optab);

          if (shift_count > BITS_PER_WORD)
            {
              first_shift_count = shift_count - BITS_PER_WORD;
              second_shift_count = 2 * BITS_PER_WORD - shift_count;
            }
          else
            {
              first_shift_count = BITS_PER_WORD - shift_count;
              second_shift_count = shift_count;
            }
          rtx first_shift_count_rtx
            = gen_int_shift_amount (word_mode, first_shift_count);
          rtx second_shift_count_rtx
            = gen_int_shift_amount (word_mode, second_shift_count);

          into_temp1 = expand_binop (word_mode, unsigned_shift,
                                     outof_input, first_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);
          into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                     into_input, second_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);

          if (into_temp1 != 0 && into_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
                                  into_target, unsignedp, next_methods);
          else
            inter = 0;

          if (inter != 0 && inter != into_target)
            emit_move_insn (into_target, inter);

          outof_temp1 = expand_binop (word_mode, unsigned_shift,
                                      into_input, first_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);
          outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                      outof_input, second_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);

          if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab,
                                  outof_temp1, outof_temp2,
                                  outof_target, unsignedp, next_methods);

          if (inter != 0 && inter != outof_target)
            emit_move_insn (outof_target, inter);
        }

      insns = get_insns ();
      end_sequence ();

      if (inter != 0)
        {
          emit_insn (insns);
          return target;
        }
    }

  /* These can be done a word at a time by propagating carries.  */
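  /* For addition, the carry out of each word is the unsigned comparison
     X < OP0_PIECE of the word sum against one addend; for subtraction,
     the borrow is the unsigned comparison X > OP0_PIECE.  That is what
     the emit_store_flag_force calls below compute.  */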
1594 if ((binoptab == add_optab || binoptab == sub_optab)
1595 && is_int_mode (mode, &int_mode)
1596 && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
1597 && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1599 unsigned int i;
1600 optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1601 const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
1602 rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1603 rtx xop0, xop1, xtarget;
1605 /* We can handle either a 1 or -1 value for the carry. If STORE_FLAG
1606 value is one of those, use it. Otherwise, use 1 since it is the
1607 one easiest to get. */
1608 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1609 int normalizep = STORE_FLAG_VALUE;
1610 #else
1611 int normalizep = 1;
1612 #endif
1614 /* Prepare the operands. */
1615 xop0 = force_reg (int_mode, op0);
1616 xop1 = force_reg (int_mode, op1);
1618 xtarget = gen_reg_rtx (int_mode);
1620 if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1621 target = xtarget;
1623 /* Indicate for flow that the entire target reg is being set. */
1624 if (REG_P (target))
1625 emit_clobber (xtarget);
1627 /* Do the actual arithmetic. */
1628 for (i = 0; i < nwords; i++)
1630 int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1631 rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
1632 rtx op0_piece = operand_subword_force (xop0, index, int_mode);
1633 rtx op1_piece = operand_subword_force (xop1, index, int_mode);
1634 rtx x;
1636 /* Main add/subtract of the input operands. */
1637 x = expand_binop (word_mode, binoptab,
1638 op0_piece, op1_piece,
1639 target_piece, unsignedp, next_methods);
1640 if (x == 0)
1641 break;
1643 if (i + 1 < nwords)
1645 /* Store carry from main add/subtract. */
1646 carry_out = gen_reg_rtx (word_mode);
1647 carry_out = emit_store_flag_force (carry_out,
1648 (binoptab == add_optab
1649 ? LT : GT),
1650 x, op0_piece,
1651 word_mode, 1, normalizep);
1654 if (i > 0)
1656 rtx newx;
1658 /* Add/subtract previous carry to main result. */
1659 newx = expand_binop (word_mode,
1660 normalizep == 1 ? binoptab : otheroptab,
1661 x, carry_in,
1662 NULL_RTX, 1, next_methods);
1664 if (i + 1 < nwords)
1666 /* Get out carry from adding/subtracting carry in. */
1667 rtx carry_tmp = gen_reg_rtx (word_mode);
1668 carry_tmp = emit_store_flag_force (carry_tmp,
1669 (binoptab == add_optab
1670 ? LT : GT),
1671 newx, x,
1672 word_mode, 1, normalizep);
1674 /* Logical-ior the two poss. carry together. */
1675 carry_out = expand_binop (word_mode, ior_optab,
1676 carry_out, carry_tmp,
1677 carry_out, 0, next_methods);
1678 if (carry_out == 0)
1679 break;
1681 emit_move_insn (target_piece, newx);
1683 else
1685 if (x != target_piece)
1686 emit_move_insn (target_piece, x);
1689 carry_in = carry_out;
1692 if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
1694 if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
1695 || ! rtx_equal_p (target, xtarget))
1697 rtx_insn *temp = emit_move_insn (target, xtarget);
1699 set_dst_reg_note (temp, REG_EQUAL,
1700 gen_rtx_fmt_ee (optab_to_code (binoptab),
1701 int_mode, copy_rtx (xop0),
1702 copy_rtx (xop1)),
1703 target);
1705 else
1706 target = xtarget;
1708 return target;
1711 else
1712 delete_insns_since (last);
1715 /* Attempt to synthesize double word multiplies using a sequence of word
1716 mode multiplications. We first attempt to generate a sequence using a
1717 more efficient unsigned widening multiply, and if that fails we then
1718 try using a signed widening multiply. */
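/* [Editorial sketch; expand_doubleword_mult is defined elsewhere in
   this file, so this is the standard identity it relies on rather
   than a quote of its code.] Writing each operand as hi * 2^N + lo
   with N == BITS_PER_WORD, the low 2N bits of the product are

     (uint2N) u_lo * v_lo                    one widening multiply
     + ((uintN) (u_lo * v_hi) << N)          plus two truncating
     + ((uintN) (u_hi * v_lo) << N)          multiplies of the words

   The u_hi * v_hi term is dropped because it only affects bits at or
   above position 2N. */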
1720 if (binoptab == smul_optab
1721 && is_int_mode (mode, &int_mode)
1722 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1723 && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1724 && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1726 rtx product = NULL_RTX;
1727 if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
1728 != CODE_FOR_nothing)
1730 product = expand_doubleword_mult (int_mode, op0, op1, target,
1731 true, methods);
1732 if (!product)
1733 delete_insns_since (last);
1736 if (product == NULL_RTX
1737 && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
1738 != CODE_FOR_nothing))
1740 product = expand_doubleword_mult (int_mode, op0, op1, target,
1741 false, methods);
1742 if (!product)
1743 delete_insns_since (last);
1746 if (product != NULL_RTX)
1748 if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1750 rtx_insn *move = emit_move_insn (target ? target : product,
1751 product);
1752 set_dst_reg_note (move,
1753 REG_EQUAL,
1754 gen_rtx_fmt_ee (MULT, int_mode,
1755 copy_rtx (op0),
1756 copy_rtx (op1)),
1757 target ? target : product);
1759 return product;
1763 /* It can't be open-coded in this mode.
1764 Use a library call if one is available and caller says that's ok. */
1766 libfunc = optab_libfunc (binoptab, mode);
1767 if (libfunc
1768 && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1770 rtx_insn *insns;
1771 rtx op1x = op1;
1772 machine_mode op1_mode = mode;
1773 rtx value;
1775 start_sequence ();
1777 if (shift_optab_p (binoptab))
1779 op1_mode = targetm.libgcc_shift_count_mode ();
1780 /* Specify unsigned here,
1781 since negative shift counts are meaningless. */
1782 op1x = convert_to_mode (op1_mode, op1, 1);
1785 if (GET_MODE (op0) != VOIDmode
1786 && GET_MODE (op0) != mode)
1787 op0 = convert_to_mode (mode, op0, unsignedp);
1789 /* Pass 1 for NO_QUEUE so we don't lose any increments
1790 if the libcall is cse'd or moved. */
1791 value = emit_library_call_value (libfunc,
1792 NULL_RTX, LCT_CONST, mode,
1793 op0, mode, op1x, op1_mode);
1795 insns = get_insns ();
1796 end_sequence ();
1798 bool trapv = trapv_binoptab_p (binoptab);
1799 target = gen_reg_rtx (mode);
1800 emit_libcall_block_1 (insns, target, value,
1801 trapv ? NULL_RTX
1802 : gen_rtx_fmt_ee (optab_to_code (binoptab),
1803 mode, op0, op1), trapv);
1805 return target;
1808 delete_insns_since (last);
1810 /* It can't be done in this mode. Can we do it in a wider mode? */
1812 if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1813 || methods == OPTAB_MUST_WIDEN))
1815 /* Caller says, don't even try. */
1816 delete_insns_since (entry_last);
1817 return 0;
1820 /* Compute the value of METHODS to pass to recursive calls.
1821 Don't allow widening to be tried recursively. */
1823 methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1825 /* Look for a wider mode of the same class for which it appears we can do
1826 the operation. */
1828 if (CLASS_HAS_WIDER_MODES_P (mclass))
1830 /* This code doesn't make sense for conversion optabs, since we
1831 wouldn't then want to extend the operands to be the same size
1832 as the result. */
1833 gcc_assert (!convert_optab_p (binoptab));
1834 FOR_EACH_WIDER_MODE (wider_mode, mode)
1836 if (optab_handler (binoptab, wider_mode)
1837 || (methods == OPTAB_LIB
1838 && optab_libfunc (binoptab, wider_mode)))
1840 rtx xop0 = op0, xop1 = op1;
1841 int no_extend = 0;
1843 /* For certain integer operations, we need not actually extend
1844 the narrow operands, as long as we will truncate
1845 the results to the same narrowness. */
1847 if ((binoptab == ior_optab || binoptab == and_optab
1848 || binoptab == xor_optab
1849 || binoptab == add_optab || binoptab == sub_optab
1850 || binoptab == smul_optab || binoptab == ashl_optab)
1851 && mclass == MODE_INT)
1852 no_extend = 1;
1854 xop0 = widen_operand (xop0, wider_mode, mode,
1855 unsignedp, no_extend);
1857 /* The second operand of a shift must always be extended. */
1858 xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1859 no_extend && binoptab != ashl_optab);
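/* [Editorial note.] The no_extend case is justified by truncation:
   for the bitwise ops, add, sub, mul and left shift, the low N bits
   of the wide result depend only on the low N bits of the inputs,
   e.g.

     (uint8_t) ((uint32_t) a * (uint32_t) b) == (uint8_t) (a * b)

   so whatever occupies the high bits of the widened registers is
   harmless. A shift count selects a bit position rather than feeding
   the arithmetic, hence the forced extension of xop1 above. */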
1861 temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1862 unsignedp, methods);
1863 if (temp)
1865 if (mclass != MODE_INT
1866 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1868 if (target == 0)
1869 target = gen_reg_rtx (mode);
1870 convert_move (target, temp, 0);
1871 return target;
1873 else
1874 return gen_lowpart (mode, temp);
1876 else
1877 delete_insns_since (last);
1882 delete_insns_since (entry_last);
1883 return 0;
1886 /* Expand a binary operator which has both signed and unsigned forms.
1887 UOPTAB is the optab for unsigned operations, and SOPTAB is for
1888 signed operations.
1890 If we widen unsigned operands, we may use a signed wider operation instead
1891 of an unsigned wider operation, since the result would be the same. */
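/* [Editorial example.] The signed-for-unsigned substitution is safe
   because widening an unsigned operand zero-extends it: both wide
   inputs are then non-negative, where signed and unsigned arithmetic
   agree. E.g. an unsigned QImode division can be carried out as a
   signed SImode division of the zero-extended operands. */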
1894 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1895 rtx op0, rtx op1, rtx target, int unsignedp,
1896 enum optab_methods methods)
1898 rtx temp;
1899 optab direct_optab = unsignedp ? uoptab : soptab;
1900 bool save_enable;
1902 /* Do it without widening, if possible. */
1903 temp = expand_binop (mode, direct_optab, op0, op1, target,
1904 unsignedp, OPTAB_DIRECT);
1905 if (temp || methods == OPTAB_DIRECT)
1906 return temp;
1908 /* Try widening to a signed int. Disable any direct use of any
1909 signed insn in the current mode. */
1910 save_enable = swap_optab_enable (soptab, mode, false);
1912 temp = expand_binop (mode, soptab, op0, op1, target,
1913 unsignedp, OPTAB_WIDEN);
1915 /* For unsigned operands, try widening to an unsigned int. */
1916 if (!temp && unsignedp)
1917 temp = expand_binop (mode, uoptab, op0, op1, target,
1918 unsignedp, OPTAB_WIDEN);
1919 if (temp || methods == OPTAB_WIDEN)
1920 goto egress;
1922 /* Use the right width libcall if that exists. */
1923 temp = expand_binop (mode, direct_optab, op0, op1, target,
1924 unsignedp, OPTAB_LIB);
1925 if (temp || methods == OPTAB_LIB)
1926 goto egress;
1928 /* Must widen and use a libcall; use either signed or unsigned. */
1929 temp = expand_binop (mode, soptab, op0, op1, target,
1930 unsignedp, methods);
1931 if (!temp && unsignedp)
1932 temp = expand_binop (mode, uoptab, op0, op1, target,
1933 unsignedp, methods);
1935 egress:
1936 /* Undo the fiddling above. */
1937 if (save_enable)
1938 swap_optab_enable (soptab, mode, true);
1939 return temp;
1942 /* Generate code to perform an operation specified by UNOPPTAB
1943 on operand OP0, with two results to TARG0 and TARG1.
1944 We assume that the order of the operands for the instruction
1945 is TARG0, TARG1, OP0.
1947 Either TARG0 or TARG1 may be zero, but what that means is that
1948 the result is not actually wanted. We will generate it into
1949 a dummy pseudo-reg and discard it. They may not both be zero.
1951 Returns 1 if this operation can be performed; 0 if not. */
1954 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1955 int unsignedp)
1957 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1958 enum mode_class mclass;
1959 machine_mode wider_mode;
1960 rtx_insn *entry_last = get_last_insn ();
1961 rtx_insn *last;
1963 mclass = GET_MODE_CLASS (mode);
1965 if (!targ0)
1966 targ0 = gen_reg_rtx (mode);
1967 if (!targ1)
1968 targ1 = gen_reg_rtx (mode);
1970 /* Record where to go back to if we fail. */
1971 last = get_last_insn ();
1973 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1975 struct expand_operand ops[3];
1976 enum insn_code icode = optab_handler (unoptab, mode);
1978 create_fixed_operand (&ops[0], targ0);
1979 create_fixed_operand (&ops[1], targ1);
1980 create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1981 if (maybe_expand_insn (icode, 3, ops))
1982 return 1;
1985 /* It can't be done in this mode. Can we do it in a wider mode? */
1987 if (CLASS_HAS_WIDER_MODES_P (mclass))
1989 FOR_EACH_WIDER_MODE (wider_mode, mode)
1991 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
1993 rtx t0 = gen_reg_rtx (wider_mode);
1994 rtx t1 = gen_reg_rtx (wider_mode);
1995 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
1997 if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
1999 convert_move (targ0, t0, unsignedp);
2000 convert_move (targ1, t1, unsignedp);
2001 return 1;
2003 else
2004 delete_insns_since (last);
2009 delete_insns_since (entry_last);
2010 return 0;
2013 /* Generate code to perform an operation specified by BINOPTAB
2014 on operands OP0 and OP1, with two results to TARG0 and TARG1.
2015 We assume that the order of the operands for the instruction
2016 is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2017 [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2019 Either TARG0 or TARG1 may be zero, but what that means is that
2020 the result is not actually wanted. We will generate it into
2021 a dummy pseudo-reg and discard it. They may not both be zero.
2023 Returns 1 if this operation can be performed; 0 if not. */
2026 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2027 int unsignedp)
2029 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2030 enum mode_class mclass;
2031 machine_mode wider_mode;
2032 rtx_insn *entry_last = get_last_insn ();
2033 rtx_insn *last;
2035 mclass = GET_MODE_CLASS (mode);
2037 if (!targ0)
2038 targ0 = gen_reg_rtx (mode);
2039 if (!targ1)
2040 targ1 = gen_reg_rtx (mode);
2042 /* Record where to go back to if we fail. */
2043 last = get_last_insn ();
2045 if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2047 struct expand_operand ops[4];
2048 enum insn_code icode = optab_handler (binoptab, mode);
2049 machine_mode mode0 = insn_data[icode].operand[1].mode;
2050 machine_mode mode1 = insn_data[icode].operand[2].mode;
2051 rtx xop0 = op0, xop1 = op1;
2053 /* If we are optimizing, force expensive constants into a register. */
2054 xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2055 xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2057 create_fixed_operand (&ops[0], targ0);
2058 create_convert_operand_from (&ops[1], xop0, mode, unsignedp);
2059 create_convert_operand_from (&ops[2], xop1, mode, unsignedp);
2060 create_fixed_operand (&ops[3], targ1);
2061 if (maybe_expand_insn (icode, 4, ops))
2062 return 1;
2063 delete_insns_since (last);
2066 /* It can't be done in this mode. Can we do it in a wider mode? */
2068 if (CLASS_HAS_WIDER_MODES_P (mclass))
2070 FOR_EACH_WIDER_MODE (wider_mode, mode)
2072 if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2074 rtx t0 = gen_reg_rtx (wider_mode);
2075 rtx t1 = gen_reg_rtx (wider_mode);
2076 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2077 rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2079 if (expand_twoval_binop (binoptab, cop0, cop1,
2080 t0, t1, unsignedp))
2082 convert_move (targ0, t0, unsignedp);
2083 convert_move (targ1, t1, unsignedp);
2084 return 1;
2086 else
2087 delete_insns_since (last);
2092 delete_insns_since (entry_last);
2093 return 0;
2096 /* Expand the two-valued library call indicated by BINOPTAB, but
2097 preserve only one of the values. If TARG0 is non-NULL, the first
2098 value is placed into TARG0; otherwise the second value is placed
2099 into TARG1. Exactly one of TARG0 and TARG1 must be non-NULL. The
2100 value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2101 This routine assumes that the value returned by the library call is
2102 as if it were of an integral mode twice as wide as the
2103 mode of OP0. Returns true if the call was successful. */
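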
2105 bool
2106 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2107 rtx targ0, rtx targ1, enum rtx_code code)
2109 machine_mode mode;
2110 machine_mode libval_mode;
2111 rtx libval;
2112 rtx_insn *insns;
2113 rtx libfunc;
2115 /* Exactly one of TARG0 or TARG1 should be non-NULL. */
2116 gcc_assert (!targ0 != !targ1);
2118 mode = GET_MODE (op0);
2119 libfunc = optab_libfunc (binoptab, mode);
2120 if (!libfunc)
2121 return false;
2123 /* The value returned by the library function will have twice as
2124 many bits as the nominal MODE. */
2125 libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2126 start_sequence ();
2127 libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2128 libval_mode,
2129 op0, mode,
2130 op1, mode);
2131 /* Get the part of LIBVAL containing the value that we want. */
2132 libval = simplify_gen_subreg (mode, libval, libval_mode,
2133 targ0 ? 0 : GET_MODE_SIZE (mode));
2134 insns = get_insns ();
2135 end_sequence ();
2136 /* Move the result into the desired location. */
2137 emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2138 gen_rtx_fmt_ee (code, mode, op0, op1));
2140 return true;
2144 /* Wrapper around expand_unop which takes an rtx code to specify
2145 the operation to perform, not an optab pointer. All other
2146 arguments are the same. */
2148 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2149 rtx target, int unsignedp)
2151 optab unop = code_to_optab (code);
2152 gcc_assert (unop);
2154 return expand_unop (mode, unop, op0, target, unsignedp);
2157 /* Try calculating
2158 (clz:narrow x)
2160 (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2162 A similar operation can be used for clrsb. UNOPTAB says which operation
2163 we are trying to expand. */
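/* [Editorial example.] Zero-extension contributes exactly
   (width wide) - (width narrow) extra leading zeros, so e.g.

     clz16 (x) == clz32 ((uint32_t) x) - 16       for x != 0.

   For clrsb the operand is sign-extended instead (note the
   unoptab != clrsb_optab arguments below), which adds the same
   constant number of redundant sign bits. */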
2164 static rtx
2165 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2167 opt_scalar_int_mode wider_mode_iter;
2168 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2170 scalar_int_mode wider_mode = wider_mode_iter.require ();
2171 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2173 rtx xop0, temp;
2174 rtx_insn *last;
2176 last = get_last_insn ();
2178 if (target == 0)
2179 target = gen_reg_rtx (mode);
2180 xop0 = widen_operand (op0, wider_mode, mode,
2181 unoptab != clrsb_optab, false);
2182 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2183 unoptab != clrsb_optab);
2184 if (temp != 0)
2185 temp = expand_binop
2186 (wider_mode, sub_optab, temp,
2187 gen_int_mode (GET_MODE_PRECISION (wider_mode)
2188 - GET_MODE_PRECISION (mode),
2189 wider_mode),
2190 target, true, OPTAB_DIRECT);
2191 if (temp == 0)
2192 delete_insns_since (last);
2194 return temp;
2197 return 0;
2200 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2201 quantities, choosing which based on whether the high word is nonzero. */
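/* [Editorial sketch of the generated control flow.] For a 64-bit
   value split into 32-bit words this computes

     clz64 (x) = (hi != 0) ? clz32 (hi) : 32 + clz32 (lo)

   via the compare-and-jump over hi0_label below. */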
2202 static rtx
2203 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2205 rtx xop0 = force_reg (mode, op0);
2206 rtx subhi = gen_highpart (word_mode, xop0);
2207 rtx sublo = gen_lowpart (word_mode, xop0);
2208 rtx_code_label *hi0_label = gen_label_rtx ();
2209 rtx_code_label *after_label = gen_label_rtx ();
2210 rtx_insn *seq;
2211 rtx temp, result;
2213 /* If we were not given a target, use a word_mode register, not a
2214 'mode' register. The result will fit, and nobody is expecting
2215 anything bigger (the return type of __builtin_clz* is int). */
2216 if (!target)
2217 target = gen_reg_rtx (word_mode);
2219 /* In any case, write to a word_mode scratch in both branches of the
2220 conditional, so we can ensure there is a single move insn setting
2221 'target' to tag a REG_EQUAL note on. */
2222 result = gen_reg_rtx (word_mode);
2224 start_sequence ();
2226 /* If the high word is not equal to zero,
2227 then clz of the full value is clz of the high word. */
2228 emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2229 word_mode, true, hi0_label);
2231 temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2232 if (!temp)
2233 goto fail;
2235 if (temp != result)
2236 convert_move (result, temp, true);
2238 emit_jump_insn (targetm.gen_jump (after_label));
2239 emit_barrier ();
2241 /* Else clz of the full value is clz of the low word plus the number
2242 of bits in the high word. */
2243 emit_label (hi0_label);
2245 temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2246 if (!temp)
2247 goto fail;
2248 temp = expand_binop (word_mode, add_optab, temp,
2249 gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2250 result, true, OPTAB_DIRECT);
2251 if (!temp)
2252 goto fail;
2253 if (temp != result)
2254 convert_move (result, temp, true);
2256 emit_label (after_label);
2257 convert_move (target, result, true);
2259 seq = get_insns ();
2260 end_sequence ();
2262 add_equal_note (seq, target, CLZ, xop0, 0);
2263 emit_insn (seq);
2264 return target;
2266 fail:
2267 end_sequence ();
2268 return 0;
2271 /* Try calculating popcount of a double-word quantity as two popcount's of
2272 word-sized quantities and summing up the results. */
2273 static rtx
2274 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2276 rtx t0, t1, t;
2277 rtx_insn *seq;
2279 start_sequence ();
2281 t0 = expand_unop_direct (word_mode, popcount_optab,
2282 operand_subword_force (op0, 0, mode), NULL_RTX,
2283 true);
2284 t1 = expand_unop_direct (word_mode, popcount_optab,
2285 operand_subword_force (op0, 1, mode), NULL_RTX,
2286 true);
2287 if (!t0 || !t1)
2289 end_sequence ();
2290 return NULL_RTX;
2293 /* If we were not given a target, use a word_mode register, not a
2294 'mode' register. The result will fit, and nobody is expecting
2295 anything bigger (the return type of __builtin_popcount* is int). */
2296 if (!target)
2297 target = gen_reg_rtx (word_mode);
2299 t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2301 seq = get_insns ();
2302 end_sequence ();
2304 add_equal_note (seq, t, POPCOUNT, op0, 0);
2305 emit_insn (seq);
2306 return t;
2309 /* Try calculating
2310 (parity:wide x)
2312 (parity:narrow (low (x) ^ high (x))) */
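/* [Editorial note.] Parity is the XOR of all bits, and XOR-folding
   the two halves preserves it:

     parity64 (x) == parity32 ((uint32_t) x ^ (uint32_t) (x >> 32)). */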
2313 static rtx
2314 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2316 rtx t = expand_binop (word_mode, xor_optab,
2317 operand_subword_force (op0, 0, mode),
2318 operand_subword_force (op0, 1, mode),
2319 NULL_RTX, 0, OPTAB_DIRECT);
2320 return expand_unop (word_mode, parity_optab, t, target, true);
2323 /* Try calculating
2324 (bswap:narrow x)
2326 (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))). */
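/* [Editorial example.] For a HImode bswap performed in SImode:

     bswap32 (0x0000ABCD) == 0xCDAB0000, and the logical right shift
     by 32 - 16 == 16 gives 0x0000CDAB == bswap16 (0xABCD).

   The zero-extension bytes land in the half that the shift discards. */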
2327 static rtx
2328 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2330 rtx x;
2331 rtx_insn *last;
2332 opt_scalar_int_mode wider_mode_iter;
2334 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2335 if (optab_handler (bswap_optab, wider_mode_iter.require ())
2336 != CODE_FOR_nothing)
2337 break;
2339 if (!wider_mode_iter.exists ())
2340 return NULL_RTX;
2342 scalar_int_mode wider_mode = wider_mode_iter.require ();
2343 last = get_last_insn ();
2345 x = widen_operand (op0, wider_mode, mode, true, true);
2346 x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2348 gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2349 && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2350 if (x != 0)
2351 x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2352 GET_MODE_BITSIZE (wider_mode)
2353 - GET_MODE_BITSIZE (mode),
2354 NULL_RTX, true);
2356 if (x != 0)
2358 if (target == 0)
2359 target = gen_reg_rtx (mode);
2360 emit_move_insn (target, gen_lowpart (mode, x));
2362 else
2363 delete_insns_since (last);
2365 return target;
2368 /* Try calculating bswap as two bswaps of two word-sized operands. */
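/* [Editorial note.] Byte-reversing a double word reverses each word
   and exchanges the two words:

     bswap64 (x) == ((uint64_t) bswap32 ((uint32_t) x) << 32)
                    | bswap32 ((uint32_t) (x >> 32))

   which is why the value swapped from subword 0 is stored into
   subword 1 of the target below, and vice versa. */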
2370 static rtx
2371 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2373 rtx t0, t1;
2375 t1 = expand_unop (word_mode, bswap_optab,
2376 operand_subword_force (op, 0, mode), NULL_RTX, true);
2377 t0 = expand_unop (word_mode, bswap_optab,
2378 operand_subword_force (op, 1, mode), NULL_RTX, true);
2380 if (target == 0 || !valid_multiword_target_p (target))
2381 target = gen_reg_rtx (mode);
2382 if (REG_P (target))
2383 emit_clobber (target);
2384 emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2385 emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2387 return target;
2390 /* Try calculating (parity x) as (and (popcount x) 1), where
2391 popcount can also be done in a wider mode. */
2392 static rtx
2393 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2395 enum mode_class mclass = GET_MODE_CLASS (mode);
2396 opt_scalar_int_mode wider_mode_iter;
2397 FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2399 scalar_int_mode wider_mode = wider_mode_iter.require ();
2400 if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2402 rtx xop0, temp;
2403 rtx_insn *last;
2405 last = get_last_insn ();
2407 if (target == 0 || GET_MODE (target) != wider_mode)
2408 target = gen_reg_rtx (wider_mode);
2410 xop0 = widen_operand (op0, wider_mode, mode, true, false);
2411 temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2412 true);
2413 if (temp != 0)
2414 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2415 target, true, OPTAB_DIRECT);
2417 if (temp)
2419 if (mclass != MODE_INT
2420 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2421 return convert_to_mode (mode, temp, 0);
2422 else
2423 return gen_lowpart (mode, temp);
2425 else
2426 delete_insns_since (last);
2429 return 0;
2432 /* Try calculating ctz(x) as K - clz(x & -x),
2433 where K is GET_MODE_PRECISION(mode) - 1.
2435 Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2436 don't have to worry about what the hardware does in that case. (If
2437 the clz instruction produces the usual value at 0, which is K, the
2438 result of this code sequence will be -1; expand_ffs, below, relies
2439 on this. It might be nice to have it be K instead, for consistency
2440 with the (very few) processors that provide a ctz with a defined
2441 value, but that would take one more instruction, and it would be
2442 less convenient for expand_ffs anyway.) */
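/* [Editorial worked example, W == 32, so K == 31.] x & -x isolates
   the lowest set bit, say bit k, so clz (x & -x) == 31 - k and
   K - clz (x & -x) == k == ctz (x). E.g. x == 0x18: x & -x == 0x08,
   clz == 28, and 31 - 28 == 3. */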
2444 static rtx
2445 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2447 rtx_insn *seq;
2448 rtx temp;
2450 if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2451 return 0;
2453 start_sequence ();
2455 temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2456 if (temp)
2457 temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2458 true, OPTAB_DIRECT);
2459 if (temp)
2460 temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2461 if (temp)
2462 temp = expand_binop (mode, sub_optab,
2463 gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2464 temp, target,
2465 true, OPTAB_DIRECT);
2466 if (temp == 0)
2468 end_sequence ();
2469 return 0;
2472 seq = get_insns ();
2473 end_sequence ();
2475 add_equal_note (seq, temp, CTZ, op0, 0);
2476 emit_insn (seq);
2477 return temp;
2481 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2482 else with the sequence used by expand_clz.
2484 The ffs builtin promises to return zero for a zero value and ctz/clz
2485 may have an undefined value in that case. If they do not give us a
2486 convenient value, we have to generate a test and branch. */
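/* [Editorial note.] The underlying identity is ffs (x) == ctz (x) + 1
   for x != 0, with ffs (0) == 0 by definition. A ctz that happens to
   yield -1 at zero therefore needs no fixup: the final "+ 1" already
   maps it to 0, which is the defined_at_zero && val == -1 fast path
   below. */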
2487 static rtx
2488 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2490 HOST_WIDE_INT val = 0;
2491 bool defined_at_zero = false;
2492 rtx temp;
2493 rtx_insn *seq;
2495 if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2497 start_sequence ();
2499 temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2500 if (!temp)
2501 goto fail;
2503 defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2505 else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2507 start_sequence ();
2508 temp = expand_ctz (mode, op0, 0);
2509 if (!temp)
2510 goto fail;
2512 if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2514 defined_at_zero = true;
2515 val = (GET_MODE_PRECISION (mode) - 1) - val;
2518 else
2519 return 0;
2521 if (defined_at_zero && val == -1)
2522 /* No correction needed at zero. */;
2523 else
2525 /* We don't try to do anything clever with the situation found
2526 on some processors (e.g. Alpha) where ctz(0:mode) ==
2527 bitsize(mode). If someone can think of a way to send N to -1
2528 and leave alone all values in the range 0..N-1 (where N is a
2529 power of two), cheaper than this test-and-branch, please add it.
2531 The test-and-branch is done after the operation itself, in case
2532 the operation sets condition codes that can be recycled for this.
2533 (This is true on i386, for instance.) */
2535 rtx_code_label *nonzero_label = gen_label_rtx ();
2536 emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2537 mode, true, nonzero_label);
2539 convert_move (temp, GEN_INT (-1), false);
2540 emit_label (nonzero_label);
2543 /* temp now has a value in the range -1..bitsize-1. ffs is supposed
2544 to produce a value in the range 0..bitsize. */
2545 temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2546 target, false, OPTAB_DIRECT);
2547 if (!temp)
2548 goto fail;
2550 seq = get_insns ();
2551 end_sequence ();
2553 add_equal_note (seq, temp, FFS, op0, 0);
2554 emit_insn (seq);
2555 return temp;
2557 fail:
2558 end_sequence ();
2559 return 0;
2562 /* Extract the OMODE lowpart from VAL, which has IMODE. Under certain
2563 conditions, VAL may already be a SUBREG against which we cannot generate
2564 a further SUBREG. In this case, we expect forcing the value into a
2565 register will work around the situation. */
2567 static rtx
2568 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2569 machine_mode imode)
2571 rtx ret;
2572 ret = lowpart_subreg (omode, val, imode);
2573 if (ret == NULL)
2575 val = force_reg (imode, val);
2576 ret = lowpart_subreg (omode, val, imode);
2577 gcc_assert (ret != NULL);
2579 return ret;
2582 /* Expand a floating point absolute value or negation operation via a
2583 logical operation on the sign bit. */
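/* [Editorial example for IEEE binary32, where the sign is bit 31.]

     neg (x): bits (x) ^ 0x80000000         flip the sign bit
     abs (x): bits (x) & 0x7fffffff         clear the sign bit

   The mask built from fmt->signbit_rw below generalizes this to any
   format with a simple sign bit, including multiword modes. */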
2585 static rtx
2586 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2587 rtx op0, rtx target)
2589 const struct real_format *fmt;
2590 int bitpos, word, nwords, i;
2591 scalar_int_mode imode;
2592 rtx temp;
2593 rtx_insn *insns;
2595 /* The format has to have a simple sign bit. */
2596 fmt = REAL_MODE_FORMAT (mode);
2597 if (fmt == NULL)
2598 return NULL_RTX;
2600 bitpos = fmt->signbit_rw;
2601 if (bitpos < 0)
2602 return NULL_RTX;
2604 /* Don't create negative zeros if the format doesn't support them. */
2605 if (code == NEG && !fmt->has_signed_zero)
2606 return NULL_RTX;
2608 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2610 if (!int_mode_for_mode (mode).exists (&imode))
2611 return NULL_RTX;
2612 word = 0;
2613 nwords = 1;
2615 else
2617 imode = word_mode;
2619 if (FLOAT_WORDS_BIG_ENDIAN)
2620 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2621 else
2622 word = bitpos / BITS_PER_WORD;
2623 bitpos = bitpos % BITS_PER_WORD;
2624 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2627 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2628 if (code == ABS)
2629 mask = ~mask;
2631 if (target == 0
2632 || target == op0
2633 || (nwords > 1 && !valid_multiword_target_p (target)))
2634 target = gen_reg_rtx (mode);
2636 if (nwords > 1)
2638 start_sequence ();
2640 for (i = 0; i < nwords; ++i)
2642 rtx targ_piece = operand_subword (target, i, 1, mode);
2643 rtx op0_piece = operand_subword_force (op0, i, mode);
2645 if (i == word)
2647 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2648 op0_piece,
2649 immed_wide_int_const (mask, imode),
2650 targ_piece, 1, OPTAB_LIB_WIDEN);
2651 if (temp != targ_piece)
2652 emit_move_insn (targ_piece, temp);
2654 else
2655 emit_move_insn (targ_piece, op0_piece);
2658 insns = get_insns ();
2659 end_sequence ();
2661 emit_insn (insns);
2663 else
2665 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2666 gen_lowpart (imode, op0),
2667 immed_wide_int_const (mask, imode),
2668 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2669 target = lowpart_subreg_maybe_copy (mode, temp, imode);
2671 set_dst_reg_note (get_last_insn (), REG_EQUAL,
2672 gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2673 target);
2676 return target;
2679 /* As expand_unop, but will fail rather than attempt the operation in a
2680 different mode or with a libcall. */
2681 static rtx
2682 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2683 int unsignedp)
2685 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2687 struct expand_operand ops[2];
2688 enum insn_code icode = optab_handler (unoptab, mode);
2689 rtx_insn *last = get_last_insn ();
2690 rtx_insn *pat;
2692 create_output_operand (&ops[0], target, mode);
2693 create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2694 pat = maybe_gen_insn (icode, 2, ops);
2695 if (pat)
2697 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2698 && ! add_equal_note (pat, ops[0].value,
2699 optab_to_code (unoptab),
2700 ops[1].value, NULL_RTX))
2702 delete_insns_since (last);
2703 return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2706 emit_insn (pat);
2708 return ops[0].value;
2711 return 0;
2714 /* Generate code to perform an operation specified by UNOPTAB
2715 on operand OP0, with result having machine-mode MODE.
2717 UNSIGNEDP is for the case where we have to widen the operands
2718 to perform the operation. It says to use zero-extension.
2720 If TARGET is nonzero, the value
2721 is generated there, if it is convenient to do so.
2722 In all cases an rtx is returned for the locus of the value;
2723 this may or may not be TARGET. */
2726 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2727 int unsignedp)
2729 enum mode_class mclass = GET_MODE_CLASS (mode);
2730 machine_mode wider_mode;
2731 scalar_int_mode int_mode;
2732 scalar_float_mode float_mode;
2733 rtx temp;
2734 rtx libfunc;
2736 temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2737 if (temp)
2738 return temp;
2740 /* It can't be done in this mode. Can we open-code it in a wider mode? */
2742 /* Widening (or narrowing) clz needs special treatment. */
2743 if (unoptab == clz_optab)
2745 if (is_a <scalar_int_mode> (mode, &int_mode))
2747 temp = widen_leading (int_mode, op0, target, unoptab);
2748 if (temp)
2749 return temp;
2751 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2752 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2754 temp = expand_doubleword_clz (int_mode, op0, target);
2755 if (temp)
2756 return temp;
2760 goto try_libcall;
2763 if (unoptab == clrsb_optab)
2765 if (is_a <scalar_int_mode> (mode, &int_mode))
2767 temp = widen_leading (int_mode, op0, target, unoptab);
2768 if (temp)
2769 return temp;
2771 goto try_libcall;
2774 if (unoptab == popcount_optab
2775 && is_a <scalar_int_mode> (mode, &int_mode)
2776 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2777 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2778 && optimize_insn_for_speed_p ())
2780 temp = expand_doubleword_popcount (int_mode, op0, target);
2781 if (temp)
2782 return temp;
2785 if (unoptab == parity_optab
2786 && is_a <scalar_int_mode> (mode, &int_mode)
2787 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2788 && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2789 || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2790 && optimize_insn_for_speed_p ())
2792 temp = expand_doubleword_parity (int_mode, op0, target);
2793 if (temp)
2794 return temp;
2797 /* Widening (or narrowing) bswap needs special treatment. */
2798 if (unoptab == bswap_optab)
2800 /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2801 or ROTATERT. First try these directly; if this fails, then try the
2802 obvious pair of shifts with allowed widening, as this will probably
2803 always be more efficient than the other fallback methods. */
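/* [Editorial example.] Rotating 0xABCD by 8 bits in HImode in either
   direction yields 0xCDAB, i.e. the byte swap; the shift fallback
   builds the same value as (x << 8) | (x >> 8), each shift done with
   widening allowed. */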
2804 if (mode == HImode)
2806 rtx_insn *last;
2807 rtx temp1, temp2;
2809 if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2811 temp = expand_binop (mode, rotl_optab, op0,
2812 gen_int_shift_amount (mode, 8),
2813 target, unsignedp, OPTAB_DIRECT);
2814 if (temp)
2815 return temp;
2818 if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2820 temp = expand_binop (mode, rotr_optab, op0,
2821 gen_int_shift_amount (mode, 8),
2822 target, unsignedp, OPTAB_DIRECT);
2823 if (temp)
2824 return temp;
2827 last = get_last_insn ();
2829 temp1 = expand_binop (mode, ashl_optab, op0,
2830 gen_int_shift_amount (mode, 8), NULL_RTX,
2831 unsignedp, OPTAB_WIDEN);
2832 temp2 = expand_binop (mode, lshr_optab, op0,
2833 gen_int_shift_amount (mode, 8), NULL_RTX,
2834 unsignedp, OPTAB_WIDEN);
2835 if (temp1 && temp2)
2837 temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2838 unsignedp, OPTAB_WIDEN);
2839 if (temp)
2840 return temp;
2843 delete_insns_since (last);
2846 if (is_a <scalar_int_mode> (mode, &int_mode))
2848 temp = widen_bswap (int_mode, op0, target);
2849 if (temp)
2850 return temp;
2852 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2853 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2855 temp = expand_doubleword_bswap (mode, op0, target);
2856 if (temp)
2857 return temp;
2861 goto try_libcall;
2864 if (CLASS_HAS_WIDER_MODES_P (mclass))
2865 FOR_EACH_WIDER_MODE (wider_mode, mode)
2867 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2869 rtx xop0 = op0;
2870 rtx_insn *last = get_last_insn ();
2872 /* For certain operations, we need not actually extend
2873 the narrow operand, as long as we will truncate the
2874 results to the same narrowness. */
2876 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2877 (unoptab == neg_optab
2878 || unoptab == one_cmpl_optab)
2879 && mclass == MODE_INT);
2881 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2882 unsignedp);
2884 if (temp)
2886 if (mclass != MODE_INT
2887 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2889 if (target == 0)
2890 target = gen_reg_rtx (mode);
2891 convert_move (target, temp, 0);
2892 return target;
2894 else
2895 return gen_lowpart (mode, temp);
2897 else
2898 delete_insns_since (last);
2902 /* These can be done a word at a time. */
2903 if (unoptab == one_cmpl_optab
2904 && is_int_mode (mode, &int_mode)
2905 && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2906 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2908 int i;
2909 rtx_insn *insns;
2911 if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2912 target = gen_reg_rtx (int_mode);
2914 start_sequence ();
2916 /* Do the actual arithmetic. */
2917 for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2919 rtx target_piece = operand_subword (target, i, 1, int_mode);
2920 rtx x = expand_unop (word_mode, unoptab,
2921 operand_subword_force (op0, i, int_mode),
2922 target_piece, unsignedp);
2924 if (target_piece != x)
2925 emit_move_insn (target_piece, x);
2928 insns = get_insns ();
2929 end_sequence ();
2931 emit_insn (insns);
2932 return target;
2935 if (optab_to_code (unoptab) == NEG)
2937 /* Try negating floating point values by flipping the sign bit. */
2938 if (is_a <scalar_float_mode> (mode, &float_mode))
2940 temp = expand_absneg_bit (NEG, float_mode, op0, target);
2941 if (temp)
2942 return temp;
2945 /* If there is no negation pattern, and we have no negative zero,
2946 try subtracting from zero. */
2947 if (!HONOR_SIGNED_ZEROS (mode))
2949 temp = expand_binop (mode, (unoptab == negv_optab
2950 ? subv_optab : sub_optab),
2951 CONST0_RTX (mode), op0, target,
2952 unsignedp, OPTAB_DIRECT);
2953 if (temp)
2954 return temp;
2958 /* Try calculating parity (x) as popcount (x) % 2. */
2959 if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2961 temp = expand_parity (int_mode, op0, target);
2962 if (temp)
2963 return temp;
2966 /* Try implementing ffs (x) in terms of clz (x). */
2967 if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2969 temp = expand_ffs (int_mode, op0, target);
2970 if (temp)
2971 return temp;
2974 /* Try implementing ctz (x) in terms of clz (x). */
2975 if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2977 temp = expand_ctz (int_mode, op0, target);
2978 if (temp)
2979 return temp;
2982 try_libcall:
2983 /* Now try a library call in this mode. */
2984 libfunc = optab_libfunc (unoptab, mode);
2985 if (libfunc)
2987 rtx_insn *insns;
2988 rtx value;
2989 rtx eq_value;
2990 machine_mode outmode = mode;
2992 /* All of these functions return small values. Thus we choose to
2993 have them return something that isn't a double-word. */
2994 if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
2995 || unoptab == clrsb_optab || unoptab == popcount_optab
2996 || unoptab == parity_optab)
2997 outmode
2998 = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
2999 optab_libfunc (unoptab, mode)));
3001 start_sequence ();
3003 /* Pass 1 for NO_QUEUE so we don't lose any increments
3004 if the libcall is cse'd or moved. */
3005 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3006 op0, mode);
3007 insns = get_insns ();
3008 end_sequence ();
3010 target = gen_reg_rtx (outmode);
3011 bool trapv = trapv_unoptab_p (unoptab);
3012 if (trapv)
3013 eq_value = NULL_RTX;
3014 else
3016 eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3017 if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3018 eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3019 else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3020 eq_value = simplify_gen_unary (ZERO_EXTEND,
3021 outmode, eq_value, mode);
3023 emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3025 return target;
3028 /* It can't be done in this mode. Can we do it in a wider mode? */
3030 if (CLASS_HAS_WIDER_MODES_P (mclass))
3032 FOR_EACH_WIDER_MODE (wider_mode, mode)
3034 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3035 || optab_libfunc (unoptab, wider_mode))
3037 rtx xop0 = op0;
3038 rtx_insn *last = get_last_insn ();
3040 /* For certain operations, we need not actually extend
3041 the narrow operand, as long as we will truncate the
3042 results to the same narrowness. */
3043 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3044 (unoptab == neg_optab
3045 || unoptab == one_cmpl_optab
3046 || unoptab == bswap_optab)
3047 && mclass == MODE_INT);
3049 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3050 unsignedp);
3052 /* If we are generating clz using wider mode, adjust the
3053 result. Similarly for clrsb. */
3054 if ((unoptab == clz_optab || unoptab == clrsb_optab)
3055 && temp != 0)
3057 scalar_int_mode wider_int_mode
3058 = as_a <scalar_int_mode> (wider_mode);
3059 int_mode = as_a <scalar_int_mode> (mode);
3060 temp = expand_binop
3061 (wider_mode, sub_optab, temp,
3062 gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3063 - GET_MODE_PRECISION (int_mode),
3064 wider_int_mode),
3065 target, true, OPTAB_DIRECT);
3068 /* Likewise for bswap. */
3069 if (unoptab == bswap_optab && temp != 0)
3071 scalar_int_mode wider_int_mode
3072 = as_a <scalar_int_mode> (wider_mode);
3073 int_mode = as_a <scalar_int_mode> (mode);
3074 gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3075 == GET_MODE_BITSIZE (wider_int_mode)
3076 && GET_MODE_PRECISION (int_mode)
3077 == GET_MODE_BITSIZE (int_mode));
3079 temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3080 GET_MODE_BITSIZE (wider_int_mode)
3081 - GET_MODE_BITSIZE (int_mode),
3082 NULL_RTX, true);
3085 if (temp)
3087 if (mclass != MODE_INT)
3089 if (target == 0)
3090 target = gen_reg_rtx (mode);
3091 convert_move (target, temp, 0);
3092 return target;
3094 else
3095 return gen_lowpart (mode, temp);
3097 else
3098 delete_insns_since (last);
3103 /* One final attempt at implementing negation via subtraction,
3104 this time allowing widening of the operand. */
3105 if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3107 rtx temp;
3108 temp = expand_binop (mode,
3109 unoptab == negv_optab ? subv_optab : sub_optab,
3110 CONST0_RTX (mode), op0,
3111 target, unsignedp, OPTAB_LIB_WIDEN);
3112 if (temp)
3113 return temp;
3116 return 0;
3119 /* Emit code to compute the absolute value of OP0, with result to
3120 TARGET if convenient. (TARGET may be 0.) The return value says
3121 where the result actually is to be found.
3123 MODE is the mode of the operand; the mode of the result is
3124 different but can be deduced from MODE.
3129 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3130 int result_unsignedp)
3132 rtx temp;
3134 if (GET_MODE_CLASS (mode) != MODE_INT
3135 || ! flag_trapv)
3136 result_unsignedp = 1;
3138 /* First try to do it with a special abs instruction. */
3139 temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3140 op0, target, 0);
3141 if (temp != 0)
3142 return temp;
3144 /* For floating point modes, try clearing the sign bit. */
3145 scalar_float_mode float_mode;
3146 if (is_a <scalar_float_mode> (mode, &float_mode))
3148 temp = expand_absneg_bit (ABS, float_mode, op0, target);
3149 if (temp)
3150 return temp;
3153 /* If we have a MAX insn, we can do this as MAX (x, -x). */
3154 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3155 && !HONOR_SIGNED_ZEROS (mode))
3157 rtx_insn *last = get_last_insn ();
3159 temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3160 op0, NULL_RTX, 0);
3161 if (temp != 0)
3162 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3163 OPTAB_WIDEN);
3165 if (temp != 0)
3166 return temp;
3168 delete_insns_since (last);
3171 /* If this machine has expensive jumps, we can do integer absolute
3172 value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3173 where W is the width of MODE. */
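/* [Editorial worked example, W == 32, x == -5.] The arithmetic shift
   gives s == x >> 31 == -1 (all ones), so (x ^ s) == 4 and
   4 - s == 5 == abs (-5). For x >= 0, s == 0 and both steps are the
   identity. */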
3175 scalar_int_mode int_mode;
3176 if (is_int_mode (mode, &int_mode)
3177 && BRANCH_COST (optimize_insn_for_speed_p (),
3178 false) >= 2)
3180 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3181 GET_MODE_PRECISION (int_mode) - 1,
3182 NULL_RTX, 0);
3184 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3185 OPTAB_LIB_WIDEN);
3186 if (temp != 0)
3187 temp = expand_binop (int_mode,
3188 result_unsignedp ? sub_optab : subv_optab,
3189 temp, extended, target, 0, OPTAB_LIB_WIDEN);
3191 if (temp != 0)
3192 return temp;
3195 return NULL_RTX;
3199 expand_abs (machine_mode mode, rtx op0, rtx target,
3200 int result_unsignedp, int safe)
3202 rtx temp;
3203 rtx_code_label *op1;
3205 if (GET_MODE_CLASS (mode) != MODE_INT
3206 || ! flag_trapv)
3207 result_unsignedp = 1;
3209 temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3210 if (temp != 0)
3211 return temp;
3213 /* If that does not win, use conditional jump and negate. */
3215 /* It is safe to use the target if it is the same
3216 as the source, provided it is also a pseudo register. */
3217 if (op0 == target && REG_P (op0)
3218 && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3219 safe = 1;
3221 op1 = gen_label_rtx ();
3222 if (target == 0 || ! safe
3223 || GET_MODE (target) != mode
3224 || (MEM_P (target) && MEM_VOLATILE_P (target))
3225 || (REG_P (target)
3226 && REGNO (target) < FIRST_PSEUDO_REGISTER))
3227 target = gen_reg_rtx (mode);
3229 emit_move_insn (target, op0);
3230 NO_DEFER_POP;
3232 do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3233 NULL_RTX, NULL, op1,
3234 profile_probability::uninitialized ());
3236 op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3237 target, target, 0);
3238 if (op0 != target)
3239 emit_move_insn (target, op0);
3240 emit_label (op1);
3241 OK_DEFER_POP;
3242 return target;
3245 /* Emit code to compute the one's complement absolute value of OP0
3246 (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3247 (TARGET may be NULL_RTX.) The return value says where the result
3248 actually is to be found.
3250 MODE is the mode of the operand; the mode of the result is
3251 different but can be deduced from MODE. */
3254 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3256 rtx temp;
3258 /* Not applicable for floating point modes. */
3259 if (FLOAT_MODE_P (mode))
3260 return NULL_RTX;
3262 /* If we have a MAX insn, we can do this as MAX (x, ~x). */
3263 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3265 rtx_insn *last = get_last_insn ();
3267 temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3268 if (temp != 0)
3269 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3270 OPTAB_WIDEN);
3272 if (temp != 0)
3273 return temp;
3275 delete_insns_since (last);
3278 /* If this machine has expensive jumps, we can do one's complement
3279 absolute value of X as (((signed) x >> (W-1)) ^ x). */
3281 scalar_int_mode int_mode;
3282 if (is_int_mode (mode, &int_mode)
3283 && BRANCH_COST (optimize_insn_for_speed_p (),
3284 false) >= 2)
3286 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3287 GET_MODE_PRECISION (int_mode) - 1,
3288 NULL_RTX, 0);
3290 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3291 OPTAB_LIB_WIDEN);
3293 if (temp != 0)
3294 return temp;
3297 return NULL_RTX;
3300 /* A subroutine of expand_copysign, perform the copysign operation using the
3301 abs and neg primitives advertised to exist on the target. The assumption
3302 is that we have a split register file, and leaving op0 in fp registers,
3303 and not playing with subregs so much, will help the register allocator. */
3305 static rtx
3306 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3307 int bitpos, bool op0_is_abs)
3309 scalar_int_mode imode;
3310 enum insn_code icode;
3311 rtx sign;
3312 rtx_code_label *label;
3314 if (target == op1)
3315 target = NULL_RTX;
3317 /* Check if the back end provides an insn that handles signbit for the
3318 argument's mode. */
3319 icode = optab_handler (signbit_optab, mode);
3320 if (icode != CODE_FOR_nothing)
3322 imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3323 sign = gen_reg_rtx (imode);
3324 emit_unop_insn (icode, sign, op1, UNKNOWN);
3326 else
3328 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3330 if (!int_mode_for_mode (mode).exists (&imode))
3331 return NULL_RTX;
3332 op1 = gen_lowpart (imode, op1);
3334 else
3336 int word;
3338 imode = word_mode;
3339 if (FLOAT_WORDS_BIG_ENDIAN)
3340 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3341 else
3342 word = bitpos / BITS_PER_WORD;
3343 bitpos = bitpos % BITS_PER_WORD;
3344 op1 = operand_subword_force (op1, word, mode);
3347 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3348 sign = expand_binop (imode, and_optab, op1,
3349 immed_wide_int_const (mask, imode),
3350 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3353 if (!op0_is_abs)
3355 op0 = expand_unop (mode, abs_optab, op0, target, 0);
3356 if (op0 == NULL)
3357 return NULL_RTX;
3358 target = op0;
3360 else
3362 if (target == NULL_RTX)
3363 target = copy_to_reg (op0);
3364 else
3365 emit_move_insn (target, op0);
3368 label = gen_label_rtx ();
3369 emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3371 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3372 op0 = simplify_unary_operation (NEG, mode, op0, mode);
3373 else
3374 op0 = expand_unop (mode, neg_optab, op0, target, 0);
3375 if (op0 != target)
3376 emit_move_insn (target, op0);
3378 emit_label (label);
3380 return target;
3384 /* A subroutine of expand_copysign, perform the entire copysign operation
3385 with integer bitmasks. BITPOS is the position of the sign bit; OP0_IS_ABS
3386 is true if op0 is known to have its sign bit clear. */
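/* [Editorial example for binary32, mask == 0x80000000.] The result's
   bit pattern is

     (bits (x) & 0x7fffffff) | (bits (y) & 0x80000000)

   and the AND with ~mask is skipped when OP0_IS_ABS says the sign
   bit of op0 is already clear. */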
3388 static rtx
3389 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3390 int bitpos, bool op0_is_abs)
3392 scalar_int_mode imode;
3393 int word, nwords, i;
3394 rtx temp;
3395 rtx_insn *insns;
3397 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3399 if (!int_mode_for_mode (mode).exists (&imode))
3400 return NULL_RTX;
3401 word = 0;
3402 nwords = 1;
3404 else
3406 imode = word_mode;
3408 if (FLOAT_WORDS_BIG_ENDIAN)
3409 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3410 else
3411 word = bitpos / BITS_PER_WORD;
3412 bitpos = bitpos % BITS_PER_WORD;
3413 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3416 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3418 if (target == 0
3419 || target == op0
3420 || target == op1
3421 || (nwords > 1 && !valid_multiword_target_p (target)))
3422 target = gen_reg_rtx (mode);
3424 if (nwords > 1)
3426 start_sequence ();
3428 for (i = 0; i < nwords; ++i)
3430 rtx targ_piece = operand_subword (target, i, 1, mode);
3431 rtx op0_piece = operand_subword_force (op0, i, mode);
3433 if (i == word)
3435 if (!op0_is_abs)
3436 op0_piece
3437 = expand_binop (imode, and_optab, op0_piece,
3438 immed_wide_int_const (~mask, imode),
3439 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3440 op1 = expand_binop (imode, and_optab,
3441 operand_subword_force (op1, i, mode),
3442 immed_wide_int_const (mask, imode),
3443 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3445 temp = expand_binop (imode, ior_optab, op0_piece, op1,
3446 targ_piece, 1, OPTAB_LIB_WIDEN);
3447 if (temp != targ_piece)
3448 emit_move_insn (targ_piece, temp);
3450 else
3451 emit_move_insn (targ_piece, op0_piece);
3454 insns = get_insns ();
3455 end_sequence ();
3457 emit_insn (insns);
3459 else
3461 op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3462 immed_wide_int_const (mask, imode),
3463 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3465 op0 = gen_lowpart (imode, op0);
3466 if (!op0_is_abs)
3467 op0 = expand_binop (imode, and_optab, op0,
3468 immed_wide_int_const (~mask, imode),
3469 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3471 temp = expand_binop (imode, ior_optab, op0, op1,
3472 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3473 target = lowpart_subreg_maybe_copy (mode, temp, imode);
3476 return target;
3479 /* Expand the C99 copysign operation. OP0 and OP1 must be the same
3480 scalar floating point mode. Return NULL if we do not know how to
3481 expand the operation inline. */
3484 expand_copysign (rtx op0, rtx op1, rtx target)
3486 scalar_float_mode mode;
3487 const struct real_format *fmt;
3488 bool op0_is_abs;
3489 rtx temp;
3491 mode = as_a <scalar_float_mode> (GET_MODE (op0));
3492 gcc_assert (GET_MODE (op1) == mode);
3494 /* First try to do it with a special instruction. */
3495 temp = expand_binop (mode, copysign_optab, op0, op1,
3496 target, 0, OPTAB_DIRECT);
3497 if (temp)
3498 return temp;
3500 fmt = REAL_MODE_FORMAT (mode);
3501 if (fmt == NULL || !fmt->has_signed_zero)
3502 return NULL_RTX;
3504 op0_is_abs = false;
3505 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3507 if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3508 op0 = simplify_unary_operation (ABS, mode, op0, mode);
3509 op0_is_abs = true;
3512 if (fmt->signbit_ro >= 0
3513 && (CONST_DOUBLE_AS_FLOAT_P (op0)
3514 || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3515 && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3517 temp = expand_copysign_absneg (mode, op0, op1, target,
3518 fmt->signbit_ro, op0_is_abs);
3519 if (temp)
3520 return temp;
3523 if (fmt->signbit_rw < 0)
3524 return NULL_RTX;
3525 return expand_copysign_bit (mode, op0, op1, target,
3526 fmt->signbit_rw, op0_is_abs);
3529 /* Generate an instruction whose insn-code is INSN_CODE,
3530 with two operands: an output TARGET and an input OP0.
3531 TARGET *must* be nonzero, and the output is always stored there.
3532 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3533 the value that is stored into TARGET.
3535 Return false if expansion failed. */
3537 bool
3538 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3539 enum rtx_code code)
3541 struct expand_operand ops[2];
3542 rtx_insn *pat;
3544 create_output_operand (&ops[0], target, GET_MODE (target));
3545 create_input_operand (&ops[1], op0, GET_MODE (op0));
3546 pat = maybe_gen_insn (icode, 2, ops);
3547 if (!pat)
3548 return false;
3550 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3551 && code != UNKNOWN)
3552 add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3554 emit_insn (pat);
3556 if (ops[0].value != target)
3557 emit_move_insn (target, ops[0].value);
3558 return true;
3560 /* Generate an instruction whose insn-code is INSN_CODE,
3561 with two operands: an output TARGET and an input OP0.
3562 TARGET *must* be nonzero, and the output is always stored there.
3563 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3564 the value that is stored into TARGET. */
3566 void
3567 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3569 bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3570 gcc_assert (ok);
3573 struct no_conflict_data
3575 rtx target;
3576 rtx_insn *first, *insn;
3577 bool must_stay;
3580 /* Called via note_stores by emit_libcall_block. Set P->must_stay if
3581 the currently examined clobber / store has to stay in the list of
3582 insns that constitute the actual libcall block. */
3583 static void
3584 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3586 struct no_conflict_data *p= (struct no_conflict_data *) p0;
3588 /* If this insn directly contributes to setting the target, it must stay. */
3589 if (reg_overlap_mentioned_p (p->target, dest))
3590 p->must_stay = true;
3591 /* If we haven't committed to keeping any other insns in the list yet,
3592 there is nothing more to check. */
3593 else if (p->insn == p->first)
3594 return;
3595 /* If this insn sets / clobbers a register that feeds one of the insns
3596 already in the list, this insn has to stay too. */
3597 else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3598 || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3599 || reg_used_between_p (dest, p->first, p->insn)
3600 /* Likewise if this insn depends on a register set by a previous
3601 insn in the list, or if it sets a result (presumably a hard
3602 register) that is set or clobbered by a previous insn.
3603 N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3604 SET_DEST perform the former check on the address, and the latter
3605 check on the MEM. */
3606 || (GET_CODE (set) == SET
3607 && (modified_in_p (SET_SRC (set), p->first)
3608 || modified_in_p (SET_DEST (set), p->first)
3609 || modified_between_p (SET_SRC (set), p->first, p->insn)
3610 || modified_between_p (SET_DEST (set), p->first, p->insn))))
3611 p->must_stay = true;
3615 /* Emit code to make a call to a constant function or a library call.
3617 INSNS is a list containing all insns emitted in the call.
3618 These insns leave the result in RESULT. Our block is to copy RESULT
3619 to TARGET, which is logically equivalent to EQUIV.
3621 We first emit any insns that set a pseudo on the assumption that these are
3622 loading constants into registers; doing so allows them to be safely cse'ed
3623 between blocks. Then we emit all the other insns in the block, followed by
3624 an insn to move RESULT to TARGET. This last insn will have a REG_EQUAL
3625 note with an operand of EQUIV. */
3627 static void
3628 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3629 bool equiv_may_trap)
3631 rtx final_dest = target;
3632 rtx_insn *next, *last, *insn;
3634 /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3635 into a MEM later. Protect the libcall block from this change. */
3636 if (! REG_P (target) || REG_USERVAR_P (target))
3637 target = gen_reg_rtx (GET_MODE (target));
3639 /* If we're using non-call exceptions, a libcall corresponding to an
3640 operation that may trap may also trap. */
3641 /* ??? See the comment in front of make_reg_eh_region_note. */
3642 if (cfun->can_throw_non_call_exceptions
3643 && (equiv_may_trap || may_trap_p (equiv)))
3645 for (insn = insns; insn; insn = NEXT_INSN (insn))
3646 if (CALL_P (insn))
3648 rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3649 if (note)
3651 int lp_nr = INTVAL (XEXP (note, 0));
3652 if (lp_nr == 0 || lp_nr == INT_MIN)
3653 remove_note (insn, note);
3657 else
3659 /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3660 reg note to indicate that this call cannot throw or execute a nonlocal
3661 goto (unless there is already a REG_EH_REGION note, in which case
3662 we update it). */
3663 for (insn = insns; insn; insn = NEXT_INSN (insn))
3664 if (CALL_P (insn))
3665 make_reg_eh_region_note_nothrow_nononlocal (insn);
3668 /* First emit all insns that set pseudos. Remove them from the list as
3669 we go. Avoid insns that set pseudos which were referenced in previous
3670 insns. These can be generated by move_by_pieces, for example,
3671 to update an address. Similarly, avoid insns that reference things
3672 set in previous insns. */
3674 for (insn = insns; insn; insn = next)
3676 rtx set = single_set (insn);
3678 next = NEXT_INSN (insn);
3680 if (set != 0 && REG_P (SET_DEST (set))
3681 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3683 struct no_conflict_data data;
3685 data.target = const0_rtx;
3686 data.first = insns;
3687 data.insn = insn;
3688 data.must_stay = 0;
3689 note_stores (PATTERN (insn), no_conflict_move_test, &data);
3690 if (! data.must_stay)
3692 if (PREV_INSN (insn))
3693 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3694 else
3695 insns = next;
3697 if (next)
3698 SET_PREV_INSN (next) = PREV_INSN (insn);
3700 add_insn (insn);
3704 /* Some ports use a loop to copy large arguments onto the stack.
3705 Don't move anything outside such a loop. */
3706 if (LABEL_P (insn))
3707 break;
3710 /* Write the remaining insns followed by the final copy. */
3711 for (insn = insns; insn; insn = next)
3713 next = NEXT_INSN (insn);
3715 add_insn (insn);
3718 last = emit_move_insn (target, result);
3719 if (equiv)
3720 set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3722 if (final_dest != target)
3723 emit_move_insn (final_dest, target);
3726 void
3727 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3729 emit_libcall_block_1 (insns, target, result, equiv, false);
3732 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3733 PURPOSE describes how this comparison will be used. CODE is the rtx
3734 comparison code we will be using.
3736 ??? Actually, CODE is slightly weaker than that. A target is still
3737 required to implement all of the normal bcc operations, but not
3738 required to implement all (or any) of the unordered bcc operations. */
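/* E.g. can_compare_p (EQ, SImode, ccp_jump) is nonzero when the target has
   a usable cbranch pattern for SImode or for some wider mode that SImode
   can be widened to; the GET_MODE_WIDER_MODE loop below provides the
   "or wider" part.  (Illustrative reading of the interface, not a new
   guarantee.)  */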
3741 can_compare_p (enum rtx_code code, machine_mode mode,
3742 enum can_compare_purpose purpose)
3744 rtx test;
3745 test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3748 enum insn_code icode;
3750 if (purpose == ccp_jump
3751 && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3752 && insn_operand_matches (icode, 0, test))
3753 return 1;
3754 if (purpose == ccp_store_flag
3755 && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3756 && insn_operand_matches (icode, 1, test))
3757 return 1;
3758 if (purpose == ccp_cmov
3759 && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3760 return 1;
3762 mode = GET_MODE_WIDER_MODE (mode).else_void ();
3763 PUT_MODE (test, mode);
3765 while (mode != VOIDmode);
3767 return 0;
3770 /* This function is called when we are going to emit a compare instruction that
3771 compares the values found in X and Y, using the rtl operator COMPARISON.
3773 If they have mode BLKmode, then SIZE specifies the size of both operands.
3775 UNSIGNEDP nonzero says that the operands are unsigned;
3776 this matters if they need to be widened (as given by METHODS).
3778 *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3779 if we failed to produce one.
3781 *PMODE is the mode of the inputs (in case they are const_int).
3783 This function performs all the setup necessary so that the caller only has
3784 to emit a single comparison insn. This setup can involve doing a BLKmode
3785 comparison or emitting a library call to perform the comparison if no insn
3786 is available to handle it.
3787 The values which are passed in through pointers can be modified; the caller
3788 should perform the comparison on the modified values. Constant
3789 comparisons must have already been folded. */
3791 static void
3792 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3793 int unsignedp, enum optab_methods methods,
3794 rtx *ptest, machine_mode *pmode)
3796 machine_mode mode = *pmode;
3797 rtx libfunc, test;
3798 machine_mode cmp_mode;
3799 enum mode_class mclass;
3801 /* The other methods are not needed. */
3802 gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3803 || methods == OPTAB_LIB_WIDEN);
3805 /* If we are optimizing, force expensive constants into a register. */
3806 if (CONSTANT_P (x) && optimize
3807 && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3808 > COSTS_N_INSNS (1)))
3809 x = force_reg (mode, x);
3811 if (CONSTANT_P (y) && optimize
3812 && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3813 > COSTS_N_INSNS (1)))
3814 y = force_reg (mode, y);
3816 #if HAVE_cc0
3817 /* Make sure we have a canonical comparison. The RTL
3818 documentation states that canonical comparisons are required only
3819 for targets which have cc0. */
3820 gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3821 #endif
3823 /* Don't let both operands fail to indicate the mode. */
3824 if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3825 x = force_reg (mode, x);
3826 if (mode == VOIDmode)
3827 mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3829 /* Handle all BLKmode compares. */
3831 if (mode == BLKmode)
3833 machine_mode result_mode;
3834 enum insn_code cmp_code;
3835 rtx result;
3836 rtx opalign
3837 = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3839 gcc_assert (size);
3841 /* Try to use a memory block compare insn - either cmpstr
3842 or cmpmem will do. */
3843 opt_scalar_int_mode cmp_mode_iter;
3844 FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3846 scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3847 cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3848 if (cmp_code == CODE_FOR_nothing)
3849 cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3850 if (cmp_code == CODE_FOR_nothing)
3851 cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3852 if (cmp_code == CODE_FOR_nothing)
3853 continue;
3855 /* Must make sure the size fits the insn's mode. */
3856 if (CONST_INT_P (size)
3857 ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3858 : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3859 > GET_MODE_BITSIZE (cmp_mode)))
3860 continue;
3862 result_mode = insn_data[cmp_code].operand[0].mode;
3863 result = gen_reg_rtx (result_mode);
3864 size = convert_to_mode (cmp_mode, size, 1);
3865 emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3867 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3868 *pmode = result_mode;
3869 return;
3872 if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3873 goto fail;
3875 /* Otherwise call a library function. */
3876 result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3878 x = result;
3879 y = const0_rtx;
3880 mode = TYPE_MODE (integer_type_node);
3881 methods = OPTAB_LIB_WIDEN;
3882 unsignedp = false;
3885 /* Don't allow operands to the compare to trap, as that can put the
3886 compare and branch in different basic blocks. */
3887 if (cfun->can_throw_non_call_exceptions)
3889 if (may_trap_p (x))
3890 x = copy_to_reg (x);
3891 if (may_trap_p (y))
3892 y = copy_to_reg (y);
3895 if (GET_MODE_CLASS (mode) == MODE_CC)
3897 enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3898 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3899 gcc_assert (icode != CODE_FOR_nothing
3900 && insn_operand_matches (icode, 0, test));
3901 *ptest = test;
3902 return;
3905 mclass = GET_MODE_CLASS (mode);
3906 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3907 FOR_EACH_MODE_FROM (cmp_mode, mode)
3909 enum insn_code icode;
3910 icode = optab_handler (cbranch_optab, cmp_mode);
3911 if (icode != CODE_FOR_nothing
3912 && insn_operand_matches (icode, 0, test))
3914 rtx_insn *last = get_last_insn ();
3915 rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3916 rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3917 if (op0 && op1
3918 && insn_operand_matches (icode, 1, op0)
3919 && insn_operand_matches (icode, 2, op1))
3921 XEXP (test, 0) = op0;
3922 XEXP (test, 1) = op1;
3923 *ptest = test;
3924 *pmode = cmp_mode;
3925 return;
3927 delete_insns_since (last);
3930 if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3931 break;
3934 if (methods != OPTAB_LIB_WIDEN)
3935 goto fail;
3937 if (!SCALAR_FLOAT_MODE_P (mode))
3939 rtx result;
3940 machine_mode ret_mode;
3942 /* Handle a libcall just for the mode we are using. */
3943 libfunc = optab_libfunc (cmp_optab, mode);
3944 gcc_assert (libfunc);
3946 /* If we want unsigned, and this mode has a distinct unsigned
3947 comparison routine, use that. */
3948 if (unsignedp)
3950 rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3951 if (ulibfunc)
3952 libfunc = ulibfunc;
3955 ret_mode = targetm.libgcc_cmp_return_mode ();
3956 result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3957 ret_mode, x, mode, y, mode);
3959 /* There are two kinds of comparison routines. Biased routines
3960 return 0/1/2, and unbiased routines return -1/0/1. Other parts
3961 of gcc expect that the comparison operation is equivalent
3962 to the modified comparison. For signed comparisons compare the
3963 result against 1 in the biased case, and zero in the unbiased
3964 case. For unsigned comparisons always compare against 1 after
3965 biasing the unbiased result by adding 1. This gives us a way to
3966 represent LTU.
3967 The comparisons in the fixed-point helper library are always
3968 biased. */
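      /* As a worked example (illustrative only): libgcc's __cmpdi2 is
         biased and returns 0, 1 or 2 for <, == and >, so a signed A < B
         becomes "__cmpdi2 (A, B) < 1".  With an unbiased -1/0/1 routine,
         a signed comparison is instead made against 0, while an unsigned
         one first adds 1 to rebias the result to 0/1/2 and then compares
         against 1 with an unsigned condition code, which is how LTU gets
         represented.  */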
3969 x = result;
3970 y = const1_rtx;
3972 if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3974 if (unsignedp)
3975 x = plus_constant (ret_mode, result, 1);
3976 else
3977 y = const0_rtx;
3980 *pmode = ret_mode;
3981 prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
3982 ptest, pmode);
3984 else
3985 prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3987 return;
3989 fail:
3990 *ptest = NULL_RTX;
3993 /* Before emitting an insn with code ICODE, make sure that X, which is going
3994 to be used for operand OPNUM of the insn, is converted from mode MODE to
3995 WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
3996 that it is accepted by the operand predicate. Return the new value. */
3999 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4000 machine_mode wider_mode, int unsignedp)
4002 if (mode != wider_mode)
4003 x = convert_modes (wider_mode, mode, x, unsignedp);
4005 if (!insn_operand_matches (icode, opnum, x))
4007 machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4008 if (reload_completed)
4009 return NULL_RTX;
4010 if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4011 return NULL_RTX;
4012 x = copy_to_mode_reg (op_mode, x);
4015 return x;
4018 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4019 we can do the branch. */
4021 static void
4022 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4023 profile_probability prob)
4025 machine_mode optab_mode;
4026 enum mode_class mclass;
4027 enum insn_code icode;
4028 rtx_insn *insn;
4030 mclass = GET_MODE_CLASS (mode);
4031 optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4032 icode = optab_handler (cbranch_optab, optab_mode);
4034 gcc_assert (icode != CODE_FOR_nothing);
4035 gcc_assert (insn_operand_matches (icode, 0, test));
4036 insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4037 XEXP (test, 1), label));
4038 if (prob.initialized_p ()
4039 && profile_status_for_fn (cfun) != PROFILE_ABSENT
4040 && insn
4041 && JUMP_P (insn)
4042 && any_condjump_p (insn)
4043 && !find_reg_note (insn, REG_BR_PROB, 0))
4044 add_reg_br_prob_note (insn, prob);
4047 /* Generate code to compare X with Y so that the condition codes are
4048 set and to jump to LABEL if the condition is true. If X is a
4049 constant and Y is not a constant, then the comparison is swapped to
4050 ensure that the comparison RTL has the canonical form.
4052 UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4053 need to be widened. UNSIGNEDP is also used to select the proper
4054 branch condition code.
4056 If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4058 MODE is the mode of the inputs (in case they are const_int).
4060 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4061 It will be potentially converted into an unsigned variant based on
4062 UNSIGNEDP to select a proper jump instruction.
4064 PROB is the probability of jumping to LABEL. */
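/* A minimal illustrative use, emitting "if (a < b) goto label" for signed
   SImode values with no particular branch probability:

       emit_cmp_and_jump_insns (a, b, LT, NULL_RTX, SImode, 0, label,
                                profile_probability::uninitialized ());  */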
4066 void
4067 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4068 machine_mode mode, int unsignedp, rtx label,
4069 profile_probability prob)
4071 rtx op0 = x, op1 = y;
4072 rtx test;
4074 /* Swap operands and condition to ensure canonical RTL. */
4075 if (swap_commutative_operands_p (x, y)
4076 && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4078 op0 = y, op1 = x;
4079 comparison = swap_condition (comparison);
4082 /* If OP0 is still a constant, then both X and Y must be constants
4083 or the opposite comparison is not supported. Force OP0 into a register
4084 to create canonical RTL. */
4085 if (CONSTANT_P (op0))
4086 op0 = force_reg (mode, op0);
4088 if (unsignedp)
4089 comparison = unsigned_condition (comparison);
4091 prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4092 &test, &mode);
4093 emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4097 /* Emit a library call comparison between floating point X and Y.
4098 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.). */
4100 static void
4101 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4102 rtx *ptest, machine_mode *pmode)
4104 enum rtx_code swapped = swap_condition (comparison);
4105 enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4106 machine_mode orig_mode = GET_MODE (x);
4107 machine_mode mode;
4108 rtx true_rtx, false_rtx;
4109 rtx value, target, equiv;
4110 rtx_insn *insns;
4111 rtx libfunc = 0;
4112 bool reversed_p = false;
4113 scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4115 FOR_EACH_MODE_FROM (mode, orig_mode)
4117 if (code_to_optab (comparison)
4118 && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4119 break;
4121 if (code_to_optab (swapped)
4122 && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4124 std::swap (x, y);
4125 comparison = swapped;
4126 break;
4129 if (code_to_optab (reversed)
4130 && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4132 comparison = reversed;
4133 reversed_p = true;
4134 break;
4138 gcc_assert (mode != VOIDmode);
4140 if (mode != orig_mode)
4142 x = convert_to_mode (mode, x, 0);
4143 y = convert_to_mode (mode, y, 0);
4146 /* Attach a REG_EQUAL note describing the semantics of the libcall to
4147 the RTL. This allows the RTL optimizers to delete the libcall if the
4148 condition can be determined at compile-time. */
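      /* For a GT comparison whose libcall returns an SImode value, the
         attached note would describe the result as something like
         (if_then_else:SI (gt x y) (const_int 1) (const_int 0)),
         matching the TRUE_RTX/FALSE_RTX encoding chosen below.  */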
4149 if (comparison == UNORDERED
4150 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4152 true_rtx = const_true_rtx;
4153 false_rtx = const0_rtx;
4155 else
4157 switch (comparison)
4159 case EQ:
4160 true_rtx = const0_rtx;
4161 false_rtx = const_true_rtx;
4162 break;
4164 case NE:
4165 true_rtx = const_true_rtx;
4166 false_rtx = const0_rtx;
4167 break;
4169 case GT:
4170 true_rtx = const1_rtx;
4171 false_rtx = const0_rtx;
4172 break;
4174 case GE:
4175 true_rtx = const0_rtx;
4176 false_rtx = constm1_rtx;
4177 break;
4179 case LT:
4180 true_rtx = constm1_rtx;
4181 false_rtx = const0_rtx;
4182 break;
4184 case LE:
4185 true_rtx = const0_rtx;
4186 false_rtx = const1_rtx;
4187 break;
4189 default:
4190 gcc_unreachable ();
4194 if (comparison == UNORDERED)
4196 rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4197 equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4198 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4199 temp, const_true_rtx, equiv);
4201 else
4203 equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4204 if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4205 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4206 equiv, true_rtx, false_rtx);
4209 start_sequence ();
4210 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4211 cmp_mode, x, mode, y, mode);
4212 insns = get_insns ();
4213 end_sequence ();
4215 target = gen_reg_rtx (cmp_mode);
4216 emit_libcall_block (insns, target, value, equiv);
4218 if (comparison == UNORDERED
4219 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4220 || reversed_p)
4221 *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4222 else
4223 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4225 *pmode = cmp_mode;
4228 /* Generate code to indirectly jump to a location given in the rtx LOC. */
4230 void
4231 emit_indirect_jump (rtx loc)
4233 if (!targetm.have_indirect_jump ())
4234 sorry ("indirect jumps are not available on this target");
4235 else
4237 struct expand_operand ops[1];
4238 create_address_operand (&ops[0], loc);
4239 expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4240 emit_barrier ();
4245 /* Emit a conditional move instruction if the machine supports one for that
4246 condition and machine mode.
4248 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4249 the mode to use should they be constants. If it is VOIDmode, they cannot
4250 both be constants.
4252 OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4253 should be stored there. MODE is the mode to use should they be constants.
4254 If it is VOIDmode, they cannot both be constants.
4256 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4257 is not supported. */
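/* For instance (an illustrative sketch), a caller wanting
   target = (a > b) ? x : y on signed SImode values would use

       emit_conditional_move (target, GT, a, b, SImode, x, y, SImode, 0);

   and must cope with a NULL_RTX return when the target lacks a movcc
   pattern for SImode.  */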
4260 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4261 machine_mode cmode, rtx op2, rtx op3,
4262 machine_mode mode, int unsignedp)
4264 rtx comparison;
4265 rtx_insn *last;
4266 enum insn_code icode;
4267 enum rtx_code reversed;
4269 /* If the two source operands are identical, that's just a move. */
4271 if (rtx_equal_p (op2, op3))
4273 if (!target)
4274 target = gen_reg_rtx (mode);
4276 emit_move_insn (target, op3);
4277 return target;
4280 /* If one operand is constant, make it the second one. Only do this
4281 if the other operand is not constant as well. */
4283 if (swap_commutative_operands_p (op0, op1))
4285 std::swap (op0, op1);
4286 code = swap_condition (code);
4289 /* get_condition will prefer to generate LT and GT even if the old
4290 comparison was against zero, so undo that canonicalization here since
4291 comparisons against zero are cheaper. */
4292 if (code == LT && op1 == const1_rtx)
4293 code = LE, op1 = const0_rtx;
4294 else if (code == GT && op1 == constm1_rtx)
4295 code = GE, op1 = const0_rtx;
4297 if (cmode == VOIDmode)
4298 cmode = GET_MODE (op0);
4300 enum rtx_code orig_code = code;
4301 bool swapped = false;
4302 if (swap_commutative_operands_p (op2, op3)
4303 && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4304 != UNKNOWN))
4306 std::swap (op2, op3);
4307 code = reversed;
4308 swapped = true;
4311 if (mode == VOIDmode)
4312 mode = GET_MODE (op2);
4314 icode = direct_optab_handler (movcc_optab, mode);
4316 if (icode == CODE_FOR_nothing)
4317 return NULL_RTX;
4319 if (!target)
4320 target = gen_reg_rtx (mode);
4322 for (int pass = 0; ; pass++)
4324 code = unsignedp ? unsigned_condition (code) : code;
4325 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4327 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4328 punt and let the caller figure out how best to deal with this
4329 situation. */
4330 if (COMPARISON_P (comparison))
4332 saved_pending_stack_adjust save;
4333 save_pending_stack_adjust (&save);
4334 last = get_last_insn ();
4335 do_pending_stack_adjust ();
4336 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4337 GET_CODE (comparison), NULL_RTX, unsignedp,
4338 OPTAB_WIDEN, &comparison, &cmode);
4339 if (comparison)
4341 struct expand_operand ops[4];
4343 create_output_operand (&ops[0], target, mode);
4344 create_fixed_operand (&ops[1], comparison);
4345 create_input_operand (&ops[2], op2, mode);
4346 create_input_operand (&ops[3], op3, mode);
4347 if (maybe_expand_insn (icode, 4, ops))
4349 if (ops[0].value != target)
4350 convert_move (target, ops[0].value, false);
4351 return target;
4354 delete_insns_since (last);
4355 restore_pending_stack_adjust (&save);
4358 if (pass == 1)
4359 return NULL_RTX;
4361 /* If the preferred op2/op3 order is not usable, retry with the other
4362 operand order; perhaps it will expand successfully. */
4363 if (swapped)
4364 code = orig_code;
4365 else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4366 NULL))
4367 != UNKNOWN)
4368 code = reversed;
4369 else
4370 return NULL_RTX;
4371 std::swap (op2, op3);
4376 /* Emit a conditional negate or bitwise complement using the
4377 negcc or notcc optabs if available. Return NULL_RTX if such operations
4378 are not available. Otherwise return the RTX holding the result.
4379 TARGET is the desired destination of the result. COND is the condition
4380 to test. If COND is true, move into TARGET the negation
4381 or bitwise complement of OP1. Otherwise move OP2 into TARGET.
4382 CODE is either NEG or NOT. MODE is the machine mode in which the
4383 operation is performed. */
4386 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4387 machine_mode mode, rtx cond, rtx op1,
4388 rtx op2)
4390 optab op = unknown_optab;
4391 if (code == NEG)
4392 op = negcc_optab;
4393 else if (code == NOT)
4394 op = notcc_optab;
4395 else
4396 gcc_unreachable ();
4398 insn_code icode = direct_optab_handler (op, mode);
4400 if (icode == CODE_FOR_nothing)
4401 return NULL_RTX;
4403 if (!target)
4404 target = gen_reg_rtx (mode);
4406 rtx_insn *last = get_last_insn ();
4407 struct expand_operand ops[4];
4409 create_output_operand (&ops[0], target, mode);
4410 create_fixed_operand (&ops[1], cond);
4411 create_input_operand (&ops[2], op1, mode);
4412 create_input_operand (&ops[3], op2, mode);
4414 if (maybe_expand_insn (icode, 4, ops))
4416 if (ops[0].value != target)
4417 convert_move (target, ops[0].value, false);
4419 return target;
4421 delete_insns_since (last);
4422 return NULL_RTX;
4425 /* Emit a conditional addition instruction if the machine supports one for that
4426 condition and machine mode.
4428 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4429 the mode to use should they be constants. If it is VOIDmode, they cannot
4430 both be constants.
4432 OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4433 should be stored there. MODE is the mode to use should they be constants.
4434 If it is VOIDmode, they cannot both be constants.
4436 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4437 is not supported. */
4440 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4441 machine_mode cmode, rtx op2, rtx op3,
4442 machine_mode mode, int unsignedp)
4444 rtx comparison;
4445 rtx_insn *last;
4446 enum insn_code icode;
4448 /* If one operand is constant, make it the second one. Only do this
4449 if the other operand is not constant as well. */
4451 if (swap_commutative_operands_p (op0, op1))
4453 std::swap (op0, op1);
4454 code = swap_condition (code);
4457 /* get_condition will prefer to generate LT and GT even if the old
4458 comparison was against zero, so undo that canonicalization here since
4459 comparisons against zero are cheaper. */
4460 if (code == LT && op1 == const1_rtx)
4461 code = LE, op1 = const0_rtx;
4462 else if (code == GT && op1 == constm1_rtx)
4463 code = GE, op1 = const0_rtx;
4465 if (cmode == VOIDmode)
4466 cmode = GET_MODE (op0);
4468 if (mode == VOIDmode)
4469 mode = GET_MODE (op2);
4471 icode = optab_handler (addcc_optab, mode);
4473 if (icode == CODE_FOR_nothing)
4474 return 0;
4476 if (!target)
4477 target = gen_reg_rtx (mode);
4479 code = unsignedp ? unsigned_condition (code) : code;
4480 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4482 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4483 return NULL and let the caller figure out how best to deal with this
4484 situation. */
4485 if (!COMPARISON_P (comparison))
4486 return NULL_RTX;
4488 do_pending_stack_adjust ();
4489 last = get_last_insn ();
4490 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4491 GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4492 &comparison, &cmode);
4493 if (comparison)
4495 struct expand_operand ops[4];
4497 create_output_operand (&ops[0], target, mode);
4498 create_fixed_operand (&ops[1], comparison);
4499 create_input_operand (&ops[2], op2, mode);
4500 create_input_operand (&ops[3], op3, mode);
4501 if (maybe_expand_insn (icode, 4, ops))
4503 if (ops[0].value != target)
4504 convert_move (target, ops[0].value, false);
4505 return target;
4508 delete_insns_since (last);
4509 return NULL_RTX;
4512 /* These functions attempt to generate an insn body, rather than
4513 emitting the insn, but if the gen function already emits them, we
4514 make no attempt to turn them back into naked patterns. */
4516 /* Generate and return an insn body to add Y to X. */
4518 rtx_insn *
4519 gen_add2_insn (rtx x, rtx y)
4521 enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4523 gcc_assert (insn_operand_matches (icode, 0, x));
4524 gcc_assert (insn_operand_matches (icode, 1, x));
4525 gcc_assert (insn_operand_matches (icode, 2, y));
4527 return GEN_FCN (icode) (x, x, y);
4530 /* Generate and return an insn body to add r1 and c,
4531 storing the result in r0. */
4533 rtx_insn *
4534 gen_add3_insn (rtx r0, rtx r1, rtx c)
4536 enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4538 if (icode == CODE_FOR_nothing
4539 || !insn_operand_matches (icode, 0, r0)
4540 || !insn_operand_matches (icode, 1, r1)
4541 || !insn_operand_matches (icode, 2, c))
4542 return NULL;
4544 return GEN_FCN (icode) (r0, r1, c);
4548 have_add2_insn (rtx x, rtx y)
4550 enum insn_code icode;
4552 gcc_assert (GET_MODE (x) != VOIDmode);
4554 icode = optab_handler (add_optab, GET_MODE (x));
4556 if (icode == CODE_FOR_nothing)
4557 return 0;
4559 if (!insn_operand_matches (icode, 0, x)
4560 || !insn_operand_matches (icode, 1, x)
4561 || !insn_operand_matches (icode, 2, y))
4562 return 0;
4564 return 1;
4567 /* Generate and return an insn body to add Y and Z, storing the result in X. */
4569 rtx_insn *
4570 gen_addptr3_insn (rtx x, rtx y, rtx z)
4572 enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4574 gcc_assert (insn_operand_matches (icode, 0, x));
4575 gcc_assert (insn_operand_matches (icode, 1, y));
4576 gcc_assert (insn_operand_matches (icode, 2, z));
4578 return GEN_FCN (icode) (x, y, z);
4581 /* Return true if the target implements an addptr pattern and X, Y,
4582 and Z are valid for the pattern predicates. */
4585 have_addptr3_insn (rtx x, rtx y, rtx z)
4587 enum insn_code icode;
4589 gcc_assert (GET_MODE (x) != VOIDmode);
4591 icode = optab_handler (addptr3_optab, GET_MODE (x));
4593 if (icode == CODE_FOR_nothing)
4594 return 0;
4596 if (!insn_operand_matches (icode, 0, x)
4597 || !insn_operand_matches (icode, 1, y)
4598 || !insn_operand_matches (icode, 2, z))
4599 return 0;
4601 return 1;
4604 /* Generate and return an insn body to subtract Y from X. */
4606 rtx_insn *
4607 gen_sub2_insn (rtx x, rtx y)
4609 enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4611 gcc_assert (insn_operand_matches (icode, 0, x));
4612 gcc_assert (insn_operand_matches (icode, 1, x));
4613 gcc_assert (insn_operand_matches (icode, 2, y));
4615 return GEN_FCN (icode) (x, x, y);
4618 /* Generate and return an insn body to subtract c from r1,
4619 storing the result in r0. */
4621 rtx_insn *
4622 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4624 enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4626 if (icode == CODE_FOR_nothing
4627 || !insn_operand_matches (icode, 0, r0)
4628 || !insn_operand_matches (icode, 1, r1)
4629 || !insn_operand_matches (icode, 2, c))
4630 return NULL;
4632 return GEN_FCN (icode) (r0, r1, c);
4636 have_sub2_insn (rtx x, rtx y)
4638 enum insn_code icode;
4640 gcc_assert (GET_MODE (x) != VOIDmode);
4642 icode = optab_handler (sub_optab, GET_MODE (x));
4644 if (icode == CODE_FOR_nothing)
4645 return 0;
4647 if (!insn_operand_matches (icode, 0, x)
4648 || !insn_operand_matches (icode, 1, x)
4649 || !insn_operand_matches (icode, 2, y))
4650 return 0;
4652 return 1;
4655 /* Generate the body of an insn to extend Y (with mode MFROM)
4656 into X (with mode MTO). Do zero-extension if UNSIGNEDP is nonzero. */
4658 rtx_insn *
4659 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4660 machine_mode mfrom, int unsignedp)
4662 enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4663 return GEN_FCN (icode) (x, y);
4666 /* Generate code to convert FROM to floating point
4667 and store in TO. FROM must be fixed point and not VOIDmode.
4668 UNSIGNEDP nonzero means regard FROM as unsigned.
4669 Normally this is done by correcting the final value
4670 if it is negative. */
4672 void
4673 expand_float (rtx to, rtx from, int unsignedp)
4675 enum insn_code icode;
4676 rtx target = to;
4677 scalar_mode from_mode, to_mode;
4678 machine_mode fmode, imode;
4679 bool can_do_signed = false;
4681 /* Crash now, because we won't be able to decide which mode to use. */
4682 gcc_assert (GET_MODE (from) != VOIDmode);
4684 /* Look for an insn to do the conversion. Do it in the specified
4685 modes if possible; otherwise convert either input, output or both to
4686 wider mode. If the integer mode is wider than the mode of FROM,
4687 we can do the conversion signed even if the input is unsigned. */
4689 FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4690 FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4692 int doing_unsigned = unsignedp;
4694 if (fmode != GET_MODE (to)
4695 && (significand_size (fmode)
4696 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
4697 continue;
4699 icode = can_float_p (fmode, imode, unsignedp);
4700 if (icode == CODE_FOR_nothing && unsignedp)
4702 enum insn_code scode = can_float_p (fmode, imode, 0);
4703 if (scode != CODE_FOR_nothing)
4704 can_do_signed = true;
4705 if (imode != GET_MODE (from))
4706 icode = scode, doing_unsigned = 0;
4709 if (icode != CODE_FOR_nothing)
4711 if (imode != GET_MODE (from))
4712 from = convert_to_mode (imode, from, unsignedp);
4714 if (fmode != GET_MODE (to))
4715 target = gen_reg_rtx (fmode);
4717 emit_unop_insn (icode, target, from,
4718 doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4720 if (target != to)
4721 convert_move (to, target, 0);
4722 return;
4726 /* Unsigned integer, and no way to convert directly. Convert as signed,
4727 then unconditionally adjust the result. */
4728 if (unsignedp
4729 && can_do_signed
4730 && is_a <scalar_mode> (GET_MODE (to), &to_mode)
4731 && is_a <scalar_mode> (GET_MODE (from), &from_mode))
4733 opt_scalar_mode fmode_iter;
4734 rtx_code_label *label = gen_label_rtx ();
4735 rtx temp;
4736 REAL_VALUE_TYPE offset;
4738 /* Look for a usable floating mode FMODE wider than the source and at
4739 least as wide as the target. Using FMODE will avoid rounding woes
4740 with unsigned values greater than the signed maximum value. */
4742 FOR_EACH_MODE_FROM (fmode_iter, to_mode)
4744 scalar_mode fmode = fmode_iter.require ();
4745 if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
4746 && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
4747 break;
4750 if (!fmode_iter.exists (&fmode))
4752 /* There is no such mode. Pretend the target is wide enough. */
4753 fmode = to_mode;
4755 /* Avoid double-rounding when TO is narrower than FROM. */
4756 if ((significand_size (fmode) + 1)
4757 < GET_MODE_PRECISION (from_mode))
4759 rtx temp1;
4760 rtx_code_label *neglabel = gen_label_rtx ();
4762 /* Don't use TARGET if it isn't a register, is a hard register,
4763 or is the wrong mode. */
4764 if (!REG_P (target)
4765 || REGNO (target) < FIRST_PSEUDO_REGISTER
4766 || GET_MODE (target) != fmode)
4767 target = gen_reg_rtx (fmode);
4769 imode = from_mode;
4770 do_pending_stack_adjust ();
4772 /* Test whether the sign bit is set. */
4773 emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4774 0, neglabel);
4776 /* The sign bit is not set. Convert as signed. */
4777 expand_float (target, from, 0);
4778 emit_jump_insn (targetm.gen_jump (label));
4779 emit_barrier ();
4781 /* The sign bit is set.
4782 Convert to a usable (positive signed) value by shifting right
4783 one bit, while remembering if a nonzero bit was shifted
4784 out; i.e., compute (from & 1) | (from >> 1). */
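      /* This mirrors the familiar scalar idiom for an exact unsigned to
         floating-point conversion of a value with the sign bit set,
         roughly (double) ((x >> 1) | (x & 1)) * 2.0: the shifted-out bit
         is kept as a sticky bit so that the single rounding in the
         conversion rounds as the full value would.  */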
4786 emit_label (neglabel);
4787 temp = expand_binop (imode, and_optab, from, const1_rtx,
4788 NULL_RTX, 1, OPTAB_LIB_WIDEN);
4789 temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4790 temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4791 OPTAB_LIB_WIDEN);
4792 expand_float (target, temp, 0);
4794 /* Multiply by 2 to undo the shift above. */
4795 temp = expand_binop (fmode, add_optab, target, target,
4796 target, 0, OPTAB_LIB_WIDEN);
4797 if (temp != target)
4798 emit_move_insn (target, temp);
4800 do_pending_stack_adjust ();
4801 emit_label (label);
4802 goto done;
4806 /* If we are about to do some arithmetic to correct for an
4807 unsigned operand, do it in a pseudo-register. */
4809 if (to_mode != fmode
4810 || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4811 target = gen_reg_rtx (fmode);
4813 /* Convert as signed integer to floating. */
4814 expand_float (target, from, 0);
4816 /* If FROM is negative (and therefore TO is negative),
4817 correct its value by 2**bitwidth. */
4819 do_pending_stack_adjust ();
4820 emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
4821 0, label);
4824 real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
4825 temp = expand_binop (fmode, add_optab, target,
4826 const_double_from_real_value (offset, fmode),
4827 target, 0, OPTAB_LIB_WIDEN);
4828 if (temp != target)
4829 emit_move_insn (target, temp);
4831 do_pending_stack_adjust ();
4832 emit_label (label);
4833 goto done;
4836 /* No hardware instruction available; call a library routine. */
4838 rtx libfunc;
4839 rtx_insn *insns;
4840 rtx value;
4841 convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4843 if (is_narrower_int_mode (GET_MODE (from), SImode))
4844 from = convert_to_mode (SImode, from, unsignedp);
4846 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4847 gcc_assert (libfunc);
4849 start_sequence ();
4851 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4852 GET_MODE (to), from, GET_MODE (from));
4853 insns = get_insns ();
4854 end_sequence ();
4856 emit_libcall_block (insns, target, value,
4857 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4858 GET_MODE (to), from));
4861 done:
4863 /* Copy result to requested destination
4864 if we have been computing in a temp location. */
4866 if (target != to)
4868 if (GET_MODE (target) == GET_MODE (to))
4869 emit_move_insn (to, target);
4870 else
4871 convert_move (to, target, 0);
4875 /* Generate code to convert FROM to fixed point and store in TO. FROM
4876 must be floating point. */
4878 void
4879 expand_fix (rtx to, rtx from, int unsignedp)
4881 enum insn_code icode;
4882 rtx target = to;
4883 machine_mode fmode, imode;
4884 opt_scalar_mode fmode_iter;
4885 bool must_trunc = false;
4887 /* We first try to find a pair of modes, one real and one integer, at
4888 least as wide as FROM and TO, respectively, in which we can open-code
4889 this conversion. If the integer mode is wider than the mode of TO,
4890 we can do the conversion either signed or unsigned. */
4892 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4893 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4895 int doing_unsigned = unsignedp;
4897 icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4898 if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4899 icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4901 if (icode != CODE_FOR_nothing)
4903 rtx_insn *last = get_last_insn ();
4904 if (fmode != GET_MODE (from))
4905 from = convert_to_mode (fmode, from, 0);
4907 if (must_trunc)
4909 rtx temp = gen_reg_rtx (GET_MODE (from));
4910 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4911 temp, 0);
4914 if (imode != GET_MODE (to))
4915 target = gen_reg_rtx (imode);
4917 if (maybe_emit_unop_insn (icode, target, from,
4918 doing_unsigned ? UNSIGNED_FIX : FIX))
4920 if (target != to)
4921 convert_move (to, target, unsignedp);
4922 return;
4924 delete_insns_since (last);
4928 /* For an unsigned conversion, there is one more way to do it.
4929 If we have a signed conversion, we generate code that compares
4930 the real value to the largest representable positive number. If it
4931 is smaller, the conversion is done normally. Otherwise, subtract
4932 one plus the highest signed number, convert, and add it back.
4934 We only need to check all real modes, since we know we didn't find
4935 anything with a wider integer mode.
4937 This code used to extend FP value into mode wider than the destination.
4938 This is needed for decimal float modes which cannot accurately
4939 represent one plus the highest signed number of the same size, but
4940 not for binary modes. Consider, for instance, conversion from SFmode
4941 into DImode.
4943 The hot path through the code is dealing with inputs smaller than 2^63
4944 and doing just the conversion, so there are no bits to lose.
4946 In the other path we know the value is positive in the range 2^63..2^64-1
4947 inclusive (for any other input, overflow happens and the result is undefined).
4948 So we know that the most significant bit set in the mantissa corresponds to
4949 2^63. The subtraction of 2^63 should not generate any rounding as it
4950 simply clears out that bit. The rest is trivial. */
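  /* Concretely (an illustrative sketch, not the emitted RTL): for a
     DFmode VALUE converted to an unsigned 64-bit result, the code below
     behaves like

         if (value < 0x1p63)
           result = (long long) value;
         else
           result = (long long) (value - 0x1p63) ^ (1ULL << 63);

     where the XOR adds 2^63 back without risking signed overflow.  */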
4952 scalar_int_mode to_mode;
4953 if (unsignedp
4954 && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
4955 && HWI_COMPUTABLE_MODE_P (to_mode))
4956 FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
4958 scalar_mode fmode = fmode_iter.require ();
4959 if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
4960 0, &must_trunc)
4961 && (!DECIMAL_FLOAT_MODE_P (fmode)
4962 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
4964 int bitsize;
4965 REAL_VALUE_TYPE offset;
4966 rtx limit;
4967 rtx_code_label *lab1, *lab2;
4968 rtx_insn *insn;
4970 bitsize = GET_MODE_PRECISION (to_mode);
4971 real_2expN (&offset, bitsize - 1, fmode);
4972 limit = const_double_from_real_value (offset, fmode);
4973 lab1 = gen_label_rtx ();
4974 lab2 = gen_label_rtx ();
4976 if (fmode != GET_MODE (from))
4977 from = convert_to_mode (fmode, from, 0);
4979 /* See if we need to do the subtraction. */
4980 do_pending_stack_adjust ();
4981 emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
4982 GET_MODE (from), 0, lab1);
4984 /* If not, do the signed "fix" and branch around fixup code. */
4985 expand_fix (to, from, 0);
4986 emit_jump_insn (targetm.gen_jump (lab2));
4987 emit_barrier ();
4989 /* Otherwise, subtract 2**(N-1), convert to signed number,
4990 then add 2**(N-1). Do the addition using XOR since this
4991 will often generate better code. */
4992 emit_label (lab1);
4993 target = expand_binop (GET_MODE (from), sub_optab, from, limit,
4994 NULL_RTX, 0, OPTAB_LIB_WIDEN);
4995 expand_fix (to, target, 0);
4996 target = expand_binop (to_mode, xor_optab, to,
4997 gen_int_mode
4998 (HOST_WIDE_INT_1 << (bitsize - 1),
4999 to_mode),
5000 to, 1, OPTAB_LIB_WIDEN);
5002 if (target != to)
5003 emit_move_insn (to, target);
5005 emit_label (lab2);
5007 if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5009 /* Make a place for a REG_NOTE and add it. */
5010 insn = emit_move_insn (to, to);
5011 set_dst_reg_note (insn, REG_EQUAL,
5012 gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5013 copy_rtx (from)),
5014 to);
5017 return;
5021 /* We can't do it with an insn, so use a library call. But first ensure
5022 that the mode of TO is at least as wide as SImode, since those are the
5023 only library calls we know about. */
5025 if (is_narrower_int_mode (GET_MODE (to), SImode))
5027 target = gen_reg_rtx (SImode);
5029 expand_fix (target, from, unsignedp);
5031 else
5033 rtx_insn *insns;
5034 rtx value;
5035 rtx libfunc;
5037 convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5038 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5039 gcc_assert (libfunc);
5041 start_sequence ();
5043 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5044 GET_MODE (to), from, GET_MODE (from));
5045 insns = get_insns ();
5046 end_sequence ();
5048 emit_libcall_block (insns, target, value,
5049 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5050 GET_MODE (to), from));
5053 if (target != to)
5055 if (GET_MODE (to) == GET_MODE (target))
5056 emit_move_insn (to, target);
5057 else
5058 convert_move (to, target, 0);
5063 /* Promote integer arguments for a libcall if necessary.
5064 emit_library_call_value cannot do the promotion because it does not
5065 know if it should do a signed or unsigned promotion. This is because
5066 there are no tree types defined for libcalls. */
5068 static rtx
5069 prepare_libcall_arg (rtx arg, int uintp)
5071 scalar_int_mode mode;
5072 machine_mode arg_mode;
5073 if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5075 /* If we need to promote the integer function argument we need to do
5076 it here instead of inside emit_library_call_value because in
5077 emit_library_call_value we don't know if we should do a signed or
5078 unsigned promotion. */
5080 int unsigned_p = 0;
5081 arg_mode = promote_function_mode (NULL_TREE, mode,
5082 &unsigned_p, NULL_TREE, 0);
5083 if (arg_mode != mode)
5084 return convert_to_mode (arg_mode, arg, uintp);
5086 return arg;
5089 /* Generate code to convert FROM to TO, where at least one of the two has a fixed-point mode.
5090 If UINTP is true, either TO or FROM is an unsigned integer.
5091 If SATP is true, we need to saturate the result. */
5093 void
5094 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5096 machine_mode to_mode = GET_MODE (to);
5097 machine_mode from_mode = GET_MODE (from);
5098 convert_optab tab;
5099 enum rtx_code this_code;
5100 enum insn_code code;
5101 rtx_insn *insns;
5102 rtx value;
5103 rtx libfunc;
5105 if (to_mode == from_mode)
5107 emit_move_insn (to, from);
5108 return;
5111 if (uintp)
5113 tab = satp ? satfractuns_optab : fractuns_optab;
5114 this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5116 else
5118 tab = satp ? satfract_optab : fract_optab;
5119 this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5121 code = convert_optab_handler (tab, to_mode, from_mode);
5122 if (code != CODE_FOR_nothing)
5124 emit_unop_insn (code, to, from, this_code);
5125 return;
5128 libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5129 gcc_assert (libfunc);
5131 from = prepare_libcall_arg (from, uintp);
5132 from_mode = GET_MODE (from);
5134 start_sequence ();
5135 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5136 from, from_mode);
5137 insns = get_insns ();
5138 end_sequence ();
5140 emit_libcall_block (insns, to, value,
5141 gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5144 /* Generate code to convert FROM to fixed point and store in TO. FROM
5145 must be floating point, TO must be signed. Use the conversion optab
5146 TAB to do the conversion. */
5148 bool
5149 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5151 enum insn_code icode;
5152 rtx target = to;
5153 machine_mode fmode, imode;
5155 /* We first try to find a pair of modes, one real and one integer, at
5156 least as wide as FROM and TO, respectively, in which we can open-code
5157 this conversion. If the integer mode is wider than the mode of TO,
5158 we can do the conversion either signed or unsigned. */
5160 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5161 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5163 icode = convert_optab_handler (tab, imode, fmode);
5164 if (icode != CODE_FOR_nothing)
5166 rtx_insn *last = get_last_insn ();
5167 if (fmode != GET_MODE (from))
5168 from = convert_to_mode (fmode, from, 0);
5170 if (imode != GET_MODE (to))
5171 target = gen_reg_rtx (imode);
5173 if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5175 delete_insns_since (last);
5176 continue;
5178 if (target != to)
5179 convert_move (to, target, 0);
5180 return true;
5184 return false;
5187 /* Report whether we have an instruction to perform the operation
5188 specified by CODE on operands of mode MODE. */
5190 have_insn_for (enum rtx_code code, machine_mode mode)
5192 return (code_to_optab (code)
5193 && (optab_handler (code_to_optab (code), mode)
5194 != CODE_FOR_nothing));
5197 /* Print information about the current contents of the optabs on
5198 STDERR. */
5200 DEBUG_FUNCTION void
5201 debug_optab_libfuncs (void)
5203 int i, j, k;
5205 /* Dump the arithmetic optabs. */
5206 for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5207 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5209 rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5210 if (l)
5212 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5213 fprintf (stderr, "%s\t%s:\t%s\n",
5214 GET_RTX_NAME (optab_to_code ((optab) i)),
5215 GET_MODE_NAME (j),
5216 XSTR (l, 0));
5220 /* Dump the conversion optabs. */
5221 for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5222 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5223 for (k = 0; k < NUM_MACHINE_MODES; ++k)
5225 rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5226 (machine_mode) k);
5227 if (l)
5229 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5230 fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5231 GET_RTX_NAME (optab_to_code ((optab) i)),
5232 GET_MODE_NAME (j),
5233 GET_MODE_NAME (k),
5234 XSTR (l, 0));
5239 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5240 CODE. Return 0 on failure. */
5242 rtx_insn *
5243 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5245 machine_mode mode = GET_MODE (op1);
5246 enum insn_code icode;
5247 rtx_insn *insn;
5248 rtx trap_rtx;
5250 if (mode == VOIDmode)
5251 return 0;
5253 icode = optab_handler (ctrap_optab, mode);
5254 if (icode == CODE_FOR_nothing)
5255 return 0;
5257 /* Some targets only accept a zero trap code. */
5258 if (!insn_operand_matches (icode, 3, tcode))
5259 return 0;
5261 do_pending_stack_adjust ();
5262 start_sequence ();
5263 prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5264 &trap_rtx, &mode);
5265 if (!trap_rtx)
5266 insn = NULL;
5267 else
5268 insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5269 tcode);
5271 /* If that failed, then give up. */
5272 if (insn == 0)
5274 end_sequence ();
5275 return 0;
5278 emit_insn (insn);
5279 insn = get_insns ();
5280 end_sequence ();
5281 return insn;
5284 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5285 or unsigned operation code. */
5287 enum rtx_code
5288 get_rtx_code (enum tree_code tcode, bool unsignedp)
5290 enum rtx_code code;
5291 switch (tcode)
5293 case EQ_EXPR:
5294 code = EQ;
5295 break;
5296 case NE_EXPR:
5297 code = NE;
5298 break;
5299 case LT_EXPR:
5300 code = unsignedp ? LTU : LT;
5301 break;
5302 case LE_EXPR:
5303 code = unsignedp ? LEU : LE;
5304 break;
5305 case GT_EXPR:
5306 code = unsignedp ? GTU : GT;
5307 break;
5308 case GE_EXPR:
5309 code = unsignedp ? GEU : GE;
5310 break;
5312 case UNORDERED_EXPR:
5313 code = UNORDERED;
5314 break;
5315 case ORDERED_EXPR:
5316 code = ORDERED;
5317 break;
5318 case UNLT_EXPR:
5319 code = UNLT;
5320 break;
5321 case UNLE_EXPR:
5322 code = UNLE;
5323 break;
5324 case UNGT_EXPR:
5325 code = UNGT;
5326 break;
5327 case UNGE_EXPR:
5328 code = UNGE;
5329 break;
5330 case UNEQ_EXPR:
5331 code = UNEQ;
5332 break;
5333 case LTGT_EXPR:
5334 code = LTGT;
5335 break;
5337 case BIT_AND_EXPR:
5338 code = AND;
5339 break;
5341 case BIT_IOR_EXPR:
5342 code = IOR;
5343 break;
5345 default:
5346 gcc_unreachable ();
5348 return code;
5351 /* Return a comparison rtx of mode CMP_MODE for the tree comparison TCODE applied to T_OP0 and T_OP1. Use UNSIGNEDP to
5352 select signed or unsigned operators. OPNO holds the index of the
5353 first comparison operand for insn ICODE. Do not generate the
5354 compare instruction itself. */
5356 static rtx
5357 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5358 tree t_op0, tree t_op1, bool unsignedp,
5359 enum insn_code icode, unsigned int opno)
5361 struct expand_operand ops[2];
5362 rtx rtx_op0, rtx_op1;
5363 machine_mode m0, m1;
5364 enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5366 gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5368 /* Expand operands. For vector types with scalar modes, e.g. where int64x1_t
5369 has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5370 cases, use the original mode. */
5371 rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5372 EXPAND_STACK_PARM);
5373 m0 = GET_MODE (rtx_op0);
5374 if (m0 == VOIDmode)
5375 m0 = TYPE_MODE (TREE_TYPE (t_op0));
5377 rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5378 EXPAND_STACK_PARM);
5379 m1 = GET_MODE (rtx_op1);
5380 if (m1 == VOIDmode)
5381 m1 = TYPE_MODE (TREE_TYPE (t_op1));
5383 create_input_operand (&ops[0], rtx_op0, m0);
5384 create_input_operand (&ops[1], rtx_op1, m1);
5385 if (!maybe_legitimize_operands (icode, opno, 2, ops))
5386 gcc_unreachable ();
5387 return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5390 /* Check if vec_perm mask SEL is a constant equivalent to a shift of
5391 the first vec_perm operand, assuming the second operand is a constant
5392 vector of zeros. Return the shift distance in bits if so, or NULL_RTX
5393 if the vec_perm is not a shift. MODE is the mode of the value being
5394 shifted. */
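/* For example, with MODE == V4SImode and SEL { 1, 2, 3, 4 } (indices 4..7
   refer to the zero vector), the permutation selects elements 1..3 of the
   first operand followed by one zero element, i.e. a shift by one 32-bit
   element, so the function returns a shift amount of 32 bits.  */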
5395 static rtx
5396 shift_amt_for_vec_perm_mask (machine_mode mode, const vec_perm_indices &sel)
5398 unsigned int nelt = GET_MODE_NUNITS (mode);
5399 unsigned int bitsize = GET_MODE_UNIT_BITSIZE (mode);
5400 unsigned int first = sel[0];
5401 if (first >= nelt)
5402 return NULL_RTX;
5404 if (!sel.series_p (0, 1, first, 1))
5405 for (unsigned int i = 1; i < nelt; i++)
5407 unsigned int expected = i + first;
5408 /* Indices into the second vector are all equivalent. */
5409 if (MIN (nelt, sel[i]) != MIN (nelt, expected))
5410 return NULL_RTX;
5413 return gen_int_shift_amount (mode, first * bitsize);
5416 /* A subroutine of expand_vec_perm_var for expanding one vec_perm insn. */
5418 static rtx
5419 expand_vec_perm_1 (enum insn_code icode, rtx target,
5420 rtx v0, rtx v1, rtx sel)
5422 machine_mode tmode = GET_MODE (target);
5423 machine_mode smode = GET_MODE (sel);
5424 struct expand_operand ops[4];
5426 gcc_assert (GET_MODE_CLASS (smode) == MODE_VECTOR_INT
5427 || mode_for_int_vector (tmode).require () == smode);
5428 create_output_operand (&ops[0], target, tmode);
5429 create_input_operand (&ops[3], sel, smode);
5431 /* Make an effort to preserve v0 == v1. The target expander is able to
5432 rely on this to determine if we're permuting a single input operand. */
5433 if (rtx_equal_p (v0, v1))
5435 if (!insn_operand_matches (icode, 1, v0))
5436 v0 = force_reg (tmode, v0);
5437 gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5438 gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5440 create_fixed_operand (&ops[1], v0);
5441 create_fixed_operand (&ops[2], v0);
5443 else
5445 create_input_operand (&ops[1], v0, tmode);
5446 create_input_operand (&ops[2], v1, tmode);
5449 if (maybe_expand_insn (icode, 4, ops))
5450 return ops[0].value;
5451 return NULL_RTX;
5454 /* Implement a permutation of vectors v0 and v1 using the permutation
5455 vector in SEL and return the result. Use TARGET to hold the result
5456 if nonnull and convenient.
5458 MODE is the mode of the vectors being permuted (V0 and V1). SEL_MODE
5459 is the TYPE_MODE associated with SEL, or BLKmode if SEL isn't known
5460 to have a particular mode. */
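/* For instance, with MODE == V4SImode a SEL of { 0, 4, 1, 5 } (indices 4..7
   selecting from V1) interleaves the low halves of V0 and V1, giving
   { V0[0], V1[0], V0[1], V1[1] }.  */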
5463 expand_vec_perm_const (machine_mode mode, rtx v0, rtx v1,
5464 const vec_perm_builder &sel, machine_mode sel_mode,
5465 rtx target)
5467 if (!target || !register_operand (target, mode))
5468 target = gen_reg_rtx (mode);
5470 /* Set QIMODE to a different vector mode with byte elements.
5471 If no such mode, or if MODE already has byte elements, use VOIDmode. */
5472 machine_mode qimode;
5473 if (!qimode_for_vec_perm (mode).exists (&qimode))
5474 qimode = VOIDmode;
5476 rtx_insn *last = get_last_insn ();
5478 bool single_arg_p = rtx_equal_p (v0, v1);
5479 /* Always specify two input vectors here and leave the target to handle
5480 cases in which the inputs are equal. Not all backends can cope with
5481 the single-input representation when testing for a double-input
5482 target instruction. */
5483 vec_perm_indices indices (sel, 2, GET_MODE_NUNITS (mode));
5485 /* See if this can be handled with a vec_shr. We only do this if the
5486 second vector is all zeroes. */
5487 insn_code shift_code = optab_handler (vec_shr_optab, mode);
5488 insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5489 ? optab_handler (vec_shr_optab, qimode)
5490 : CODE_FOR_nothing);
5492 if (v1 == CONST0_RTX (GET_MODE (v1))
5493 && (shift_code != CODE_FOR_nothing
5494 || shift_code_qi != CODE_FOR_nothing))
5496 rtx shift_amt = shift_amt_for_vec_perm_mask (mode, indices);
5497 if (shift_amt)
5499 struct expand_operand ops[3];
5500 if (shift_code != CODE_FOR_nothing)
5502 create_output_operand (&ops[0], target, mode);
5503 create_input_operand (&ops[1], v0, mode);
5504 create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5505 if (maybe_expand_insn (shift_code, 3, ops))
5506 return ops[0].value;
5508 if (shift_code_qi != CODE_FOR_nothing)
5510 rtx tmp = gen_reg_rtx (qimode);
5511 create_output_operand (&ops[0], tmp, qimode);
5512 create_input_operand (&ops[1], gen_lowpart (qimode, v0), qimode);
5513 create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5514 if (maybe_expand_insn (shift_code_qi, 3, ops))
5515 return gen_lowpart (mode, ops[0].value);
5520 if (targetm.vectorize.vec_perm_const != NULL)
5522 v0 = force_reg (mode, v0);
5523 if (single_arg_p)
5524 v1 = v0;
5525 else
5526 v1 = force_reg (mode, v1);
5528 if (targetm.vectorize.vec_perm_const (mode, target, v0, v1, indices))
5529 return target;
5532 /* Fall back to a constant byte-based permutation. */
5533 vec_perm_indices qimode_indices;
5534 rtx target_qi = NULL_RTX, v0_qi = NULL_RTX, v1_qi = NULL_RTX;
5535 if (qimode != VOIDmode)
5537 qimode_indices.new_expanded_vector (indices, GET_MODE_UNIT_SIZE (mode));
5538 target_qi = gen_reg_rtx (qimode);
5539 v0_qi = gen_lowpart (qimode, v0);
5540 v1_qi = gen_lowpart (qimode, v1);
5541 if (targetm.vectorize.vec_perm_const != NULL
5542 && targetm.vectorize.vec_perm_const (qimode, target_qi, v0_qi,
5543 v1_qi, qimode_indices))
5544 return gen_lowpart (mode, target_qi);
5547 /* Otherwise expand as a fully variable permutation. */
5549 /* The optabs are only defined for selectors with the same width
5550 as the values being permuted. */
5551 machine_mode required_sel_mode;
5552 if (!mode_for_int_vector (mode).exists (&required_sel_mode)
5553 || !VECTOR_MODE_P (required_sel_mode))
5555 delete_insns_since (last);
5556 return NULL_RTX;
5559 /* We know that it is semantically valid to treat SEL as having SEL_MODE.
5560 If that isn't the mode we want then we need to prove that using
5561 REQUIRED_SEL_MODE is OK. */
5562 if (sel_mode != required_sel_mode)
5564 if (!selector_fits_mode_p (required_sel_mode, indices))
5566 delete_insns_since (last);
5567 return NULL_RTX;
5569 sel_mode = required_sel_mode;
5572 insn_code icode = direct_optab_handler (vec_perm_optab, mode);
5573 if (icode != CODE_FOR_nothing)
5575 rtx sel_rtx = vec_perm_indices_to_rtx (sel_mode, indices);
5576 rtx tmp = expand_vec_perm_1 (icode, target, v0, v1, sel_rtx);
5577 if (tmp)
5578 return tmp;
5581 if (qimode != VOIDmode
5582 && selector_fits_mode_p (qimode, qimode_indices))
5584 icode = direct_optab_handler (vec_perm_optab, qimode);
5585 if (icode != CODE_FOR_nothing)
5587 rtx sel_qi = vec_perm_indices_to_rtx (qimode, qimode_indices);
5588 rtx tmp = expand_vec_perm_1 (icode, target_qi, v0_qi, v1_qi, sel_qi);
5589 if (tmp)
5590 return gen_lowpart (mode, tmp);
5594 delete_insns_since (last);
5595 return NULL_RTX;
5598 /* Implement a permutation of vectors v0 and v1 using the permutation
5599 vector in SEL and return the result. Use TARGET to hold the result
5600 if nonnull and convenient.
5602 MODE is the mode of the vectors being permuted (V0 and V1).
5603 SEL must have the integer equivalent of MODE and is known to be
5604 unsuitable for permutes with a constant permutation vector. */
5607 expand_vec_perm_var (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5609 enum insn_code icode;
5610 unsigned int i, w, u;
5611 rtx tmp, sel_qi;
5612 rtvec vec;
5614 w = GET_MODE_SIZE (mode);
5615 u = GET_MODE_UNIT_SIZE (mode);
5617 if (!target || GET_MODE (target) != mode)
5618 target = gen_reg_rtx (mode);
5620 icode = direct_optab_handler (vec_perm_optab, mode);
5621 if (icode != CODE_FOR_nothing)
5623 tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5624 if (tmp)
5625 return tmp;
5628 /* As a special case to aid several targets, lower the element-based
5629 permutation to a byte-based permutation and try again. */
5630 machine_mode qimode;
5631 if (!qimode_for_vec_perm (mode).exists (&qimode)
5632 || GET_MODE_NUNITS (qimode) > GET_MODE_MASK (QImode) + 1)
5633 return NULL_RTX;
5634 icode = direct_optab_handler (vec_perm_optab, qimode);
5635 if (icode == CODE_FOR_nothing)
5636 return NULL_RTX;
5638 /* Multiply each element by its byte size. */
5639 machine_mode selmode = GET_MODE (sel);
5640 if (u == 2)
5641 sel = expand_simple_binop (selmode, PLUS, sel, sel,
5642 NULL, 0, OPTAB_DIRECT);
5643 else
5644 sel = expand_simple_binop (selmode, ASHIFT, sel,
5645 gen_int_shift_amount (selmode, exact_log2 (u)),
5646 NULL, 0, OPTAB_DIRECT);
5647 gcc_assert (sel != NULL);
5649   /* Broadcast the low byte of each element into each of its bytes.
5650 The encoding has U interleaved stepped patterns, one for each
5651 byte of an element. */
5652 vec_perm_builder const_sel (w, u, 3);
5653 unsigned int low_byte_in_u = BYTES_BIG_ENDIAN ? u - 1 : 0;
5654 for (i = 0; i < 3; ++i)
5655 for (unsigned int j = 0; j < u; ++j)
5656 const_sel.quick_push (i * u + low_byte_in_u);
5657 sel = gen_lowpart (qimode, sel);
5658 sel = expand_vec_perm_const (qimode, sel, sel, const_sel, qimode, NULL);
5659 gcc_assert (sel != NULL);
5661 /* Add the byte offset to each byte element. */
5662   /* Note that the definition of the indices here is memory ordering,
5663 so there should be no difference between big and little endian. */
5664 vec = rtvec_alloc (w);
5665 for (i = 0; i < w; ++i)
5666 RTVEC_ELT (vec, i) = GEN_INT (i % u);
5667 tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5668 sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5669 sel, 0, OPTAB_DIRECT);
5670 gcc_assert (sel_qi != NULL);
5672 tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5673 tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5674 gen_lowpart (qimode, v1), sel_qi);
5675 if (tmp)
5676 tmp = gen_lowpart (mode, tmp);
5677 return tmp;
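/* For illustration only (a hypothetical example, not part of the original
   code): consider a little-endian V4HImode permute, so w = 8 and u = 2,
   with a variable selector whose runtime value happens to be {1, 0, 3, 2}.
   The lowering above transforms the selector as follows:

     scale by u = 2:           {2, 0, 6, 4}
     broadcast each low byte:  {2, 2, 0, 0, 6, 6, 4, 4}
     add byte offsets i % u:   {2, 3, 0, 1, 6, 7, 4, 5}

   which is the equivalent whole-element permutation expressed in QImode.  */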
5680 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5681 three operands. */
5684 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5685 rtx target)
5687 struct expand_operand ops[4];
5688 machine_mode mode = TYPE_MODE (vec_cond_type);
5689 machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5690 enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5691 rtx mask, rtx_op1, rtx_op2;
5693 if (icode == CODE_FOR_nothing)
5694 return 0;
5696 mask = expand_normal (op0);
5697 rtx_op1 = expand_normal (op1);
5698 rtx_op2 = expand_normal (op2);
5700 mask = force_reg (mask_mode, mask);
5701 rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5703 create_output_operand (&ops[0], target, mode);
5704 create_input_operand (&ops[1], rtx_op1, mode);
5705 create_input_operand (&ops[2], rtx_op2, mode);
5706 create_input_operand (&ops[3], mask, mask_mode);
5707 expand_insn (icode, 4, ops);
5709 return ops[0].value;
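/* For illustration, a sketch of the mapping performed above, assuming the
   target provides a vcond_mask pattern for the relevant modes: a source
   form such as

     r = VEC_COND_EXPR <mask, a, b>;

   becomes the four-operand expansion (r, a, b, mask), with the mask and
   the first value operand forced into registers first.  */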
5712 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5713 three operands. */
5716 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5717 rtx target)
5719 struct expand_operand ops[6];
5720 enum insn_code icode;
5721 rtx comparison, rtx_op1, rtx_op2;
5722 machine_mode mode = TYPE_MODE (vec_cond_type);
5723 machine_mode cmp_op_mode;
5724 bool unsignedp;
5725 tree op0a, op0b;
5726 enum tree_code tcode;
5728 if (COMPARISON_CLASS_P (op0))
5730 op0a = TREE_OPERAND (op0, 0);
5731 op0b = TREE_OPERAND (op0, 1);
5732 tcode = TREE_CODE (op0);
5734 else
5736 gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5737 if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5738 != CODE_FOR_nothing)
5739 return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5740 op2, target);
5741 /* Fake op0 < 0. */
5742 else
5744 gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5745 == MODE_VECTOR_INT);
5746 op0a = op0;
5747 op0b = build_zero_cst (TREE_TYPE (op0));
5748 tcode = LT_EXPR;
5751 cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5752 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5755 gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
5756 && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
5758 icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5759 if (icode == CODE_FOR_nothing)
5761 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5762 icode = get_vcond_eq_icode (mode, cmp_op_mode);
5763 if (icode == CODE_FOR_nothing)
5764 return 0;
5767 comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5768 icode, 4);
5769 rtx_op1 = expand_normal (op1);
5770 rtx_op2 = expand_normal (op2);
5772 create_output_operand (&ops[0], target, mode);
5773 create_input_operand (&ops[1], rtx_op1, mode);
5774 create_input_operand (&ops[2], rtx_op2, mode);
5775 create_fixed_operand (&ops[3], comparison);
5776 create_fixed_operand (&ops[4], XEXP (comparison, 0));
5777 create_fixed_operand (&ops[5], XEXP (comparison, 1));
5778 expand_insn (icode, 6, ops);
5779 return ops[0].value;
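/* For illustration (hypothetical source form): a condition that is itself
   a comparison, e.g.

     r = VEC_COND_EXPR <a < b, x, y>;

   is expanded through the six-operand vcond pattern built above: the
   result, the two value operands, and the comparison rtx together with
   its two arguments.  */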
5782 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
5783 Use TARGET for the result if nonnull and convenient. */
5786 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
5788 struct expand_operand ops[3];
5789 enum insn_code icode;
5790 machine_mode emode = GET_MODE_INNER (vmode);
5792 icode = direct_optab_handler (vec_series_optab, vmode);
5793 gcc_assert (icode != CODE_FOR_nothing);
5795 create_output_operand (&ops[0], target, vmode);
5796 create_input_operand (&ops[1], op0, emode);
5797 create_input_operand (&ops[2], op1, emode);
5799 expand_insn (icode, 3, ops);
5800 return ops[0].value;
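/* For example, VEC_SERIES_EXPR <OP0, OP1> denotes the linear series
   { OP0, OP0 + OP1, OP0 + 2 * OP1, ... }, so VEC_SERIES_EXPR <0, 1>
   yields the index vector { 0, 1, 2, ... }.  */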
5803 /* Generate insns for a vector comparison into a mask. */
5806 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5808 struct expand_operand ops[4];
5809 enum insn_code icode;
5810 rtx comparison;
5811 machine_mode mask_mode = TYPE_MODE (type);
5812 machine_mode vmode;
5813 bool unsignedp;
5814 tree op0a, op0b;
5815 enum tree_code tcode;
5817 op0a = TREE_OPERAND (exp, 0);
5818 op0b = TREE_OPERAND (exp, 1);
5819 tcode = TREE_CODE (exp);
5821 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5822 vmode = TYPE_MODE (TREE_TYPE (op0a));
5824 icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5825 if (icode == CODE_FOR_nothing)
5827 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5828 icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5829 if (icode == CODE_FOR_nothing)
5830 return 0;
5833 comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5834 unsignedp, icode, 2);
5835 create_output_operand (&ops[0], target, mask_mode);
5836 create_fixed_operand (&ops[1], comparison);
5837 create_fixed_operand (&ops[2], XEXP (comparison, 0));
5838 create_fixed_operand (&ops[3], XEXP (comparison, 1));
5839 expand_insn (icode, 4, ops);
5840 return ops[0].value;
5843 /* Expand a highpart multiply. */
5846 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5847 rtx target, bool uns_p)
5849 struct expand_operand eops[3];
5850 enum insn_code icode;
5851 int method, i, nunits;
5852 machine_mode wmode;
5853 rtx m1, m2;
5854 optab tab1, tab2;
5856 method = can_mult_highpart_p (mode, uns_p);
5857 switch (method)
5859 case 0:
5860 return NULL_RTX;
5861 case 1:
5862 tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5863 return expand_binop (mode, tab1, op0, op1, target, uns_p,
5864 OPTAB_LIB_WIDEN);
5865 case 2:
5866 tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5867 tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5868 break;
5869 case 3:
5870 tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5871 tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5872 if (BYTES_BIG_ENDIAN)
5873 std::swap (tab1, tab2);
5874 break;
5875 default:
5876 gcc_unreachable ();
5879 icode = optab_handler (tab1, mode);
5880 nunits = GET_MODE_NUNITS (mode);
5881 wmode = insn_data[icode].operand[0].mode;
5882 gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
5883 gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
5885 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5886 create_input_operand (&eops[1], op0, mode);
5887 create_input_operand (&eops[2], op1, mode);
5888 expand_insn (icode, 3, eops);
5889 m1 = gen_lowpart (mode, eops[0].value);
5891 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5892 create_input_operand (&eops[1], op0, mode);
5893 create_input_operand (&eops[2], op1, mode);
5894 expand_insn (optab_handler (tab2, mode), 3, eops);
5895 m2 = gen_lowpart (mode, eops[0].value);
5897 vec_perm_builder sel;
5898 if (method == 2)
5900 /* The encoding has 2 interleaved stepped patterns. */
5901 sel.new_vector (nunits, 2, 3);
5902 for (i = 0; i < 6; ++i)
5903 sel.quick_push (!BYTES_BIG_ENDIAN + (i & ~1)
5904 + ((i & 1) ? nunits : 0));
5906 else
5908 /* The encoding has a single interleaved stepped pattern. */
5909 sel.new_vector (nunits, 1, 3);
5910 for (i = 0; i < 3; ++i)
5911 sel.quick_push (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
5914 return expand_vec_perm_const (mode, m1, m2, sel, BLKmode, target);
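/* For illustration only (assuming little-endian V4SImode and method 2):
   the even and odd widening multiplies leave the high halves of the
   products in the odd SImode positions of M1 and M2, so the selector
   built above is { 1, 5, 3, 7 } on the concatenation of M1 and M2 and
   gathers the four high parts into a single V4SImode result.  */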
5917 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5918 pattern. */
5920 static void
5921 find_cc_set (rtx x, const_rtx pat, void *data)
5923 if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5924 && GET_CODE (pat) == SET)
5926 rtx *p_cc_reg = (rtx *) data;
5927 gcc_assert (!*p_cc_reg);
5928 *p_cc_reg = x;
5932 /* This is a helper function for the other atomic operations. This function
5933 emits a loop that contains SEQ that iterates until a compare-and-swap
5934 operation at the end succeeds. MEM is the memory to be modified. SEQ is
5935 a set of instructions that takes a value from OLD_REG as an input and
5936 produces a value in NEW_REG as an output. Before SEQ, OLD_REG will be
5937 set to the current contents of MEM. After SEQ, a compare-and-swap will
5938 attempt to update MEM with NEW_REG. The function returns true when the
5939 loop was generated successfully. */
5941 static bool
5942 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5944 machine_mode mode = GET_MODE (mem);
5945 rtx_code_label *label;
5946 rtx cmp_reg, success, oldval;
5948 /* The loop we want to generate looks like
5950 cmp_reg = mem;
5951 label:
5952 old_reg = cmp_reg;
5953 seq;
5954 (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5955	if (!success)
5956 goto label;
5958 Note that we only do the plain load from memory once. Subsequent
5959 iterations use the value loaded by the compare-and-swap pattern. */
5961 label = gen_label_rtx ();
5962 cmp_reg = gen_reg_rtx (mode);
5964 emit_move_insn (cmp_reg, mem);
5965 emit_label (label);
5966 emit_move_insn (old_reg, cmp_reg);
5967 if (seq)
5968 emit_insn (seq);
5970 success = NULL_RTX;
5971 oldval = cmp_reg;
5972 if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
5973 new_reg, false, MEMMODEL_SYNC_SEQ_CST,
5974 MEMMODEL_RELAXED))
5975 return false;
5977 if (oldval != cmp_reg)
5978 emit_move_insn (cmp_reg, oldval);
5980 /* Mark this jump predicted not taken. */
5981 emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
5982 GET_MODE (success), 1, label,
5983 profile_probability::guessed_never ());
5984 return true;
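/* A usage sketch (hypothetical caller): to build an atomic OR from this
   loop, SEQ would contain the insns for

     new_reg = old_reg | val;

   so every iteration recomputes NEW_REG from the freshly observed value
   in OLD_REG before retrying the compare-and-swap.  */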
5988 /* This function tries to emit an atomic_exchange instruction.  VAL is written
5989 to *MEM using memory model MODEL. The previous contents of *MEM are returned,
5990 using TARGET if possible. */
5992 static rtx
5993 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
5995 machine_mode mode = GET_MODE (mem);
5996 enum insn_code icode;
5998 /* If the target supports the exchange directly, great. */
5999 icode = direct_optab_handler (atomic_exchange_optab, mode);
6000 if (icode != CODE_FOR_nothing)
6002 struct expand_operand ops[4];
6004 create_output_operand (&ops[0], target, mode);
6005 create_fixed_operand (&ops[1], mem);
6006 create_input_operand (&ops[2], val, mode);
6007 create_integer_operand (&ops[3], model);
6008 if (maybe_expand_insn (icode, 4, ops))
6009 return ops[0].value;
6012 return NULL_RTX;
6015 /* This function tries to implement an atomic exchange operation using
6016 __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
6017 The previous contents of *MEM are returned, using TARGET if possible.
6018    Since this instruction is an acquire barrier only, stronger memory
6019 models may require additional barriers to be emitted. */
6021 static rtx
6022 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
6023 enum memmodel model)
6025 machine_mode mode = GET_MODE (mem);
6026 enum insn_code icode;
6027 rtx_insn *last_insn = get_last_insn ();
6029 icode = optab_handler (sync_lock_test_and_set_optab, mode);
6031 /* Legacy sync_lock_test_and_set is an acquire barrier. If the pattern
6032 exists, and the memory model is stronger than acquire, add a release
6033 barrier before the instruction. */
6035 if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
6036 expand_mem_thread_fence (model);
6038 if (icode != CODE_FOR_nothing)
6040 struct expand_operand ops[3];
6041 create_output_operand (&ops[0], target, mode);
6042 create_fixed_operand (&ops[1], mem);
6043 create_input_operand (&ops[2], val, mode);
6044 if (maybe_expand_insn (icode, 3, ops))
6045 return ops[0].value;
6048 /* If an external test-and-set libcall is provided, use that instead of
6049 any external compare-and-swap that we might get from the compare-and-
6050 swap-loop expansion later. */
6051 if (!can_compare_and_swap_p (mode, false))
6053 rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
6054 if (libfunc != NULL)
6056 rtx addr;
6058 addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6059 return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6060 mode, addr, ptr_mode,
6061 val, mode);
6065 /* If the test_and_set can't be emitted, eliminate any barrier that might
6066 have been emitted. */
6067 delete_insns_since (last_insn);
6068 return NULL_RTX;
6071 /* This function tries to implement an atomic exchange operation using a
6072 compare_and_swap loop. VAL is written to *MEM. The previous contents of
6073 *MEM are returned, using TARGET if possible. No memory model is required
6074 since a compare_and_swap loop is seq-cst. */
6076 static rtx
6077 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6079 machine_mode mode = GET_MODE (mem);
6081 if (can_compare_and_swap_p (mode, true))
6083 if (!target || !register_operand (target, mode))
6084 target = gen_reg_rtx (mode);
6085 if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6086 return target;
6089 return NULL_RTX;
6092 /* This function tries to implement an atomic test-and-set operation
6093 using the atomic_test_and_set instruction pattern. A boolean value
6094 is returned from the operation, using TARGET if possible. */
6096 static rtx
6097 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6099 machine_mode pat_bool_mode;
6100 struct expand_operand ops[3];
6102 if (!targetm.have_atomic_test_and_set ())
6103 return NULL_RTX;
6105 /* While we always get QImode from __atomic_test_and_set, we get
6106 other memory modes from __sync_lock_test_and_set. Note that we
6107 use no endian adjustment here. This matches the 4.6 behavior
6108 in the Sparc backend. */
6109 enum insn_code icode = targetm.code_for_atomic_test_and_set;
6110 gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6111 if (GET_MODE (mem) != QImode)
6112 mem = adjust_address_nv (mem, QImode, 0);
6114 pat_bool_mode = insn_data[icode].operand[0].mode;
6115 create_output_operand (&ops[0], target, pat_bool_mode);
6116 create_fixed_operand (&ops[1], mem);
6117 create_integer_operand (&ops[2], model);
6119 if (maybe_expand_insn (icode, 3, ops))
6120 return ops[0].value;
6121 return NULL_RTX;
6124 /* This function expands the legacy __sync_lock_test_and_set operation, which is
6125 generally an atomic exchange. Some limited targets only allow the
6126 constant 1 to be stored. This is an ACQUIRE operation.
6128 TARGET is an optional place to stick the return value.
6129 MEM is where VAL is stored. */
6132 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6134 rtx ret;
6136 /* Try an atomic_exchange first. */
6137 ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6138 if (ret)
6139 return ret;
6141 ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6142 MEMMODEL_SYNC_ACQUIRE);
6143 if (ret)
6144 return ret;
6146 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6147 if (ret)
6148 return ret;
6150 /* If there are no other options, try atomic_test_and_set if the value
6151 being stored is 1. */
6152 if (val == const1_rtx)
6153 ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6155 return ret;
6158 /* This function expands the atomic test_and_set operation:
6159 atomically store a boolean TRUE into MEM and return the previous value.
6161 MEMMODEL is the memory model variant to use.
6162 TARGET is an optional place to stick the return value. */
6165 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6167 machine_mode mode = GET_MODE (mem);
6168 rtx ret, trueval, subtarget;
6170 ret = maybe_emit_atomic_test_and_set (target, mem, model);
6171 if (ret)
6172 return ret;
6174 /* Be binary compatible with non-default settings of trueval, and different
6175      CPU revisions.  E.g., one revision may have atomic-test-and-set, but
6176 another only has atomic-exchange. */
6177 if (targetm.atomic_test_and_set_trueval == 1)
6179 trueval = const1_rtx;
6180 subtarget = target ? target : gen_reg_rtx (mode);
6182 else
6184 trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6185 subtarget = gen_reg_rtx (mode);
6188 /* Try the atomic-exchange optab... */
6189 ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6191 /* ... then an atomic-compare-and-swap loop ... */
6192 if (!ret)
6193 ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6195 /* ... before trying the vaguely defined legacy lock_test_and_set. */
6196 if (!ret)
6197 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6199 /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6200 things with the value 1. Thus we try again without trueval. */
6201 if (!ret && targetm.atomic_test_and_set_trueval != 1)
6202 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6204   /* Failing all else, assume a single-threaded environment and simply
6205 perform the operation. */
6206 if (!ret)
6208 /* If the result is ignored skip the move to target. */
6209 if (subtarget != const0_rtx)
6210 emit_move_insn (subtarget, mem);
6212 emit_move_insn (mem, trueval);
6213 ret = subtarget;
6216   /* Recall that we have to return a boolean value; rectify if trueval
6217 is not exactly one. */
6218 if (targetm.atomic_test_and_set_trueval != 1)
6219 ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6221 return ret;
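/* For example (target-specific behavior): on SPARC the ldstub instruction
   stores 0xff, so atomic_test_and_set_trueval is not 1 and the
   emit_store_flag_force call above normalizes the result to the boolean
   RET != 0.  */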
6224 /* This function expands the atomic exchange operation:
6225 atomically store VAL in MEM and return the previous value in MEM.
6227 MEMMODEL is the memory model variant to use.
6228 TARGET is an optional place to stick the return value. */
6231 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6233 machine_mode mode = GET_MODE (mem);
6234 rtx ret;
6236 /* If loads are not atomic for the required size and we are not called to
6237 provide a __sync builtin, do not do anything so that we stay consistent
6238 with atomic loads of the same size. */
6239 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6240 return NULL_RTX;
6242 ret = maybe_emit_atomic_exchange (target, mem, val, model);
6244 /* Next try a compare-and-swap loop for the exchange. */
6245 if (!ret)
6246 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6248 return ret;
6251 /* This function expands the atomic compare exchange operation:
6253 *PTARGET_BOOL is an optional place to store the boolean success/failure.
6254 *PTARGET_OVAL is an optional place to store the old value from memory.
6255 Both target parameters may be NULL or const0_rtx to indicate that we do
6256 not care about that return value. Both target parameters are updated on
6257 success to the actual location of the corresponding result.
6259 MEMMODEL is the memory model variant to use.
6261 The return value of the function is true for success. */
6263 bool
6264 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6265 rtx mem, rtx expected, rtx desired,
6266 bool is_weak, enum memmodel succ_model,
6267 enum memmodel fail_model)
6269 machine_mode mode = GET_MODE (mem);
6270 struct expand_operand ops[8];
6271 enum insn_code icode;
6272 rtx target_oval, target_bool = NULL_RTX;
6273 rtx libfunc;
6275 /* If loads are not atomic for the required size and we are not called to
6276 provide a __sync builtin, do not do anything so that we stay consistent
6277 with atomic loads of the same size. */
6278 if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6279 return false;
6281 /* Load expected into a register for the compare and swap. */
6282 if (MEM_P (expected))
6283 expected = copy_to_reg (expected);
6285 /* Make sure we always have some place to put the return oldval.
6286 Further, make sure that place is distinct from the input expected,
6287 just in case we need that path down below. */
6288 if (ptarget_oval && *ptarget_oval == const0_rtx)
6289 ptarget_oval = NULL;
6291 if (ptarget_oval == NULL
6292 || (target_oval = *ptarget_oval) == NULL
6293 || reg_overlap_mentioned_p (expected, target_oval))
6294 target_oval = gen_reg_rtx (mode);
6296 icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6297 if (icode != CODE_FOR_nothing)
6299 machine_mode bool_mode = insn_data[icode].operand[0].mode;
6301 if (ptarget_bool && *ptarget_bool == const0_rtx)
6302 ptarget_bool = NULL;
6304 /* Make sure we always have a place for the bool operand. */
6305 if (ptarget_bool == NULL
6306 || (target_bool = *ptarget_bool) == NULL
6307 || GET_MODE (target_bool) != bool_mode)
6308 target_bool = gen_reg_rtx (bool_mode);
6310 /* Emit the compare_and_swap. */
6311 create_output_operand (&ops[0], target_bool, bool_mode);
6312 create_output_operand (&ops[1], target_oval, mode);
6313 create_fixed_operand (&ops[2], mem);
6314 create_input_operand (&ops[3], expected, mode);
6315 create_input_operand (&ops[4], desired, mode);
6316 create_integer_operand (&ops[5], is_weak);
6317 create_integer_operand (&ops[6], succ_model);
6318 create_integer_operand (&ops[7], fail_model);
6319 if (maybe_expand_insn (icode, 8, ops))
6321 /* Return success/failure. */
6322 target_bool = ops[0].value;
6323 target_oval = ops[1].value;
6324 goto success;
6328 /* Otherwise fall back to the original __sync_val_compare_and_swap
6329 which is always seq-cst. */
6330 icode = optab_handler (sync_compare_and_swap_optab, mode);
6331 if (icode != CODE_FOR_nothing)
6333 rtx cc_reg;
6335 create_output_operand (&ops[0], target_oval, mode);
6336 create_fixed_operand (&ops[1], mem);
6337 create_input_operand (&ops[2], expected, mode);
6338 create_input_operand (&ops[3], desired, mode);
6339 if (!maybe_expand_insn (icode, 4, ops))
6340 return false;
6342 target_oval = ops[0].value;
6344 /* If the caller isn't interested in the boolean return value,
6345 skip the computation of it. */
6346 if (ptarget_bool == NULL)
6347 goto success;
6349 /* Otherwise, work out if the compare-and-swap succeeded. */
6350 cc_reg = NULL_RTX;
6351 if (have_insn_for (COMPARE, CCmode))
6352 note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6353 if (cc_reg)
6355 target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6356 const0_rtx, VOIDmode, 0, 1);
6357 goto success;
6359 goto success_bool_from_val;
6362 /* Also check for library support for __sync_val_compare_and_swap. */
6363 libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6364 if (libfunc != NULL)
6366 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6367 rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6368 mode, addr, ptr_mode,
6369 expected, mode, desired, mode);
6370 emit_move_insn (target_oval, target);
6372 /* Compute the boolean return value only if requested. */
6373 if (ptarget_bool)
6374 goto success_bool_from_val;
6375 else
6376 goto success;
6379 /* Failure. */
6380 return false;
6382 success_bool_from_val:
6383 target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6384 expected, VOIDmode, 1, 1);
6385 success:
6386 /* Make sure that the oval output winds up where the caller asked. */
6387 if (ptarget_oval)
6388 *ptarget_oval = target_oval;
6389 if (ptarget_bool)
6390 *ptarget_bool = target_bool;
6391 return true;
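/* A usage sketch (hypothetical caller, simplified): the expansion of
   __atomic_compare_exchange_n roughly takes the form

     rtx bool_out = NULL_RTX, oval_out = NULL_RTX;
     if (expand_atomic_compare_and_swap (&bool_out, &oval_out, mem,
                                         expected, desired, weak,
                                         succ_model, fail_model))
       ... consume bool_out and oval_out ...

   where either output pointer may be null, or point to const0_rtx,
   when that result is unused.  */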
6394 /* Generate asm volatile("" : : : "memory") as the memory blockage. */
6396 static void
6397 expand_asm_memory_blockage (void)
6399 rtx asm_op, clob;
6401 asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6402 rtvec_alloc (0), rtvec_alloc (0),
6403 rtvec_alloc (0), UNKNOWN_LOCATION);
6404 MEM_VOLATILE_P (asm_op) = 1;
6406 clob = gen_rtx_SCRATCH (VOIDmode);
6407 clob = gen_rtx_MEM (BLKmode, clob);
6408 clob = gen_rtx_CLOBBER (VOIDmode, clob);
6410 emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6413 /* Do not propagate memory accesses across this point. */
6415 static void
6416 expand_memory_blockage (void)
6418 if (targetm.have_memory_blockage ())
6419 emit_insn (targetm.gen_memory_blockage ());
6420 else
6421 expand_asm_memory_blockage ();
6424 /* This routine will either emit the mem_thread_fence pattern or issue a
6425 sync_synchronize to generate a fence for memory model MEMMODEL. */
6427 void
6428 expand_mem_thread_fence (enum memmodel model)
6430 if (is_mm_relaxed (model))
6431 return;
6432 if (targetm.have_mem_thread_fence ())
6434 emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6435 expand_memory_blockage ();
6437 else if (targetm.have_memory_barrier ())
6438 emit_insn (targetm.gen_memory_barrier ());
6439 else if (synchronize_libfunc != NULL_RTX)
6440 emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
6441 else
6442 expand_memory_blockage ();
6445 /* Emit a signal fence with given memory model. */
6447 void
6448 expand_mem_signal_fence (enum memmodel model)
6450 /* No machine barrier is required to implement a signal fence, but
6451 a compiler memory barrier must be issued, except for relaxed MM. */
6452 if (!is_mm_relaxed (model))
6453 expand_memory_blockage ();
6456 /* This function expands the atomic load operation:
6457 return the atomically loaded value in MEM.
6459 MEMMODEL is the memory model variant to use.
6460    TARGET is an optional place to stick the return value.  */
6463 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6465 machine_mode mode = GET_MODE (mem);
6466 enum insn_code icode;
6468 /* If the target supports the load directly, great. */
6469 icode = direct_optab_handler (atomic_load_optab, mode);
6470 if (icode != CODE_FOR_nothing)
6472 struct expand_operand ops[3];
6473 rtx_insn *last = get_last_insn ();
6474 if (is_mm_seq_cst (model))
6475 expand_memory_blockage ();
6477 create_output_operand (&ops[0], target, mode);
6478 create_fixed_operand (&ops[1], mem);
6479 create_integer_operand (&ops[2], model);
6480 if (maybe_expand_insn (icode, 3, ops))
6482 if (!is_mm_relaxed (model))
6483 expand_memory_blockage ();
6484 return ops[0].value;
6486 delete_insns_since (last);
6489 /* If the size of the object is greater than word size on this target,
6490 then we assume that a load will not be atomic. We could try to
6491      emulate a load with a compare-and-swap operation, but the store that
6492      such an operation would perform could be incorrect if this is a
6493      volatile atomic load or the memory is mapped read-only.  */
6494 if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6495 /* If there is no atomic load, leave the library call. */
6496 return NULL_RTX;
6498 /* Otherwise assume loads are atomic, and emit the proper barriers. */
6499 if (!target || target == const0_rtx)
6500 target = gen_reg_rtx (mode);
6502 /* For SEQ_CST, emit a barrier before the load. */
6503 if (is_mm_seq_cst (model))
6504 expand_mem_thread_fence (model);
6506 emit_move_insn (target, mem);
6508 /* Emit the appropriate barrier after the load. */
6509 expand_mem_thread_fence (model);
6511 return target;
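/* To summarize the fallback above: for objects no wider than a word on a
   target without an atomic_load pattern, a MEMMODEL_SEQ_CST load is
   emitted, in effect, as

     fence; target = *mem; fence;

   while weaker models emit only the trailing barrier (which is a no-op
   for MEMMODEL_RELAXED).  */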
6514 /* This function expands the atomic store operation:
6515 Atomically store VAL in MEM.
6516 MEMMODEL is the memory model variant to use.
6517 USE_RELEASE is true if __sync_lock_release can be used as a fall back.
6518    The function returns const0_rtx if a pattern was emitted.  */
6521 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6523 machine_mode mode = GET_MODE (mem);
6524 enum insn_code icode;
6525 struct expand_operand ops[3];
6527 /* If the target supports the store directly, great. */
6528 icode = direct_optab_handler (atomic_store_optab, mode);
6529 if (icode != CODE_FOR_nothing)
6531 rtx_insn *last = get_last_insn ();
6532 if (!is_mm_relaxed (model))
6533 expand_memory_blockage ();
6534 create_fixed_operand (&ops[0], mem);
6535 create_input_operand (&ops[1], val, mode);
6536 create_integer_operand (&ops[2], model);
6537 if (maybe_expand_insn (icode, 3, ops))
6539 if (is_mm_seq_cst (model))
6540 expand_memory_blockage ();
6541 return const0_rtx;
6543 delete_insns_since (last);
6546 /* If using __sync_lock_release is a viable alternative, try it.
6547 Note that this will not be set to true if we are expanding a generic
6548 __atomic_store_n. */
6549 if (use_release)
6551 icode = direct_optab_handler (sync_lock_release_optab, mode);
6552 if (icode != CODE_FOR_nothing)
6554 create_fixed_operand (&ops[0], mem);
6555 create_input_operand (&ops[1], const0_rtx, mode);
6556 if (maybe_expand_insn (icode, 2, ops))
6558 /* lock_release is only a release barrier. */
6559 if (is_mm_seq_cst (model))
6560 expand_mem_thread_fence (model);
6561 return const0_rtx;
6566 /* If the size of the object is greater than word size on this target,
6567 a default store will not be atomic. */
6568 if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6570 /* If loads are atomic or we are called to provide a __sync builtin,
6571 	 we can try an atomic_exchange and throw away the result.  Otherwise,
6572 don't do anything so that we do not create an inconsistency between
6573 loads and stores. */
6574 if (can_atomic_load_p (mode) || is_mm_sync (model))
6576 rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6577 if (!target)
6578 target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6579 val);
6580 if (target)
6581 return const0_rtx;
6583 return NULL_RTX;
6586 /* Otherwise assume stores are atomic, and emit the proper barriers. */
6587 expand_mem_thread_fence (model);
6589 emit_move_insn (mem, val);
6591 /* For SEQ_CST, also emit a barrier after the store. */
6592 if (is_mm_seq_cst (model))
6593 expand_mem_thread_fence (model);
6595 return const0_rtx;
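/* Mirroring the load case, the final fallback above emits, in effect,

     fence; *mem = val; if-seq-cst-fence;

   i.e. a leading barrier for any non-relaxed model and a second trailing
   barrier only for MEMMODEL_SEQ_CST.  */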
6599 /* Structure containing the pointers and values required to process the
6600 various forms of the atomic_fetch_op and atomic_op_fetch builtins. */
6602 struct atomic_op_functions
6604 direct_optab mem_fetch_before;
6605 direct_optab mem_fetch_after;
6606 direct_optab mem_no_result;
6607 optab fetch_before;
6608 optab fetch_after;
6609 direct_optab no_result;
6610 enum rtx_code reverse_code;
6614 /* Fill in structure pointed to by OP with the various optab entries for an
6615 operation of type CODE. */
6617 static void
6618 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6620   gcc_assert (op != NULL);
6622 /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6623 in the source code during compilation, and the optab entries are not
6624 computable until runtime. Fill in the values at runtime. */
6625 switch (code)
6627 case PLUS:
6628 op->mem_fetch_before = atomic_fetch_add_optab;
6629 op->mem_fetch_after = atomic_add_fetch_optab;
6630 op->mem_no_result = atomic_add_optab;
6631 op->fetch_before = sync_old_add_optab;
6632 op->fetch_after = sync_new_add_optab;
6633 op->no_result = sync_add_optab;
6634 op->reverse_code = MINUS;
6635 break;
6636 case MINUS:
6637 op->mem_fetch_before = atomic_fetch_sub_optab;
6638 op->mem_fetch_after = atomic_sub_fetch_optab;
6639 op->mem_no_result = atomic_sub_optab;
6640 op->fetch_before = sync_old_sub_optab;
6641 op->fetch_after = sync_new_sub_optab;
6642 op->no_result = sync_sub_optab;
6643 op->reverse_code = PLUS;
6644 break;
6645 case XOR:
6646 op->mem_fetch_before = atomic_fetch_xor_optab;
6647 op->mem_fetch_after = atomic_xor_fetch_optab;
6648 op->mem_no_result = atomic_xor_optab;
6649 op->fetch_before = sync_old_xor_optab;
6650 op->fetch_after = sync_new_xor_optab;
6651 op->no_result = sync_xor_optab;
6652 op->reverse_code = XOR;
6653 break;
6654 case AND:
6655 op->mem_fetch_before = atomic_fetch_and_optab;
6656 op->mem_fetch_after = atomic_and_fetch_optab;
6657 op->mem_no_result = atomic_and_optab;
6658 op->fetch_before = sync_old_and_optab;
6659 op->fetch_after = sync_new_and_optab;
6660 op->no_result = sync_and_optab;
6661 op->reverse_code = UNKNOWN;
6662 break;
6663 case IOR:
6664 op->mem_fetch_before = atomic_fetch_or_optab;
6665 op->mem_fetch_after = atomic_or_fetch_optab;
6666 op->mem_no_result = atomic_or_optab;
6667 op->fetch_before = sync_old_ior_optab;
6668 op->fetch_after = sync_new_ior_optab;
6669 op->no_result = sync_ior_optab;
6670 op->reverse_code = UNKNOWN;
6671 break;
6672 case NOT:
6673 op->mem_fetch_before = atomic_fetch_nand_optab;
6674 op->mem_fetch_after = atomic_nand_fetch_optab;
6675 op->mem_no_result = atomic_nand_optab;
6676 op->fetch_before = sync_old_nand_optab;
6677 op->fetch_after = sync_new_nand_optab;
6678 op->no_result = sync_nand_optab;
6679 op->reverse_code = UNKNOWN;
6680 break;
6681 default:
6682 gcc_unreachable ();
6686 /* See if there is a better way to implement the operation "*MEM CODE VAL"
6687 using memory order MODEL. If AFTER is true the operation needs to return
6688 the value of *MEM after the operation, otherwise the previous value.
6689 TARGET is an optional place to place the result. The result is unused if
6690 it is const0_rtx.
6691 Return the result if there is a better sequence, otherwise NULL_RTX. */
6693 static rtx
6694 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6695 enum memmodel model, bool after)
6697 /* If the value is prefetched, or not used, it may be possible to replace
6698 the sequence with a native exchange operation. */
6699 if (!after || target == const0_rtx)
6701 /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m). */
6702 if (code == AND && val == const0_rtx)
6704 if (target == const0_rtx)
6705 target = gen_reg_rtx (GET_MODE (mem));
6706 return maybe_emit_atomic_exchange (target, mem, val, model);
6709 /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m). */
6710 if (code == IOR && val == constm1_rtx)
6712 if (target == const0_rtx)
6713 target = gen_reg_rtx (GET_MODE (mem));
6714 return maybe_emit_atomic_exchange (target, mem, val, model);
6718 return NULL_RTX;
6721 /* Try to emit an instruction for a specific operation variation.
6722 OPTAB contains the OP functions.
6723 TARGET is an optional place to return the result. const0_rtx means unused.
6724 MEM is the memory location to operate on.
6725 VAL is the value to use in the operation.
6726 USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6727 MODEL is the memory model, if used.
6728 AFTER is true if the returned result is the value after the operation. */
6730 static rtx
6731 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6732 rtx val, bool use_memmodel, enum memmodel model, bool after)
6734 machine_mode mode = GET_MODE (mem);
6735 struct expand_operand ops[4];
6736 enum insn_code icode;
6737 int op_counter = 0;
6738 int num_ops;
6740 /* Check to see if there is a result returned. */
6741 if (target == const0_rtx)
6743 if (use_memmodel)
6745 icode = direct_optab_handler (optab->mem_no_result, mode);
6746 create_integer_operand (&ops[2], model);
6747 num_ops = 3;
6749 else
6751 icode = direct_optab_handler (optab->no_result, mode);
6752 num_ops = 2;
6755 /* Otherwise, we need to generate a result. */
6756 else
6758 if (use_memmodel)
6760 icode = direct_optab_handler (after ? optab->mem_fetch_after
6761 : optab->mem_fetch_before, mode);
6762 create_integer_operand (&ops[3], model);
6763 num_ops = 4;
6765 else
6767 icode = optab_handler (after ? optab->fetch_after
6768 : optab->fetch_before, mode);
6769 num_ops = 3;
6771 create_output_operand (&ops[op_counter++], target, mode);
6773 if (icode == CODE_FOR_nothing)
6774 return NULL_RTX;
6776 create_fixed_operand (&ops[op_counter++], mem);
6777 /* VAL may have been promoted to a wider mode. Shrink it if so. */
6778 create_convert_operand_to (&ops[op_counter++], val, mode, true);
6780 if (maybe_expand_insn (icode, num_ops, ops))
6781 return (target == const0_rtx ? const0_rtx : ops[0].value);
6783 return NULL_RTX;
6787 /* This function expands an atomic fetch_OP or OP_fetch operation:
6788    TARGET is an optional place to stick the return value.  const0_rtx indicates
6789 the result is unused.
6790 atomically fetch MEM, perform the operation with VAL and return it to MEM.
6791 CODE is the operation being performed (OP)
6792 MEMMODEL is the memory model variant to use.
6793 AFTER is true to return the result of the operation (OP_fetch).
6794 AFTER is false to return the value before the operation (fetch_OP).
6796 This function will *only* generate instructions if there is a direct
6797 optab. No compare and swap loops or libcalls will be generated. */
6799 static rtx
6800 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6801 enum rtx_code code, enum memmodel model,
6802 bool after)
6804 machine_mode mode = GET_MODE (mem);
6805 struct atomic_op_functions optab;
6806 rtx result;
6807 bool unused_result = (target == const0_rtx);
6809 get_atomic_op_for_code (&optab, code);
6811 /* Check to see if there are any better instructions. */
6812 result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6813 if (result)
6814 return result;
6816 /* Check for the case where the result isn't used and try those patterns. */
6817 if (unused_result)
6819 /* Try the memory model variant first. */
6820 result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6821 if (result)
6822 return result;
6824       /* Next try the old style without a memory model.  */
6825 result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6826 if (result)
6827 return result;
6829 /* There is no no-result pattern, so try patterns with a result. */
6830 target = NULL_RTX;
6833 /* Try the __atomic version. */
6834 result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6835 if (result)
6836 return result;
6838 /* Try the older __sync version. */
6839 result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6840 if (result)
6841 return result;
6843 /* If the fetch value can be calculated from the other variation of fetch,
6844 try that operation. */
6845 if (after || unused_result || optab.reverse_code != UNKNOWN)
6847 /* Try the __atomic version, then the older __sync version. */
6848 result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6849 if (!result)
6850 result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6852 if (result)
6854 	  /* If the result isn't used, no compensation code is needed.  */
6855 if (unused_result)
6856 return result;
6858 /* Issue compensation code. Fetch_after == fetch_before OP val.
6859 Fetch_before == after REVERSE_OP val. */
6860 if (!after)
6861 code = optab.reverse_code;
6862 if (code == NOT)
6864 result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6865 true, OPTAB_LIB_WIDEN);
6866 result = expand_simple_unop (mode, NOT, result, target, true);
6868 else
6869 result = expand_simple_binop (mode, code, result, val, target,
6870 true, OPTAB_LIB_WIDEN);
6871 return result;
6875 /* No direct opcode can be generated. */
6876 return NULL_RTX;
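/* For illustration (hypothetical target): if only the fetch_OP form
   exists but the caller asked for OP_fetch, the compensation code above
   reconstructs the new value from the old one, e.g. for addition

     tmp = atomic_fetch_add (mem, val);   ... returns the old value
     result = tmp + val;                  ... the value after the op

   and in the opposite direction the old value is recovered from an
   OP_fetch result through REVERSE_CODE, e.g. RESULT - VAL for PLUS.  */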
6881 /* This function expands an atomic fetch_OP or OP_fetch operation:
6882    TARGET is an optional place to stick the return value.  const0_rtx indicates
6883 the result is unused.
6884 atomically fetch MEM, perform the operation with VAL and return it to MEM.
6885 CODE is the operation being performed (OP)
6886 MEMMODEL is the memory model variant to use.
6887 AFTER is true to return the result of the operation (OP_fetch).
6888 AFTER is false to return the value before the operation (fetch_OP). */
6890 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6891 enum memmodel model, bool after)
6893 machine_mode mode = GET_MODE (mem);
6894 rtx result;
6895 bool unused_result = (target == const0_rtx);
6897 /* If loads are not atomic for the required size and we are not called to
6898 provide a __sync builtin, do not do anything so that we stay consistent
6899 with atomic loads of the same size. */
6900 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6901 return NULL_RTX;
6903 result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6904 after);
6906 if (result)
6907 return result;
6909 /* Add/sub can be implemented by doing the reverse operation with -(val). */
6910 if (code == PLUS || code == MINUS)
6912 rtx tmp;
6913 enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6915 start_sequence ();
6916 tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6917 result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6918 model, after);
6919 if (result)
6921 	  /* The reverse operation worked, so emit the insns and return.  */
6922 tmp = get_insns ();
6923 end_sequence ();
6924 emit_insn (tmp);
6925 return result;
6928       /* The reverse operation did not work, so throw away the negation
6929 	 code and continue.  */
6929 end_sequence ();
6932 /* Try the __sync libcalls only if we can't do compare-and-swap inline. */
6933 if (!can_compare_and_swap_p (mode, false))
6935 rtx libfunc;
6936 bool fixup = false;
6937 enum rtx_code orig_code = code;
6938 struct atomic_op_functions optab;
6940 get_atomic_op_for_code (&optab, code);
6941 libfunc = optab_libfunc (after ? optab.fetch_after
6942 : optab.fetch_before, mode);
6943 if (libfunc == NULL
6944 && (after || unused_result || optab.reverse_code != UNKNOWN))
6946 fixup = true;
6947 if (!after)
6948 code = optab.reverse_code;
6949 libfunc = optab_libfunc (after ? optab.fetch_before
6950 : optab.fetch_after, mode);
6952 if (libfunc != NULL)
6954 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6955 result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6956 addr, ptr_mode, val, mode);
6958 if (!unused_result && fixup)
6959 result = expand_simple_binop (mode, code, result, val, target,
6960 true, OPTAB_LIB_WIDEN);
6961 return result;
6964 /* We need the original code for any further attempts. */
6965 code = orig_code;
6968 /* If nothing else has succeeded, default to a compare and swap loop. */
6969 if (can_compare_and_swap_p (mode, true))
6971 rtx_insn *insn;
6972 rtx t0 = gen_reg_rtx (mode), t1;
6974 start_sequence ();
6976 /* If the result is used, get a register for it. */
6977 if (!unused_result)
6979 if (!target || !register_operand (target, mode))
6980 target = gen_reg_rtx (mode);
6981 /* If fetch_before, copy the value now. */
6982 if (!after)
6983 emit_move_insn (target, t0);
6985 else
6986 target = const0_rtx;
6988 t1 = t0;
6989 if (code == NOT)
6991 t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
6992 true, OPTAB_LIB_WIDEN);
6993 t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
6995 else
6996 t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
6997 OPTAB_LIB_WIDEN);
6999 /* For after, copy the value now. */
7000 if (!unused_result && after)
7001 emit_move_insn (target, t1);
7002 insn = get_insns ();
7003 end_sequence ();
7005 if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
7006 return target;
7009 return NULL_RTX;
7012 /* Return true if OPERAND is suitable for operand number OPNO of
7013 instruction ICODE. */
7015 bool
7016 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
7018 return (!insn_data[(int) icode].operand[opno].predicate
7019 || (insn_data[(int) icode].operand[opno].predicate
7020 (operand, insn_data[(int) icode].operand[opno].mode)));
7023 /* TARGET is a target of a multiword operation that we are going to
7024 implement as a series of word-mode operations. Return true if
7025 TARGET is suitable for this purpose. */
7027 bool
7028 valid_multiword_target_p (rtx target)
7030 machine_mode mode;
7031 int i;
7033 mode = GET_MODE (target);
7034 for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
7035 if (!validate_subreg (word_mode, mode, target, i))
7036 return false;
7037 return true;
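/* For example, on a 32-bit target (UNITS_PER_WORD == 4) a DImode TARGET
   is processed as two word_mode pieces, so this checks that the SImode
   subregs of TARGET at byte offsets 0 and 4 are both representable.  */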
7040 /* Make OP describe an input operand that has value INTVAL and that has
7041 no inherent mode. This function should only be used for operands that
7042 are always expand-time constants. The backend may request that INTVAL
7043 be copied into a different kind of rtx, but it must specify the mode
7044 of that rtx if so. */
7046 void
7047 create_integer_operand (struct expand_operand *op, poly_int64 intval)
7049 create_expand_operand (op, EXPAND_INTEGER,
7050 gen_int_mode (intval, MAX_MODE_INT),
7051 VOIDmode, false, intval);
7054 /* Like maybe_legitimize_operand, but do not change the code of the
7055 current rtx value. */
7057 static bool
7058 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7059 struct expand_operand *op)
7061 /* See if the operand matches in its current form. */
7062 if (insn_operand_matches (icode, opno, op->value))
7063 return true;
7065 /* If the operand is a memory whose address has no side effects,
7066 try forcing the address into a non-virtual pseudo register.
7067 The check for side effects is important because copy_to_mode_reg
7068 cannot handle things like auto-modified addresses. */
7069 if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7071 rtx addr, mem;
7073 mem = op->value;
7074 addr = XEXP (mem, 0);
7075 if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7076 && !side_effects_p (addr))
7078 rtx_insn *last;
7079 machine_mode mode;
7081 last = get_last_insn ();
7082 mode = get_address_mode (mem);
7083 mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
7084 if (insn_operand_matches (icode, opno, mem))
7086 op->value = mem;
7087 return true;
7089 delete_insns_since (last);
7093 return false;
7096 /* Try to make OP match operand OPNO of instruction ICODE. Return true
7097 on success, storing the new operand value back in OP. */
7099 static bool
7100 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
7101 struct expand_operand *op)
7103 machine_mode mode, imode;
7104 bool old_volatile_ok, result;
7106 mode = op->mode;
7107 switch (op->type)
7109 case EXPAND_FIXED:
7110 old_volatile_ok = volatile_ok;
7111 volatile_ok = true;
7112 result = maybe_legitimize_operand_same_code (icode, opno, op);
7113 volatile_ok = old_volatile_ok;
7114 return result;
7116 case EXPAND_OUTPUT:
7117 gcc_assert (mode != VOIDmode);
7118 if (op->value
7119 && op->value != const0_rtx
7120 && GET_MODE (op->value) == mode
7121 && maybe_legitimize_operand_same_code (icode, opno, op))
7122 return true;
7124 op->value = gen_reg_rtx (mode);
7125 op->target = 0;
7126 break;
7128 case EXPAND_INPUT:
7129 input:
7130 gcc_assert (mode != VOIDmode);
7131 gcc_assert (GET_MODE (op->value) == VOIDmode
7132 || GET_MODE (op->value) == mode);
7133 if (maybe_legitimize_operand_same_code (icode, opno, op))
7134 return true;
7136 op->value = copy_to_mode_reg (mode, op->value);
7137 break;
7139 case EXPAND_CONVERT_TO:
7140 gcc_assert (mode != VOIDmode);
7141 op->value = convert_to_mode (mode, op->value, op->unsigned_p);
7142 goto input;
7144 case EXPAND_CONVERT_FROM:
7145 if (GET_MODE (op->value) != VOIDmode)
7146 mode = GET_MODE (op->value);
7147 else
7148 /* The caller must tell us what mode this value has. */
7149 gcc_assert (mode != VOIDmode);
7151 imode = insn_data[(int) icode].operand[opno].mode;
7152 if (imode != VOIDmode && imode != mode)
7154 op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
7155 mode = imode;
7157 goto input;
7159 case EXPAND_ADDRESS:
7160 op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
7161 op->value);
7162 goto input;
7164 case EXPAND_INTEGER:
7165 mode = insn_data[(int) icode].operand[opno].mode;
7166 if (mode != VOIDmode
7167 && known_eq (trunc_int_for_mode (op->int_value, mode),
7168 op->int_value))
7170 op->value = gen_int_mode (op->int_value, mode);
7171 goto input;
7173 break;
7175 return insn_operand_matches (icode, opno, op->value);
7178 /* Make OP describe an input operand that should have the same value
7179 as VALUE, after any mode conversion that the target might request.
7180 TYPE is the type of VALUE. */
7182 void
7183 create_convert_operand_from_type (struct expand_operand *op,
7184 rtx value, tree type)
7186 create_convert_operand_from (op, value, TYPE_MODE (type),
7187 TYPE_UNSIGNED (type));
7190 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
7191 of instruction ICODE. Return true on success, leaving the new operand
7192 values in the OPS themselves. Emit no code on failure. */
7194 bool
7195 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7196 unsigned int nops, struct expand_operand *ops)
7198 rtx_insn *last;
7199 unsigned int i;
7201 last = get_last_insn ();
7202 for (i = 0; i < nops; i++)
7203 if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
7205 delete_insns_since (last);
7206 return false;
7208 return true;
7211 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7212 as its operands. Return the instruction pattern on success,
7213 and emit any necessary set-up code. Return null and emit no
7214 code on failure. */
7216 rtx_insn *
7217 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7218 struct expand_operand *ops)
7220 gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7221 if (!maybe_legitimize_operands (icode, 0, nops, ops))
7222 return NULL;
7224 switch (nops)
7226 case 1:
7227 return GEN_FCN (icode) (ops[0].value);
7228 case 2:
7229 return GEN_FCN (icode) (ops[0].value, ops[1].value);
7230 case 3:
7231 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7232 case 4:
7233 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7234 ops[3].value);
7235 case 5:
7236 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7237 ops[3].value, ops[4].value);
7238 case 6:
7239 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7240 ops[3].value, ops[4].value, ops[5].value);
7241 case 7:
7242 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7243 ops[3].value, ops[4].value, ops[5].value,
7244 ops[6].value);
7245 case 8:
7246 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7247 ops[3].value, ops[4].value, ops[5].value,
7248 ops[6].value, ops[7].value);
7249 case 9:
7250 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7251 ops[3].value, ops[4].value, ops[5].value,
7252 ops[6].value, ops[7].value, ops[8].value);
7254 gcc_unreachable ();
7257 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7258 as its operands. Return true on success and emit no code on failure. */
7260 bool
7261 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7262 struct expand_operand *ops)
7264 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7265 if (pat)
7267 emit_insn (pat);
7268 return true;
7270 return false;
7273 /* Like maybe_expand_insn, but for jumps. */
7275 bool
7276 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7277 struct expand_operand *ops)
7279 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7280 if (pat)
7282 emit_jump_insn (pat);
7283 return true;
7285 return false;
7288 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7289 as its operands. */
7291 void
7292 expand_insn (enum insn_code icode, unsigned int nops,
7293 struct expand_operand *ops)
7295 if (!maybe_expand_insn (icode, nops, ops))
7296 gcc_unreachable ();
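/* A usage sketch, echoing the callers earlier in this file:

     struct expand_operand ops[3];
     create_output_operand (&ops[0], target, mode);
     create_fixed_operand (&ops[1], mem);
     create_integer_operand (&ops[2], model);
     if (maybe_expand_insn (icode, 3, ops))
       return ops[0].value;

   Operand legitimization may emit setup code, all of which is deleted
   again if any operand ultimately fails to match.  */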
7299 /* Like expand_insn, but for jumps. */
7301 void
7302 expand_jump_insn (enum insn_code icode, unsigned int nops,
7303 struct expand_operand *ops)
7305 if (!maybe_expand_jump_insn (icode, nops, ops))
7306 gcc_unreachable ();