/* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   Copyright (C) 1987-2017 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "target.h"
#include "rtl.h"
#include "tree.h"
#include "memmodel.h"
#include "predict.h"
#include "tm_p.h"
#include "expmed.h"
#include "optabs.h"
#include "emit-rtl.h"
#include "recog.h"
#include "diagnostic-core.h"

/* Include insn-config.h before expr.h so that HAVE_conditional_move
   is properly defined.  */
#include "stor-layout.h"
#include "except.h"
#include "dojump.h"
#include "explow.h"
#include "expr.h"
#include "optabs-tree.h"
#include "libfuncs.h"
static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
                                   machine_mode *);
static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);

/* Debug facility for use in GDB.  */
void debug_optab_libfuncs (void);
/* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
   the result of operation CODE applied to OP0 (and OP1 if it is a binary
   operation).

   If the last insn does not set TARGET, don't do anything, but return 1.

   If the last insn or a previous insn sets TARGET and TARGET is one of OP0
   or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
   try again, ensuring that TARGET is not one of the operands.  */

static int
add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0,
                rtx op1)
{
  rtx_insn *last_insn;
  rtx set;
  rtx note;

  gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));

  if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
      && GET_RTX_CLASS (code) != RTX_BIN_ARITH
      && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
      && GET_RTX_CLASS (code) != RTX_COMPARE
      && GET_RTX_CLASS (code) != RTX_UNARY)
    return 1;

  if (GET_CODE (target) == ZERO_EXTRACT)
    return 1;

  for (last_insn = insns;
       NEXT_INSN (last_insn) != NULL_RTX;
       last_insn = NEXT_INSN (last_insn))
    ;

  /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
     a value changing in the insn, so the note would be invalid for CSE.  */
  if (reg_overlap_mentioned_p (target, op0)
      || (op1 && reg_overlap_mentioned_p (target, op1)))
    {
      if (MEM_P (target)
          && (rtx_equal_p (target, op0)
              || (op1 && rtx_equal_p (target, op1))))
        {
          /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
             over expanding it as temp = MEM op X, MEM = temp.  If the target
             supports MEM = MEM op X instructions, it is sometimes too hard
             to reconstruct that form later, especially if X is also a memory,
             and due to multiple occurrences of addresses the address might
             be forced into register unnecessarily.
             Note that not emitting the REG_EQUIV note might inhibit
             CSE in some cases.  */
          set = single_set (last_insn);
          if (set
              && GET_CODE (SET_SRC (set)) == code
              && MEM_P (SET_DEST (set))
              && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
                  || (op1 && rtx_equal_p (SET_DEST (set),
                                          XEXP (SET_SRC (set), 1)))))
            return 1;
        }
      return 0;
    }

  set = set_for_reg_notes (last_insn);
  if (set == NULL_RTX)
    return 1;

  if (! rtx_equal_p (SET_DEST (set), target)
      /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
      && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
          || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
    return 1;

  if (GET_RTX_CLASS (code) == RTX_UNARY)
    switch (code)
      {
      case FFS:
      case CLZ:
      case CTZ:
      case CLRSB:
      case POPCOUNT:
      case PARITY:
      case BSWAP:
        if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
          {
            note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
            if (GET_MODE_UNIT_SIZE (GET_MODE (op0))
                > GET_MODE_UNIT_SIZE (GET_MODE (target)))
              note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
                                         note, GET_MODE (op0));
            else
              note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
                                         note, GET_MODE (op0));
            break;
          }
        /* FALLTHRU */
      default:
        note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
        break;
      }
  else
    note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0),
                           copy_rtx (op1));

  set_unique_reg_note (last_insn, REG_EQUAL, note);

  return 1;
}
/* Given two input operands, OP0 and OP1, determine what the correct
   from_mode for a widening operation would be.  In most cases this would
   be OP0, but if that's a constant it'll be VOIDmode, which isn't useful.  */

static machine_mode
widened_mode (machine_mode to_mode, rtx op0, rtx op1)
{
  machine_mode m0 = GET_MODE (op0);
  machine_mode m1 = GET_MODE (op1);
  machine_mode result;

  if (m0 == VOIDmode && m1 == VOIDmode)
    return to_mode;
  else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
    result = m1;
  else
    result = m0;

  if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
    return to_mode;

  return result;
}
/* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
   says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
   not actually do a sign-extend or zero-extend, but can leave the
   higher-order bits of the result rtx undefined, for example, in the case
   of logical operations, but not right shifts.  */

static rtx
widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
               int unsignedp, int no_extend)
{
  rtx result;
  scalar_int_mode int_mode;

  /* If we don't have to extend and this is a constant, return it.  */
  if (no_extend && GET_MODE (op) == VOIDmode)
    return op;

  /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
     extend since it will be more efficient to do so unless the signedness of
     a promoted object differs from our extension.  */
  if (! no_extend
      || !is_a <scalar_int_mode> (mode, &int_mode)
      || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
          && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
    return convert_modes (mode, oldmode, op, unsignedp);

  /* If MODE is no wider than a single word, we return a lowpart or
     paradoxical SUBREG.  */
  if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
    return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));

  /* Otherwise, get an object of MODE, clobber it, and set the low-order
     part to OP.  */

  result = gen_reg_rtx (int_mode);
  emit_clobber (result);
  emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
  return result;
}
/* Expand vector widening operations.

   There are two different classes of operations handled here:
   1) Operations whose result is wider than all the arguments to the
      operation.
      Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
      In this case OP0 and optionally OP1 would be initialized,
      but WIDE_OP wouldn't (not relevant for this case).
   2) Operations whose result is of the same size as the last argument to the
      operation, but wider than all the other arguments to the operation.
      Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
      In this case WIDE_OP, OP0 and optionally OP1 would be initialized.

   E.g., when called to expand the following operations, this is how
   the arguments will be initialized:
                                nops    OP0     OP1     WIDE_OP
   widening-sum                 2       oprnd0  -       oprnd1
   widening-dot-product         3       oprnd0  oprnd1  oprnd2
   widening-mult                2       oprnd0  oprnd1  -
   type-promotion (vec-unpack)  1       oprnd0  -       -  */

rtx
expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
                           rtx target, int unsignedp)
{
  struct expand_operand eops[4];
  tree oprnd0, oprnd1, oprnd2;
  machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
  optab widen_pattern_optab;
  enum insn_code icode;
  int nops = TREE_CODE_LENGTH (ops->code);
  int op;

  oprnd0 = ops->op0;
  tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
  widen_pattern_optab
    = optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
  if (ops->code == WIDEN_MULT_PLUS_EXPR
      || ops->code == WIDEN_MULT_MINUS_EXPR)
    icode = find_widening_optab_handler (widen_pattern_optab,
                                         TYPE_MODE (TREE_TYPE (ops->op2)),
                                         tmode0);
  else
    icode = optab_handler (widen_pattern_optab, tmode0);
  gcc_assert (icode != CODE_FOR_nothing);

  if (nops >= 2)
    {
      oprnd1 = ops->op1;
      tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
    }

  /* The last operand is of a wider mode than the rest of the operands.  */
  if (nops == 2)
    wmode = tmode1;
  else if (nops == 3)
    {
      gcc_assert (tmode1 == tmode0);
      gcc_assert (op1);
      oprnd2 = ops->op2;
      wmode = TYPE_MODE (TREE_TYPE (oprnd2));
    }

  op = 0;
  create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
  create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
  if (op1)
    create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
  if (wide_op)
    create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
  expand_insn (icode, op, eops);
  return eops[0].value;
}
/* Generate code to perform an operation specified by TERNARY_OPTAB
   on operands OP0, OP1 and OP2, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
                   rtx op1, rtx op2, rtx target, int unsignedp)
{
  struct expand_operand ops[4];
  enum insn_code icode = optab_handler (ternary_optab, mode);

  gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);

  create_output_operand (&ops[0], target, mode);
  create_convert_operand_from (&ops[1], op0, mode, unsignedp);
  create_convert_operand_from (&ops[2], op1, mode, unsignedp);
  create_convert_operand_from (&ops[3], op2, mode, unsignedp);
  expand_insn (icode, 4, ops);
  return ops[0].value;
}
/* Like expand_binop, but return a constant rtx if the result can be
   calculated at compile time.  The arguments and return value are
   otherwise the same as for expand_binop.  */

rtx
simplify_expand_binop (machine_mode mode, optab binoptab,
                       rtx op0, rtx op1, rtx target, int unsignedp,
                       enum optab_methods methods)
{
  if (CONSTANT_P (op0) && CONSTANT_P (op1))
    {
      rtx x = simplify_binary_operation (optab_to_code (binoptab),
                                         mode, op0, op1);
      if (x)
        return x;
    }

  return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
}
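
/* For example, expanding an addition of (const_int 2) and (const_int 3)
   through simplify_expand_binop folds at compile time to (const_int 5);
   no insn is emitted and TARGET is not used.  */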
/* Like simplify_expand_binop, but always put the result in TARGET.
   Return true if the expansion succeeded.  */

bool
force_expand_binop (machine_mode mode, optab binoptab,
                    rtx op0, rtx op1, rtx target, int unsignedp,
                    enum optab_methods methods)
{
  rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
                                 target, unsignedp, methods);
  if (x == 0)
    return false;
  if (x != target)
    emit_move_insn (target, x);
  return true;
}
/* Create a new vector value in VMODE with all elements set to OP.  The
   mode of OP must be the element mode of VMODE.  If OP is a constant,
   then the return value will be a constant.  */

rtx
expand_vector_broadcast (machine_mode vmode, rtx op)
{
  enum insn_code icode;
  rtvec vec;
  rtx ret;
  int i, n;

  gcc_checking_assert (VECTOR_MODE_P (vmode));

  if (valid_for_const_vector_p (vmode, op))
    return gen_const_vec_duplicate (vmode, op);

  icode = optab_handler (vec_duplicate_optab, vmode);
  if (icode != CODE_FOR_nothing)
    {
      struct expand_operand ops[2];
      create_output_operand (&ops[0], NULL_RTX, vmode);
      create_input_operand (&ops[1], op, GET_MODE (op));
      expand_insn (icode, 2, ops);
      return ops[0].value;
    }

  /* ??? If the target doesn't have a vec_init, then we have no easy way
     of performing this operation.  Most of this sort of generic support
     is hidden away in the vector lowering support in gimple.  */
  icode = convert_optab_handler (vec_init_optab, vmode,
                                 GET_MODE_INNER (vmode));
  if (icode == CODE_FOR_nothing)
    return NULL;

  n = GET_MODE_NUNITS (vmode);
  vec = rtvec_alloc (n);
  for (i = 0; i < n; ++i)
    RTVEC_ELT (vec, i) = op;
  ret = gen_reg_rtx (vmode);
  emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));

  return ret;
}
/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is >= BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine, except that SUPERWORD_OP1
   is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
   INTO_TARGET may be null if the caller has decided to calculate it.  */

static bool
expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
                        rtx outof_target, rtx into_target,
                        int unsignedp, enum optab_methods methods)
{
  if (into_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
                             into_target, unsignedp, methods))
      return false;

  if (outof_target != 0)
    {
      /* For a signed right shift, we must fill OUTOF_TARGET with copies
         of the sign bit, otherwise we must fill it with zeros.  */
      if (binoptab != ashr_optab)
        emit_move_insn (outof_target, CONST0_RTX (word_mode));
      else
        if (!force_expand_binop (word_mode, binoptab, outof_input,
                                 gen_int_shift_amount (word_mode,
                                                       BITS_PER_WORD - 1),
                                 outof_target, unsignedp, methods))
          return false;
    }

  return true;
}
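
/* For example, with 32-bit words, a 64-bit logical right shift by a
   count N known to be >= 32 degenerates into a single word shift:

       into_target  = outof_input >> (N - 32);
       outof_target = 0;   (sign-filled instead for an arithmetic shift)

   SUPERWORD_OP1 is the already-biased count N - BITS_PER_WORD.  */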
/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is < BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine.  */

static bool
expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
                      rtx outof_input, rtx into_input, rtx op1,
                      rtx outof_target, rtx into_target,
                      int unsignedp, enum optab_methods methods,
                      unsigned HOST_WIDE_INT shift_mask)
{
  optab reverse_unsigned_shift, unsigned_shift;
  rtx tmp, carries;

  reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
  unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);

  /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
     We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
     the opposite direction to BINOPTAB.  */
  if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
    {
      carries = outof_input;
      tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
                                            op1_mode), op1_mode);
      tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                   0, true, methods);
    }
  else
    {
      /* We must avoid shifting by BITS_PER_WORD bits since that is either
         the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
         has unknown behavior.  Do a single shift first, then shift by the
         remainder.  It's OK to use ~OP1 as the remainder if shift counts
         are truncated to the mode size.  */
      carries = expand_binop (word_mode, reverse_unsigned_shift,
                              outof_input, const1_rtx, 0, unsignedp, methods);
      if (shift_mask == BITS_PER_WORD - 1)
        {
          tmp = immed_wide_int_const
            (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
          tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
                                       0, true, methods);
        }
      else
        {
          tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
                                                op1_mode), op1_mode);
          tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                       0, true, methods);
        }
    }
  if (tmp == 0 || carries == 0)
    return false;
  carries = expand_binop (word_mode, reverse_unsigned_shift,
                          carries, tmp, 0, unsignedp, methods);
  if (carries == 0)
    return false;

  /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
     so the result can go directly into INTO_TARGET if convenient.  */
  tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
                      into_target, unsignedp, methods);
  if (tmp == 0)
    return false;

  /* Now OR in the bits carried over from OUTOF_INPUT.  */
  if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
                           into_target, unsignedp, methods))
    return false;

  /* Use a standard word_mode shift for the out-of half.  */
  if (outof_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                             outof_target, unsignedp, methods))
      return false;

  return true;
}
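
/* For example, a 64-bit logical right shift by a count N in (0, 32),
   with 32-bit words, is assembled from three word shifts and an IOR:

       carries      = outof_input << (32 - N);
       into_target  = (into_input >> N) | carries;
       outof_target = outof_input >> N;

   The 32 - N count is what the code above computes, either directly by
   subtraction for constant or fully-masked counts, or as a shift by 1
   followed by a shift by ~N (== 31 - N modulo 32) when word shift
   counts are known to be truncated to five bits.  */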
/* Try implementing expand_doubleword_shift using conditional moves.
   The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
   otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
   are the shift counts to use in the former and latter case.  All other
   arguments are the same as the parent routine.  */

static bool
expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
                                  enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
                                  rtx outof_input, rtx into_input,
                                  rtx subword_op1, rtx superword_op1,
                                  rtx outof_target, rtx into_target,
                                  int unsignedp, enum optab_methods methods,
                                  unsigned HOST_WIDE_INT shift_mask)
{
  rtx outof_superword, into_superword;

  /* Put the superword version of the output into OUTOF_SUPERWORD and
     INTO_SUPERWORD.  */
  outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
  if (outof_target != 0 && subword_op1 == superword_op1)
    {
      /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
         OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
      into_superword = outof_target;
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, 0, unsignedp, methods))
        return false;
    }
  else
    {
      into_superword = gen_reg_rtx (word_mode);
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, into_superword,
                                   unsignedp, methods))
        return false;
    }

  /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, subword_op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  /* Select between them.  Do the INTO half first because INTO_SUPERWORD
     might be the current value of OUTOF_TARGET.  */
  if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
                              into_target, into_superword, word_mode, false))
    return false;

  if (outof_target != 0)
    if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
                                outof_target, outof_superword,
                                word_mode, false))
      return false;

  return true;
}
/* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
   OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
   input operand; the shift moves bits in the direction OUTOF_INPUT->
   INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
   of the target.  OP1 is the shift count and OP1_MODE is its mode.
   If OP1 is constant, it will have been truncated as appropriate
   and is known to be nonzero.

   If SHIFT_MASK is zero, the result of word shifts is undefined when the
   shift count is outside the range [0, BITS_PER_WORD).  This routine must
   avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).

   If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
   masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
   fill with zeros or sign bits as appropriate.

   If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
   a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
   Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
   In all other cases, shifts by values outside [0, BITS_PER_WORD * 2)
   are undefined.

   BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
   may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
   OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
   function wants to calculate it itself.

   Return true if the shift could be successfully synthesized.  */

static bool
expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
                         rtx outof_input, rtx into_input, rtx op1,
                         rtx outof_target, rtx into_target,
                         int unsignedp, enum optab_methods methods,
                         unsigned HOST_WIDE_INT shift_mask)
{
  rtx superword_op1, tmp, cmp1, cmp2;
  enum rtx_code cmp_code;

  /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
     fill the result with sign or zero bits as appropriate.  If so, the value
     of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).  Recursively call
     this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
     and INTO_INPUT), then emit code to set up OUTOF_TARGET.

     This isn't worthwhile for constant shifts since the optimizers will
     cope better with in-range shift counts.  */
  if (shift_mask >= BITS_PER_WORD
      && outof_target != 0
      && !CONSTANT_P (op1))
    {
      if (!expand_doubleword_shift (op1_mode, binoptab,
                                    outof_input, into_input, op1,
                                    0, into_target,
                                    unsignedp, methods, shift_mask))
        return false;
      if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                               outof_target, unsignedp, methods))
        return false;
      return true;
    }

  /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
     is true when the effective shift value is less than BITS_PER_WORD.
     Set SUPERWORD_OP1 to the shift count that should be used to shift
     OUTOF_INPUT into INTO_TARGET when the condition is false.  */
  tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
  if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
    {
      /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
         is a subword shift count.  */
      cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = EQ;
      superword_op1 = op1;
    }
  else
    {
      /* Set CMP1 to OP1 - BITS_PER_WORD.  */
      cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = LT;
      superword_op1 = cmp1;
    }
  if (cmp1 == 0)
    return false;

  /* If we can compute the condition at compile time, pick the
     appropriate subroutine.  */
  tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
  if (tmp != 0 && CONST_INT_P (tmp))
    {
      if (tmp == const0_rtx)
        return expand_superword_shift (binoptab, outof_input, superword_op1,
                                       outof_target, into_target,
                                       unsignedp, methods);
      else
        return expand_subword_shift (op1_mode, binoptab,
                                     outof_input, into_input, op1,
                                     outof_target, into_target,
                                     unsignedp, methods, shift_mask);
    }

  /* Try using conditional moves to generate straight-line code.  */
  if (HAVE_conditional_move)
    {
      rtx_insn *start = get_last_insn ();
      if (expand_doubleword_shift_condmove (op1_mode, binoptab,
                                            cmp_code, cmp1, cmp2,
                                            outof_input, into_input,
                                            op1, superword_op1,
                                            outof_target, into_target,
                                            unsignedp, methods, shift_mask))
        return true;
      delete_insns_since (start);
    }

  /* As a last resort, use branches to select the correct alternative.  */
  rtx_code_label *subword_label = gen_label_rtx ();
  rtx_code_label *done_label = gen_label_rtx ();

  NO_DEFER_POP;
  do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
                           0, 0, subword_label,
                           profile_probability::uninitialized ());
  OK_DEFER_POP;

  if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                               outof_target, into_target,
                               unsignedp, methods))
    return false;

  emit_jump_insn (targetm.gen_jump (done_label));
  emit_barrier ();
  emit_label (subword_label);

  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  emit_label (done_label);
  return true;
}
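
/* For example, with BITS_PER_WORD == 32 and SHIFT_MASK == 31, a variable
   doubleword shift count OP1 == 40 takes the AND path above: 40 & 32 is
   nonzero, so the comparison selects the superword case with
   SUPERWORD_OP1 == OP1 == 40, and the word shift instruction itself
   truncates that to 40 & 31 == 8, exactly the count needed to move
   OUTOF_INPUT into INTO_TARGET.  */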
/* Subroutine of expand_binop.  Perform a double word multiplication of
   operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
   as the target's word_mode.  This function returns NULL_RTX if anything
   goes wrong, in which case it may have already emitted instructions
   which need to be deleted.

   If we want to multiply two two-word values and have normal and widening
   multiplies of single-word values, we can do this with three smaller
   multiplications.

   The multiplication proceeds as follows:
                                     _______________________
                                    [__op0_high_|__op0_low__]
                                     _______________________
         *                          [__op1_high_|__op1_low__]
         ____________________________________________________
                                     _______________________
     (1)                            [__op0_low__*__op1_low__]
                       _______________________
     (2a)             [__op0_low__*__op1_high_]
                       _______________________
     (2b)             [__op0_high_*__op1_low__]
          _______________________
     (3) [__op0_high_*__op1_high_]

   This gives a 4-word result.  Since we are only interested in the
   lower 2 words, partial result (3) and the upper words of (2a) and
   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
   calculated using non-widening multiplication.

   (1), however, needs to be calculated with an unsigned widening
   multiplication.  If this operation is not directly supported we
   try using a signed widening multiplication and adjust the result.
   This adjustment works as follows:

   If both operands are positive then no adjustment is needed.

   If the operands have different signs, for example op0_low < 0 and
   op1_low >= 0, the instruction treats the most significant bit of
   op0_low as a sign bit instead of a bit with significance
   2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
   with 2**BITS_PER_WORD - op0_low, and two's complements the
   result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
   the result.

   Similarly, if both operands are negative, we need to add
   (op0_low + op1_low) * 2**BITS_PER_WORD.

   We use a trick to adjust quickly.  We logically shift op0_low right
   (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
   op0_high (op1_high) before it is used to calculate 2b (2a).  If no
   logical shift exists, we do an arithmetic right shift and subtract
   the 0 or -1.  */

static rtx
expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
                        bool umulp, enum optab_methods methods)
{
  int low = (WORDS_BIG_ENDIAN ? 1 : 0);
  int high = (WORDS_BIG_ENDIAN ? 0 : 1);
  rtx wordm1 = (umulp ? NULL_RTX
                : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
  rtx product, adjust, product_high, temp;

  rtx op0_high = operand_subword_force (op0, high, mode);
  rtx op0_low = operand_subword_force (op0, low, mode);
  rtx op1_high = operand_subword_force (op1, high, mode);
  rtx op1_low = operand_subword_force (op1, low, mode);

  /* If we're using an unsigned multiply to directly compute the product
     of the low-order words of the operands and perform any required
     adjustments of the operands, we begin by trying two more multiplications
     and then computing the appropriate sum.

     We have checked above that the required addition is provided.
     Full-word addition will normally always succeed, especially if
     it is provided at all, so we don't worry about its failure.  The
     multiplication may well fail, however, so we do handle that.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op0_high)
        return NULL_RTX;
    }

  adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
                         NULL_RTX, 0, OPTAB_DIRECT);
  if (!adjust)
    return NULL_RTX;

  /* OP0_HIGH should now be dead.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op1_high)
        return NULL_RTX;
    }

  temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
                       NULL_RTX, 0, OPTAB_DIRECT);
  if (!temp)
    return NULL_RTX;

  /* OP1_HIGH should now be dead.  */

  adjust = expand_binop (word_mode, add_optab, adjust, temp,
                         NULL_RTX, 0, OPTAB_DIRECT);

  if (target && !REG_P (target))
    target = NULL_RTX;

  /* *_widen_optab needs to determine operand mode, make sure at least
     one operand has non-VOID mode.  */
  if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
    op0_low = force_reg (word_mode, op0_low);

  if (umulp)
    product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);
  else
    product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);

  if (!product)
    return NULL_RTX;

  product_high = operand_subword (product, high, 1, mode);
  adjust = expand_binop (word_mode, add_optab, product_high, adjust,
                         NULL_RTX, 0, OPTAB_DIRECT);
  emit_move_insn (product_high, adjust);
  return product;
}
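
/* A worked instance of the sign adjustment described above, using 8-bit
   "words" for brevity: let op0_low = 0x80 and op1_low = 0x03.  The
   desired unsigned partial product (1) is 0x80 * 3 = 0x0180, but a
   signed widening multiply computes (-128) * 3 = -384 = 0xfe80, which
   is short by exactly op1_low << 8 = 0x0300.  Adding op0_low >> 7
   (here 1) to op0_high before forming the (2b) partial product
   op0_high * op1_low feeds the missing op1_low back in at bit 8.  */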
/* Wrapper around expand_binop which takes an rtx code to specify
   the operation to perform, not an optab pointer.  All other
   arguments are the same.  */
rtx
expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
                     rtx op1, rtx target, int unsignedp,
                     enum optab_methods methods)
{
  optab binop = code_to_optab (code);
  gcc_assert (binop);

  return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
}
/* Return whether OP0 and OP1 should be swapped when expanding a commutative
   binop.  Order them according to commutative_operand_precedence and, if
   possible, try to put TARGET or a pseudo first.  */
static bool
swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
{
  int op0_prec = commutative_operand_precedence (op0);
  int op1_prec = commutative_operand_precedence (op1);

  if (op0_prec < op1_prec)
    return true;

  if (op0_prec > op1_prec)
    return false;

  /* With equal precedence, both orders are ok, but it is better if the
     first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
  if (target == 0 || REG_P (target))
    return (REG_P (op1) && !REG_P (op0)) || target == op1;
  else
    return rtx_equal_p (op1, target);
}
/* Return true if BINOPTAB implements a shift operation.  */

static bool
shift_optab_p (optab binoptab)
{
  switch (optab_to_code (binoptab))
    {
    case ASHIFT:
    case SS_ASHIFT:
    case US_ASHIFT:
    case ASHIFTRT:
    case LSHIFTRT:
    case ROTATE:
    case ROTATERT:
      return true;

    default:
      return false;
    }
}

/* Return true if BINOPTAB implements a commutative binary operation.  */

static bool
commutative_optab_p (optab binoptab)
{
  return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
          || binoptab == smul_widen_optab
          || binoptab == umul_widen_optab
          || binoptab == smul_highpart_optab
          || binoptab == umul_highpart_optab);
}
/* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
   optimizing, and if the operand is a constant that costs more than
   1 instruction, force the constant into a register and return that
   register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */

static rtx
avoid_expensive_constant (machine_mode mode, optab binoptab,
                          int opn, rtx x, bool unsignedp)
{
  bool speed = optimize_insn_for_speed_p ();

  if (mode != VOIDmode
      && optimize
      && CONSTANT_P (x)
      && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
          > set_src_cost (x, mode, speed)))
    {
      if (CONST_INT_P (x))
        {
          HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
          if (intval != INTVAL (x))
            x = GEN_INT (intval);
        }
      else
        x = convert_modes (mode, VOIDmode, x, unsignedp);
      x = force_reg (mode, x);
    }
  return x;
}
/* Helper function for expand_binop: handle the case where there
   is an insn ICODE that directly implements the indicated operation.
   Returns null if this is not possible.  */
static rtx
expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
                       rtx op0, rtx op1,
                       rtx target, int unsignedp, enum optab_methods methods,
                       rtx_insn *last)
{
  machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
  machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
  machine_mode mode0, mode1, tmp_mode;
  struct expand_operand ops[3];
  bool commutative_p;
  rtx_insn *pat;
  rtx xop0 = op0, xop1 = op1;
  bool canonicalize_op1 = false;

  /* If it is a commutative operator and the modes would match
     if we would swap the operands, we can save the conversions.  */
  commutative_p = commutative_optab_p (binoptab);
  if (commutative_p
      && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
      && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
    std::swap (xop0, xop1);

  /* If we are optimizing, force expensive constants into a register.  */
  xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
  if (!shift_optab_p (binoptab))
    xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
  else
    /* Shifts and rotates often use a different mode for op1 from op0;
       for VOIDmode constants we don't know the mode, so force it
       to be canonicalized using convert_modes.  */
    canonicalize_op1 = true;

  /* In case the insn wants input operands in modes different from
     those of the actual operands, convert the operands.  It would
     seem that we don't need to convert CONST_INTs, but we do, so
     that they're properly zero-extended, sign-extended or truncated
     for their mode.  */

  mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
  if (xmode0 != VOIDmode && xmode0 != mode0)
    {
      xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
      mode0 = xmode0;
    }

  mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
           ? GET_MODE (xop1) : mode);
  if (xmode1 != VOIDmode && xmode1 != mode1)
    {
      xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
      mode1 = xmode1;
    }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_p
      && swap_commutative_operands_with_target (target, xop0, xop1))
    std::swap (xop0, xop1);

  /* Now, if insn's predicates don't allow our operands, put them into
     pseudo regs.  */

  if (binoptab == vec_pack_trunc_optab
      || binoptab == vec_pack_usat_optab
      || binoptab == vec_pack_ssat_optab
      || binoptab == vec_pack_ufix_trunc_optab
      || binoptab == vec_pack_sfix_trunc_optab)
    {
      /* The mode of the result is different than the mode of the
         arguments.  */
      tmp_mode = insn_data[(int) icode].operand[0].mode;
      if (VECTOR_MODE_P (mode)
          && GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
        {
          delete_insns_since (last);
          return NULL_RTX;
        }
    }
  else
    tmp_mode = mode;

  create_output_operand (&ops[0], target, tmp_mode);
  create_input_operand (&ops[1], xop0, mode0);
  create_input_operand (&ops[2], xop1, mode1);
  pat = maybe_gen_insn (icode, 3, ops);
  if (pat)
    {
      /* If PAT is composed of more than one insn, try to add an appropriate
         REG_EQUAL note to it.  If we can't because TEMP conflicts with an
         operand, call expand_binop again, this time without a target.  */
      if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
          && ! add_equal_note (pat, ops[0].value,
                               optab_to_code (binoptab),
                               ops[1].value, ops[2].value))
        {
          delete_insns_since (last);
          return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
                               unsignedp, methods);
        }

      emit_insn (pat);
      return ops[0].value;
    }
  delete_insns_since (last);
  return NULL_RTX;
}
/* Generate code to perform an operation specified by BINOPTAB
   on operands OP0 and OP1, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
              rtx target, int unsignedp, enum optab_methods methods)
{
  enum optab_methods next_methods
    = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
       ? OPTAB_WIDEN : methods);
  enum mode_class mclass;
  enum insn_code icode;
  machine_mode wider_mode;
  scalar_int_mode int_mode;
  rtx libfunc;
  rtx temp;
  rtx_insn *entry_last = get_last_insn ();
  rtx_insn *last;

  mclass = GET_MODE_CLASS (mode);

  /* If subtracting an integer constant, convert this into an addition of
     the negated constant.  */

  if (binoptab == sub_optab && CONST_INT_P (op1))
    {
      op1 = negate_rtx (mode, op1);
      binoptab = add_optab;
    }
  /* For shifts, constant invalid op1 might be expanded from different
     mode than MODE.  As those are invalid, force them to a register
     to avoid further problems during expansion.  */
  else if (CONST_INT_P (op1)
           && shift_optab_p (binoptab)
           && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
    {
      op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
      op1 = force_reg (GET_MODE_INNER (mode), op1);
    }

  /* Record where to delete back to if we backtrack.  */
  last = get_last_insn ();

  /* If we can do it with a three-operand insn, do so.  */

  if (methods != OPTAB_MUST_WIDEN)
    {
      if (convert_optab_p (binoptab))
        {
          machine_mode from_mode = widened_mode (mode, op0, op1);
          icode = find_widening_optab_handler (binoptab, mode, from_mode);
        }
      else
        icode = optab_handler (binoptab, mode);
      if (icode != CODE_FOR_nothing)
        {
          temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
                                        target, unsignedp, methods, last);
          if (temp)
            return temp;
        }
    }

  /* If we were trying to rotate, and that didn't work, try rotating
     the other direction before falling back to shifts and bitwise-or.  */
  if (((binoptab == rotl_optab
        && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
       || (binoptab == rotr_optab
           && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
      && is_int_mode (mode, &int_mode))
    {
      optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
      rtx newop1;
      unsigned int bits = GET_MODE_PRECISION (int_mode);

      if (CONST_INT_P (op1))
        newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
      else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
        newop1 = negate_rtx (GET_MODE (op1), op1);
      else
        newop1 = expand_binop (GET_MODE (op1), sub_optab,
                               gen_int_mode (bits, GET_MODE (op1)), op1,
                               NULL_RTX, unsignedp, OPTAB_DIRECT);

      temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
                                    target, unsignedp, methods, last);
      if (temp)
        return temp;
    }

  /* If this is a multiply, see if we can do a widening operation that
     takes operands of this mode and makes a wider mode.  */

  if (binoptab == smul_optab
      && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
      && (convert_optab_handler ((unsignedp
                                  ? umul_widen_optab
                                  : smul_widen_optab),
                                 wider_mode, mode) != CODE_FOR_nothing))
    {
      /* *_widen_optab needs to determine operand mode, make sure at least
         one operand has non-VOID mode.  */
      if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
        op0 = force_reg (mode, op0);
      temp = expand_binop (wider_mode,
                           unsignedp ? umul_widen_optab : smul_widen_optab,
                           op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);

      if (temp != 0)
        {
          if (GET_MODE_CLASS (mode) == MODE_INT
              && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
            return gen_lowpart (mode, temp);
          else
            return convert_to_mode (mode, temp, unsignedp);
        }
    }

  /* If this is a vector shift by a scalar, see if we can do a vector
     shift by a vector.  If so, broadcast the scalar into a vector.  */
  if (mclass == MODE_VECTOR_INT)
    {
      optab otheroptab = unknown_optab;

      if (binoptab == ashl_optab)
        otheroptab = vashl_optab;
      else if (binoptab == ashr_optab)
        otheroptab = vashr_optab;
      else if (binoptab == lshr_optab)
        otheroptab = vlshr_optab;
      else if (binoptab == rotl_optab)
        otheroptab = vrotl_optab;
      else if (binoptab == rotr_optab)
        otheroptab = vrotr_optab;

      if (otheroptab
          && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
        {
          /* The scalar may have been extended to be too wide.  Truncate
             it back to the proper size to fit in the broadcast vector.  */
          scalar_mode inner_mode = GET_MODE_INNER (mode);
          if (!CONST_INT_P (op1)
              && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
                  > GET_MODE_BITSIZE (inner_mode)))
            op1 = force_reg (inner_mode,
                             simplify_gen_unary (TRUNCATE, inner_mode, op1,
                                                 GET_MODE (op1)));
          rtx vop1 = expand_vector_broadcast (mode, op1);
          if (vop1)
            {
              temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
                                            target, unsignedp, methods, last);
              if (temp)
                return temp;
            }
        }
    }

  /* Look for a wider mode of the same class for which we think we
     can open-code the operation.  Check for a widening multiply at the
     wider mode as well.  */

  if (CLASS_HAS_WIDER_MODES_P (mclass)
      && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
    FOR_EACH_WIDER_MODE (wider_mode, mode)
      {
        machine_mode next_mode;
        if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
            || (binoptab == smul_optab
                && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
                && (find_widening_optab_handler ((unsignedp
                                                  ? umul_widen_optab
                                                  : smul_widen_optab),
                                                 next_mode, mode)
                    != CODE_FOR_nothing)))
          {
            rtx xop0 = op0, xop1 = op1;
            int no_extend = 0;

            /* For certain integer operations, we need not actually extend
               the narrow operands, as long as we will truncate
               the results to the same narrowness.  */

            if ((binoptab == ior_optab || binoptab == and_optab
                 || binoptab == xor_optab
                 || binoptab == add_optab || binoptab == sub_optab
                 || binoptab == smul_optab || binoptab == ashl_optab)
                && mclass == MODE_INT)
              {
                no_extend = 1;
                xop0 = avoid_expensive_constant (mode, binoptab, 0,
                                                 xop0, unsignedp);
                if (binoptab != ashl_optab)
                  xop1 = avoid_expensive_constant (mode, binoptab, 1,
                                                   xop1, unsignedp);
              }

            xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
                                  no_extend);

            /* The second operand of a shift must always be extended.  */
            xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
                                  no_extend && binoptab != ashl_optab);

            temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
                                 unsignedp, OPTAB_DIRECT);
            if (temp)
              {
                if (mclass != MODE_INT
                    || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
                  {
                    if (target == 0)
                      target = gen_reg_rtx (mode);
                    convert_move (target, temp, 0);
                    return target;
                  }
                else
                  return gen_lowpart (mode, temp);
              }
            else
              delete_insns_since (last);
          }
      }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_optab_p (binoptab)
      && swap_commutative_operands_with_target (target, op0, op1))
    std::swap (op0, op1);
  /* These can be done a word at a time.  */
  if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
      && is_int_mode (mode, &int_mode)
      && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
    {
      int i;
      rtx_insn *insns;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  */
      if (target == 0
          || target == op0
          || target == op1
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      /* Do the actual arithmetic.  */
      for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
        {
          rtx target_piece = operand_subword (target, i, 1, int_mode);
          rtx x = expand_binop (word_mode, binoptab,
                                operand_subword_force (op0, i, int_mode),
                                operand_subword_force (op1, i, int_mode),
                                target_piece, unsignedp, next_methods);

          if (x == 0)
            break;

          if (target_piece != x)
            emit_move_insn (target_piece, x);
        }

      insns = get_insns ();
      end_sequence ();

      if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
        {
          emit_insn (insns);
          return target;
        }
    }
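
  /* For example, a DImode AND, IOR or XOR on a 32-bit target becomes two
     independent SImode operations, one per word:

         target[0] = op0[0] op op1[0];
         target[1] = op0[1] op op1[1];

     No carries connect the words, which is why only these bitwise
     operations can be split this simply.  */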
  /* Synthesize double word shifts from single word shifts.  */
  if ((binoptab == lshr_optab || binoptab == ashl_optab
       || binoptab == ashr_optab)
      && is_int_mode (mode, &int_mode)
      && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
      && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
      && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
      scalar_int_mode op1_mode;

      double_shift_mask = targetm.shift_truncation_mask (int_mode);
      shift_mask = targetm.shift_truncation_mask (word_mode);
      op1_mode = (GET_MODE (op1) != VOIDmode
                  ? as_a <scalar_int_mode> (GET_MODE (op1))
                  : word_mode);

      /* Apply the truncation to constant shifts.  */
      if (double_shift_mask > 0 && CONST_INT_P (op1))
        op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);

      if (op1 == CONST0_RTX (op1_mode))
        return op0;

      /* Make sure that this is a combination that expand_doubleword_shift
         can handle.  See the comments there for details.  */
      if (double_shift_mask == 0
          || (shift_mask == BITS_PER_WORD - 1
              && double_shift_mask == BITS_PER_WORD * 2 - 1))
        {
          rtx_insn *insns;
          rtx into_target, outof_target;
          rtx into_input, outof_input;
          int left_shift, outof_word;

          /* If TARGET is the same as one of the operands, the REG_EQUAL note
             won't be accurate, so use a new target.  */
          if (target == 0
              || target == op0
              || target == op1
              || !valid_multiword_target_p (target))
            target = gen_reg_rtx (int_mode);

          start_sequence ();

          /* OUTOF_* is the word we are shifting bits away from, and
             INTO_* is the word that we are shifting bits towards, thus
             they differ depending on the direction of the shift and
             WORDS_BIG_ENDIAN.  */

          left_shift = binoptab == ashl_optab;
          outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

          outof_target = operand_subword (target, outof_word, 1, int_mode);
          into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

          outof_input = operand_subword_force (op0, outof_word, int_mode);
          into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

          if (expand_doubleword_shift (op1_mode, binoptab,
                                       outof_input, into_input, op1,
                                       outof_target, into_target,
                                       unsignedp, next_methods, shift_mask))
            {
              insns = get_insns ();
              end_sequence ();

              emit_insn (insns);
              return target;
            }
          end_sequence ();
        }
    }
  /* Synthesize double word rotates from single word shifts.  */
  if ((binoptab == rotl_optab || binoptab == rotr_optab)
      && is_int_mode (mode, &int_mode)
      && CONST_INT_P (op1)
      && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      rtx_insn *insns;
      rtx into_target, outof_target;
      rtx into_input, outof_input;
      rtx inter;
      int shift_count, left_shift, outof_word;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  Do this also if target is
         not a REG, first because having a register instead may open
         optimization opportunities, and second because if target and op0
         happen to be MEMs designating the same location, we would risk
         clobbering it too early in the code sequence we generate below.  */
      if (target == 0
          || target == op0
          || target == op1
          || !REG_P (target)
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      shift_count = INTVAL (op1);

      /* OUTOF_* is the word we are shifting bits away from, and
         INTO_* is the word that we are shifting bits towards, thus
         they differ depending on the direction of the shift and
         WORDS_BIG_ENDIAN.  */

      left_shift = (binoptab == rotl_optab);
      outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

      outof_target = operand_subword (target, outof_word, 1, int_mode);
      into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

      outof_input = operand_subword_force (op0, outof_word, int_mode);
      into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

      if (shift_count == BITS_PER_WORD)
        {
          /* This is just a word swap.  */
          emit_move_insn (outof_target, into_input);
          emit_move_insn (into_target, outof_input);
          inter = const0_rtx;
        }
      else
        {
          rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
          HOST_WIDE_INT first_shift_count, second_shift_count;
          optab reverse_unsigned_shift, unsigned_shift;

          reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                                    ? lshr_optab : ashl_optab);

          unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                            ? ashl_optab : lshr_optab);

          if (shift_count > BITS_PER_WORD)
            {
              first_shift_count = shift_count - BITS_PER_WORD;
              second_shift_count = 2 * BITS_PER_WORD - shift_count;
            }
          else
            {
              first_shift_count = BITS_PER_WORD - shift_count;
              second_shift_count = shift_count;
            }
          rtx first_shift_count_rtx
            = gen_int_shift_amount (word_mode, first_shift_count);
          rtx second_shift_count_rtx
            = gen_int_shift_amount (word_mode, second_shift_count);

          into_temp1 = expand_binop (word_mode, unsigned_shift,
                                     outof_input, first_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);
          into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                     into_input, second_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);

          if (into_temp1 != 0 && into_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab, into_temp1,
                                  into_temp2, into_target,
                                  unsignedp, next_methods);
          else
            inter = 0;

          if (inter != 0 && inter != into_target)
            emit_move_insn (into_target, inter);

          outof_temp1 = expand_binop (word_mode, unsigned_shift,
                                      into_input, first_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);
          outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                      outof_input, second_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);

          if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab,
                                  outof_temp1, outof_temp2,
                                  outof_target, unsignedp, next_methods);

          if (inter != 0 && inter != outof_target)
            emit_move_insn (outof_target, inter);
        }

      insns = get_insns ();
      end_sequence ();

      if (inter != 0)
        {
          emit_insn (insns);
          return target;
        }
    }
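
  /* For example, a DImode rotate left by 10 on a 32-bit little-endian
     target is assembled, word by word, as

         into_target  = (into_input << 10) | (outof_input >> 22);
         outof_target = (outof_input << 10) | (into_input >> 22);

     while a rotate by exactly BITS_PER_WORD reduces to the word swap
     handled above.  */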
  /* These can be done a word at a time by propagating carries.  */
  if ((binoptab == add_optab || binoptab == sub_optab)
      && is_int_mode (mode, &int_mode)
      && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
    {
      unsigned int i;
      optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
      const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
      rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
      rtx xop0, xop1, xtarget;

      /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
         value is one of those, use it.  Otherwise, use 1 since it is the
         one easiest to get.  */
#if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
      int normalizep = STORE_FLAG_VALUE;
#else
      int normalizep = 1;
#endif

      /* Prepare the operands.  */
      xop0 = force_reg (int_mode, op0);
      xop1 = force_reg (int_mode, op1);

      xtarget = gen_reg_rtx (int_mode);

      if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
        target = xtarget;

      /* Indicate for flow that the entire target reg is being set.  */
      if (REG_P (target))
        emit_clobber (xtarget);

      /* Do the actual arithmetic.  */
      for (i = 0; i < nwords; i++)
        {
          int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
          rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
          rtx op0_piece = operand_subword_force (xop0, index, int_mode);
          rtx op1_piece = operand_subword_force (xop1, index, int_mode);
          rtx x;

          /* Main add/subtract of the input operands.  */
          x = expand_binop (word_mode, binoptab,
                            op0_piece, op1_piece,
                            target_piece, unsignedp, next_methods);
          if (x == 0)
            break;

          if (i + 1 < nwords)
            {
              /* Store carry from main add/subtract.  */
              carry_out = gen_reg_rtx (word_mode);
              carry_out = emit_store_flag_force (carry_out,
                                                 (binoptab == add_optab
                                                  ? LT : GT),
                                                 x, op0_piece,
                                                 word_mode, 1, normalizep);
            }

          if (i > 0)
            {
              rtx newx;

              /* Add/subtract previous carry to main result.  */
              newx = expand_binop (word_mode,
                                   normalizep == 1 ? binoptab : otheroptab,
                                   x, carry_in,
                                   NULL_RTX, 1, next_methods);

              if (i + 1 < nwords)
                {
                  /* Get out carry from adding/subtracting carry in.  */
                  rtx carry_tmp = gen_reg_rtx (word_mode);
                  carry_tmp = emit_store_flag_force (carry_tmp,
                                                     (binoptab == add_optab
                                                      ? LT : GT),
                                                     newx, x,
                                                     word_mode, 1, normalizep);

                  /* Logical-ior the two poss. carry together.  */
                  carry_out = expand_binop (word_mode, ior_optab,
                                            carry_out, carry_tmp,
                                            carry_out, 0, next_methods);
                  if (carry_out == 0)
                    break;
                }
              emit_move_insn (target_piece, newx);
            }
          else
            {
              if (x != target_piece)
                emit_move_insn (target_piece, x);
            }

          carry_in = carry_out;
        }

      if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
        {
          if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
              || ! rtx_equal_p (target, xtarget))
            {
              rtx_insn *temp = emit_move_insn (target, xtarget);

              set_dst_reg_note (temp, REG_EQUAL,
                                gen_rtx_fmt_ee (optab_to_code (binoptab),
                                                int_mode, copy_rtx (xop0),
                                                copy_rtx (xop1)),
                                target);
            }
          else
            target = xtarget;

          return target;
        }

      else
        delete_insns_since (last);
    }
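
  /* For example, assuming STORE_FLAG_VALUE == 1, a DImode addition on a
     32-bit target expands along the lines of

         target[0] = op0[0] + op1[0];
         carry     = (unsigned) target[0] < (unsigned) op0[0];
         target[1] = op0[1] + op1[1] + carry;

     with emit_store_flag_force computing the carry and a second
     store-flag catching any carry out of the carry addition itself on
     wider multiword modes.  */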
1715 /* Attempt to synthesize double word multiplies using a sequence of word
1716 mode multiplications. We first attempt to generate a sequence using a
1717 more efficient unsigned widening multiply, and if that fails we then
1718 try using a signed widening multiply. */
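/* The identity behind the synthesis, sketched with W = BITS_PER_WORD
   and all arithmetic taken modulo 2**(2*W):

       (hi0*2**W + lo0) * (hi1*2**W + lo1)
         == widening_mult (lo0, lo1) + ((lo0*hi1 + hi0*lo1) << W)

   The hi0*hi1 term is shifted out entirely, so one widening word
   multiply plus two ordinary word multiplies and adds suffice.  */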
1720 if (binoptab == smul_optab
1721 && is_int_mode (mode, &int_mode)
1722 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1723 && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1724 && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1726 rtx product = NULL_RTX;
1727 if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
1728 != CODE_FOR_nothing)
1730 product = expand_doubleword_mult (int_mode, op0, op1, target,
1731 true, methods);
1732 if (!product)
1733 delete_insns_since (last);
1736 if (product == NULL_RTX
1737 && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
1738 != CODE_FOR_nothing))
1740 product = expand_doubleword_mult (int_mode, op0, op1, target,
1741 false, methods);
1742 if (!product)
1743 delete_insns_since (last);
1746 if (product != NULL_RTX)
1748 if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1750 rtx_insn *move = emit_move_insn (target ? target : product,
1751 product);
1752 set_dst_reg_note (move,
1753 REG_EQUAL,
1754 gen_rtx_fmt_ee (MULT, int_mode,
1755 copy_rtx (op0),
1756 copy_rtx (op1)),
1757 target ? target : product);
1759 return product;
1763 /* It can't be open-coded in this mode.
1764 Use a library call if one is available and caller says that's ok. */
1766 libfunc = optab_libfunc (binoptab, mode);
1767 if (libfunc
1768 && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1770 rtx_insn *insns;
1771 rtx op1x = op1;
1772 machine_mode op1_mode = mode;
1773 rtx value;
1775 start_sequence ();
1777 if (shift_optab_p (binoptab))
1779 op1_mode = targetm.libgcc_shift_count_mode ();
1780 /* Specify unsigned here,
1781 since negative shift counts are meaningless. */
1782 op1x = convert_to_mode (op1_mode, op1, 1);
1785 if (GET_MODE (op0) != VOIDmode
1786 && GET_MODE (op0) != mode)
1787 op0 = convert_to_mode (mode, op0, unsignedp);
1789 /* Pass 1 for NO_QUEUE so we don't lose any increments
1790 if the libcall is cse'd or moved. */
1791 value = emit_library_call_value (libfunc,
1792 NULL_RTX, LCT_CONST, mode,
1793 op0, mode, op1x, op1_mode);
1795 insns = get_insns ();
1796 end_sequence ();
1798 bool trapv = trapv_binoptab_p (binoptab);
1799 target = gen_reg_rtx (mode);
1800 emit_libcall_block_1 (insns, target, value,
1801 trapv ? NULL_RTX
1802 : gen_rtx_fmt_ee (optab_to_code (binoptab),
1803 mode, op0, op1), trapv);
1805 return target;
1808 delete_insns_since (last);
1810 /* It can't be done in this mode. Can we do it in a wider mode? */
1812 if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1813 || methods == OPTAB_MUST_WIDEN))
1815 /* Caller says don't even try. */
1816 delete_insns_since (entry_last);
1817 return 0;
1820 /* Compute the value of METHODS to pass to recursive calls.
1821 Don't allow widening to be tried recursively. */
1823 methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1825 /* Look for a wider mode of the same class for which it appears we can do
1826 the operation. */
1828 if (CLASS_HAS_WIDER_MODES_P (mclass))
1830 /* This code doesn't make sense for conversion optabs, since we
1831 wouldn't then want to extend the operands to be the same size
1832 as the result. */
1833 gcc_assert (!convert_optab_p (binoptab));
1834 FOR_EACH_WIDER_MODE (wider_mode, mode)
1836 if (optab_handler (binoptab, wider_mode)
1837 || (methods == OPTAB_LIB
1838 && optab_libfunc (binoptab, wider_mode)))
1840 rtx xop0 = op0, xop1 = op1;
1841 int no_extend = 0;
1843 /* For certain integer operations, we need not actually extend
1844 the narrow operands, as long as we will truncate
1845 the results to the same narrowness. */
1847 if ((binoptab == ior_optab || binoptab == and_optab
1848 || binoptab == xor_optab
1849 || binoptab == add_optab || binoptab == sub_optab
1850 || binoptab == smul_optab || binoptab == ashl_optab)
1851 && mclass == MODE_INT)
1852 no_extend = 1;
1854 xop0 = widen_operand (xop0, wider_mode, mode,
1855 unsignedp, no_extend);
1857 /* The second operand of a shift must always be extended. */
1858 xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1859 no_extend && binoptab != ashl_optab);
1861 temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1862 unsignedp, methods);
1863 if (temp)
1865 if (mclass != MODE_INT
1866 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1868 if (target == 0)
1869 target = gen_reg_rtx (mode);
1870 convert_move (target, temp, 0);
1871 return target;
1873 else
1874 return gen_lowpart (mode, temp);
1876 else
1877 delete_insns_since (last);
1882 delete_insns_since (entry_last);
1883 return 0;
1886 /* Expand a binary operator which has both signed and unsigned forms.
1887 UOPTAB is the optab for unsigned operations, and SOPTAB is for
1888 signed operations.
1890 If we widen unsigned operands, we may use a signed wider operation instead
1891 of an unsigned wider operation, since the result would be the same. */
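/* Illustration of why the widened operation's signedness does not
   matter (hypothetical 8-bit operands widened to 16 bits): the low
   8 bits of

       (int16_t) a + (int16_t) b    and    (uint16_t) a + (uint16_t) b

   are identical, so a signed wider add and an unsigned wider add
   agree after truncation back to the narrow mode.  */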
1894 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1895 rtx op0, rtx op1, rtx target, int unsignedp,
1896 enum optab_methods methods)
1898 rtx temp;
1899 optab direct_optab = unsignedp ? uoptab : soptab;
1900 bool save_enable;
1902 /* Do it without widening, if possible. */
1903 temp = expand_binop (mode, direct_optab, op0, op1, target,
1904 unsignedp, OPTAB_DIRECT);
1905 if (temp || methods == OPTAB_DIRECT)
1906 return temp;
1908 /* Try widening to a signed int. Disable any direct use of any
1909 signed insn in the current mode. */
1910 save_enable = swap_optab_enable (soptab, mode, false);
1912 temp = expand_binop (mode, soptab, op0, op1, target,
1913 unsignedp, OPTAB_WIDEN);
1915 /* For unsigned operands, try widening to an unsigned int. */
1916 if (!temp && unsignedp)
1917 temp = expand_binop (mode, uoptab, op0, op1, target,
1918 unsignedp, OPTAB_WIDEN);
1919 if (temp || methods == OPTAB_WIDEN)
1920 goto egress;
1922 /* Use a libcall of the right width if one exists. */
1923 temp = expand_binop (mode, direct_optab, op0, op1, target,
1924 unsignedp, OPTAB_LIB);
1925 if (temp || methods == OPTAB_LIB)
1926 goto egress;
1928 /* Must widen and use a libcall; use either signed or unsigned. */
1929 temp = expand_binop (mode, soptab, op0, op1, target,
1930 unsignedp, methods);
1931 if (!temp && unsignedp)
1932 temp = expand_binop (mode, uoptab, op0, op1, target,
1933 unsignedp, methods);
1935 egress:
1936 /* Undo the fiddling above. */
1937 if (save_enable)
1938 swap_optab_enable (soptab, mode, true);
1939 return temp;
1942 /* Generate code to perform an operation specified by UNOPPTAB
1943 on operand OP0, with two results to TARG0 and TARG1.
1944 We assume that the order of the operands for the instruction
1945 is TARG0, TARG1, OP0.
1947 Either TARG0 or TARG1 may be zero, but what that means is that
1948 the result is not actually wanted. We will generate it into
1949 a dummy pseudo-reg and discard it. They may not both be zero.
1951 Returns 1 if this operation can be performed; 0 if not. */
1954 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1955 int unsignedp)
1957 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1958 enum mode_class mclass;
1959 machine_mode wider_mode;
1960 rtx_insn *entry_last = get_last_insn ();
1961 rtx_insn *last;
1963 mclass = GET_MODE_CLASS (mode);
1965 if (!targ0)
1966 targ0 = gen_reg_rtx (mode);
1967 if (!targ1)
1968 targ1 = gen_reg_rtx (mode);
1970 /* Record where to go back to if we fail. */
1971 last = get_last_insn ();
1973 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1975 struct expand_operand ops[3];
1976 enum insn_code icode = optab_handler (unoptab, mode);
1978 create_fixed_operand (&ops[0], targ0);
1979 create_fixed_operand (&ops[1], targ1);
1980 create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1981 if (maybe_expand_insn (icode, 3, ops))
1982 return 1;
1985 /* It can't be done in this mode. Can we do it in a wider mode? */
1987 if (CLASS_HAS_WIDER_MODES_P (mclass))
1989 FOR_EACH_WIDER_MODE (wider_mode, mode)
1991 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
1993 rtx t0 = gen_reg_rtx (wider_mode);
1994 rtx t1 = gen_reg_rtx (wider_mode);
1995 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
1997 if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
1999 convert_move (targ0, t0, unsignedp);
2000 convert_move (targ1, t1, unsignedp);
2001 return 1;
2003 else
2004 delete_insns_since (last);
2009 delete_insns_since (entry_last);
2010 return 0;
2013 /* Generate code to perform an operation specified by BINOPTAB
2014 on operands OP0 and OP1, with two results to TARG0 and TARG1.
2015 We assume that the order of the operands for the instruction
2016 is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2017 [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2019 Either TARG0 or TARG1 may be zero, but what that means is that
2020 the result is not actually wanted. We will generate it into
2021 a dummy pseudo-reg and discard it. They may not both be zero.
2023 Returns 1 if this operation can be performed; 0 if not. */
2026 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2027 int unsignedp)
2029 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2030 enum mode_class mclass;
2031 machine_mode wider_mode;
2032 rtx_insn *entry_last = get_last_insn ();
2033 rtx_insn *last;
2035 mclass = GET_MODE_CLASS (mode);
2037 if (!targ0)
2038 targ0 = gen_reg_rtx (mode);
2039 if (!targ1)
2040 targ1 = gen_reg_rtx (mode);
2042 /* Record where to go back to if we fail. */
2043 last = get_last_insn ();
2045 if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2047 struct expand_operand ops[4];
2048 enum insn_code icode = optab_handler (binoptab, mode);
2049 machine_mode mode0 = insn_data[icode].operand[1].mode;
2050 machine_mode mode1 = insn_data[icode].operand[2].mode;
2051 rtx xop0 = op0, xop1 = op1;
2053 /* If we are optimizing, force expensive constants into a register. */
2054 xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2055 xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2057 create_fixed_operand (&ops[0], targ0);
2058 create_convert_operand_from (&ops[1], xop0, mode, unsignedp);
2059 create_convert_operand_from (&ops[2], xop1, mode, unsignedp);
2060 create_fixed_operand (&ops[3], targ1);
2061 if (maybe_expand_insn (icode, 4, ops))
2062 return 1;
2063 delete_insns_since (last);
2066 /* It can't be done in this mode. Can we do it in a wider mode? */
2068 if (CLASS_HAS_WIDER_MODES_P (mclass))
2070 FOR_EACH_WIDER_MODE (wider_mode, mode)
2072 if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2074 rtx t0 = gen_reg_rtx (wider_mode);
2075 rtx t1 = gen_reg_rtx (wider_mode);
2076 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2077 rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2079 if (expand_twoval_binop (binoptab, cop0, cop1,
2080 t0, t1, unsignedp))
2082 convert_move (targ0, t0, unsignedp);
2083 convert_move (targ1, t1, unsignedp);
2084 return 1;
2086 else
2087 delete_insns_since (last);
2092 delete_insns_since (entry_last);
2093 return 0;
2096 /* Expand the two-valued library call indicated by BINOPTAB, but
2097 preserve only one of the values. If TARG0 is non-NULL, the first
2098 value is placed into TARG0; otherwise the second value is placed
2099 into TARG1. Exactly one of TARG0 and TARG1 must be non-NULL. The
2100 value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2101 This routine assumes that the value returned by the library call is
2102 as if the return value were of an integral mode twice as wide as the
2103 mode of OP0. Returns 1 if the call was successful. */
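/* For a hypothetical SImode divmod-style libcall returning a DImode
   value, one half would be extracted as the subword at byte offset 0
   and the other as the subword at offset GET_MODE_SIZE (SImode); the
   simplify_gen_subreg call below chooses between exactly those two
   offsets depending on which of TARG0/TARG1 is wanted.  */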
2105 bool
2106 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2107 rtx targ0, rtx targ1, enum rtx_code code)
2109 machine_mode mode;
2110 machine_mode libval_mode;
2111 rtx libval;
2112 rtx_insn *insns;
2113 rtx libfunc;
2115 /* Exactly one of TARG0 or TARG1 should be non-NULL. */
2116 gcc_assert (!targ0 != !targ1);
2118 mode = GET_MODE (op0);
2119 libfunc = optab_libfunc (binoptab, mode);
2120 if (!libfunc)
2121 return false;
2123 /* The value returned by the library function will have twice as
2124 many bits as the nominal MODE. */
2125 libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2126 start_sequence ();
2127 libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2128 libval_mode,
2129 op0, mode,
2130 op1, mode);
2131 /* Get the part of LIBVAL containing the value that we want. */
2132 libval = simplify_gen_subreg (mode, libval, libval_mode,
2133 targ0 ? 0 : GET_MODE_SIZE (mode));
2134 insns = get_insns ();
2135 end_sequence ();
2136 /* Move the result into the desired location. */
2137 emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2138 gen_rtx_fmt_ee (code, mode, op0, op1));
2140 return true;
2144 /* Wrapper around expand_unop which takes an rtx code to specify
2145 the operation to perform, not an optab pointer. All other
2146 arguments are the same. */
2148 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2149 rtx target, int unsignedp)
2151 optab unop = code_to_optab (code);
2152 gcc_assert (unop);
2154 return expand_unop (mode, unop, op0, target, unsignedp);
2157 /* Try calculating
2158 (clz:narrow x)
2160 (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2162 A similar operation can be used for clrsb. UNOPTAB says which operation
2163 we are trying to expand. */
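/* A concrete instance (assuming only a 32-bit clz is available): an
   8-bit clz can be computed as

       clz8 (x) == clz32 ((uint32_t) x) - (32 - 8)

   since zero-extension contributes exactly 24 extra leading zeros.  */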
2164 static rtx
2165 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2167 opt_scalar_int_mode wider_mode_iter;
2168 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2170 scalar_int_mode wider_mode = wider_mode_iter.require ();
2171 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2173 rtx xop0, temp;
2174 rtx_insn *last;
2176 last = get_last_insn ();
2178 if (target == 0)
2179 target = gen_reg_rtx (mode);
2180 xop0 = widen_operand (op0, wider_mode, mode,
2181 unoptab != clrsb_optab, false);
2182 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2183 unoptab != clrsb_optab);
2184 if (temp != 0)
2185 temp = expand_binop
2186 (wider_mode, sub_optab, temp,
2187 gen_int_mode (GET_MODE_PRECISION (wider_mode)
2188 - GET_MODE_PRECISION (mode),
2189 wider_mode),
2190 target, true, OPTAB_DIRECT);
2191 if (temp == 0)
2192 delete_insns_since (last);
2194 return temp;
2197 return 0;
2200 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2201 quantities, choosing which based on whether the high word is nonzero. */
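/* Sketch of the selection, for a hypothetical 64-bit value split into
   two 32-bit words hi and lo:

       clz64 (x) == (hi != 0 ? clz32 (hi) : 32 + clz32 (lo))  */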
2202 static rtx
2203 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2205 rtx xop0 = force_reg (mode, op0);
2206 rtx subhi = gen_highpart (word_mode, xop0);
2207 rtx sublo = gen_lowpart (word_mode, xop0);
2208 rtx_code_label *hi0_label = gen_label_rtx ();
2209 rtx_code_label *after_label = gen_label_rtx ();
2210 rtx_insn *seq;
2211 rtx temp, result;
2213 /* If we were not given a target, use a word_mode register, not a
2214 'mode' register. The result will fit, and nobody is expecting
2215 anything bigger (the return type of __builtin_clz* is int). */
2216 if (!target)
2217 target = gen_reg_rtx (word_mode);
2219 /* In any case, write to a word_mode scratch in both branches of the
2220 conditional, so we can ensure there is a single move insn setting
2221 'target' on which to tag a REG_EQUAL note. */
2222 result = gen_reg_rtx (word_mode);
2224 start_sequence ();
2226 /* If the high word is not equal to zero,
2227 then clz of the full value is clz of the high word. */
2228 emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2229 word_mode, true, hi0_label);
2231 temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2232 if (!temp)
2233 goto fail;
2235 if (temp != result)
2236 convert_move (result, temp, true);
2238 emit_jump_insn (targetm.gen_jump (after_label));
2239 emit_barrier ();
2241 /* Else clz of the full value is clz of the low word plus the number
2242 of bits in the high word. */
2243 emit_label (hi0_label);
2245 temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2246 if (!temp)
2247 goto fail;
2248 temp = expand_binop (word_mode, add_optab, temp,
2249 gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2250 result, true, OPTAB_DIRECT);
2251 if (!temp)
2252 goto fail;
2253 if (temp != result)
2254 convert_move (result, temp, true);
2256 emit_label (after_label);
2257 convert_move (target, result, true);
2259 seq = get_insns ();
2260 end_sequence ();
2262 add_equal_note (seq, target, CLZ, xop0, 0);
2263 emit_insn (seq);
2264 return target;
2266 fail:
2267 end_sequence ();
2268 return 0;
2271 /* Try calculating popcount of a double-word quantity as two popcount's of
2272 word-sized quantities and summing up the results. */
2273 static rtx
2274 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2276 rtx t0, t1, t;
2277 rtx_insn *seq;
2279 start_sequence ();
2281 t0 = expand_unop_direct (word_mode, popcount_optab,
2282 operand_subword_force (op0, 0, mode), NULL_RTX,
2283 true);
2284 t1 = expand_unop_direct (word_mode, popcount_optab,
2285 operand_subword_force (op0, 1, mode), NULL_RTX,
2286 true);
2287 if (!t0 || !t1)
2289 end_sequence ();
2290 return NULL_RTX;
2293 /* If we were not given a target, use a word_mode register, not a
2294 'mode' register. The result will fit, and nobody is expecting
2295 anything bigger (the return type of __builtin_popcount* is int). */
2296 if (!target)
2297 target = gen_reg_rtx (word_mode);
2299 t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2301 seq = get_insns ();
2302 end_sequence ();
2304 add_equal_note (seq, t, POPCOUNT, op0, 0);
2305 emit_insn (seq);
2306 return t;
2309 /* Try calculating
2310 (parity:wide x)
2312 (parity:narrow (low (x) ^ high (x))) */
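/* This is valid because XOR cancels bits in pairs without changing
   the overall parity; e.g. for hypothetical 32-bit halves,

       parity64 (x) == parity32 (lo ^ hi)

   since popcount (lo ^ hi) and popcount (lo) + popcount (hi) differ
   only by twice the number of positions set in both halves.  */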
2313 static rtx
2314 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2316 rtx t = expand_binop (word_mode, xor_optab,
2317 operand_subword_force (op0, 0, mode),
2318 operand_subword_force (op0, 1, mode),
2319 NULL_RTX, 0, OPTAB_DIRECT);
2320 return expand_unop (word_mode, parity_optab, t, target, true);
2323 /* Try calculating
2324 (bswap:narrow x)
2326 (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))). */
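/* For example (assuming only a 32-bit bswap is available):

       bswap16 (x) == bswap32 ((uint32_t) x) >> 16

   The two significant bytes land in the top half of the wide result
   and the logical shift brings them back down.  */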
2327 static rtx
2328 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2330 rtx x;
2331 rtx_insn *last;
2332 opt_scalar_int_mode wider_mode_iter;
2334 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2335 if (optab_handler (bswap_optab, wider_mode_iter.require ())
2336 != CODE_FOR_nothing)
2337 break;
2339 if (!wider_mode_iter.exists ())
2340 return NULL_RTX;
2342 scalar_int_mode wider_mode = wider_mode_iter.require ();
2343 last = get_last_insn ();
2345 x = widen_operand (op0, wider_mode, mode, true, true);
2346 x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2348 gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2349 && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2350 if (x != 0)
2351 x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2352 GET_MODE_BITSIZE (wider_mode)
2353 - GET_MODE_BITSIZE (mode),
2354 NULL_RTX, true);
2356 if (x != 0)
2358 if (target == 0)
2359 target = gen_reg_rtx (mode);
2360 emit_move_insn (target, gen_lowpart (mode, x));
2362 else
2363 delete_insns_since (last);
2365 return target;
2368 /* Try calculating bswap as two bswaps of two word-sized operands. */
2370 static rtx
2371 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2373 rtx t0, t1;
2375 t1 = expand_unop (word_mode, bswap_optab,
2376 operand_subword_force (op, 0, mode), NULL_RTX, true);
2377 t0 = expand_unop (word_mode, bswap_optab,
2378 operand_subword_force (op, 1, mode), NULL_RTX, true);
2380 if (target == 0 || !valid_multiword_target_p (target))
2381 target = gen_reg_rtx (mode);
2382 if (REG_P (target))
2383 emit_clobber (target);
2384 emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2385 emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2387 return target;
2390 /* Try calculating (parity x) as (and (popcount x) 1), where
2391 popcount can also be done in a wider mode. */
2392 static rtx
2393 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2395 enum mode_class mclass = GET_MODE_CLASS (mode);
2396 opt_scalar_int_mode wider_mode_iter;
2397 FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2399 scalar_int_mode wider_mode = wider_mode_iter.require ();
2400 if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2402 rtx xop0, temp;
2403 rtx_insn *last;
2405 last = get_last_insn ();
2407 if (target == 0 || GET_MODE (target) != wider_mode)
2408 target = gen_reg_rtx (wider_mode);
2410 xop0 = widen_operand (op0, wider_mode, mode, true, false);
2411 temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2412 true);
2413 if (temp != 0)
2414 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2415 target, true, OPTAB_DIRECT);
2417 if (temp)
2419 if (mclass != MODE_INT
2420 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2421 return convert_to_mode (mode, temp, 0);
2422 else
2423 return gen_lowpart (mode, temp);
2425 else
2426 delete_insns_since (last);
2429 return 0;
2432 /* Try calculating ctz(x) as K - clz(x & -x),
2433 where K is GET_MODE_PRECISION(mode) - 1.
2435 Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2436 don't have to worry about what the hardware does in that case. (If
2437 the clz instruction produces the usual value at 0, which is K, the
2438 result of this code sequence will be -1; expand_ffs, below, relies
2439 on this. It might be nice to have it be K instead, for consistency
2440 with the (very few) processors that provide a ctz with a defined
2441 value, but that would take one more instruction, and it would be
2442 less convenient for expand_ffs anyway.) */
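/* Worked example in a hypothetical 8-bit mode (K = 7): for
   x = 0b00010100, x & -x == 0b00000100 isolates the lowest set bit,
   clz of that is 5, and K - 5 == 2 == ctz (x).  */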
2444 static rtx
2445 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2447 rtx_insn *seq;
2448 rtx temp;
2450 if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2451 return 0;
2453 start_sequence ();
2455 temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2456 if (temp)
2457 temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2458 true, OPTAB_DIRECT);
2459 if (temp)
2460 temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2461 if (temp)
2462 temp = expand_binop (mode, sub_optab,
2463 gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2464 temp, target,
2465 true, OPTAB_DIRECT);
2466 if (temp == 0)
2468 end_sequence ();
2469 return 0;
2472 seq = get_insns ();
2473 end_sequence ();
2475 add_equal_note (seq, temp, CTZ, op0, 0);
2476 emit_insn (seq);
2477 return temp;
2481 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2482 else with the sequence used by expand_clz.
2484 The ffs builtin promises to return zero for a zero value and ctz/clz
2485 may have an undefined value in that case. If they do not give us a
2486 convenient value, we have to generate a test and branch. */
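/* The identity relied on here, sketched for the ctz path:

       ffs (x) == ctz (x) + 1   for x != 0,   ffs (0) == 0

   so the fixup below only needs to force the x == 0 case to -1
   before the final increment.  */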
2487 static rtx
2488 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2490 HOST_WIDE_INT val = 0;
2491 bool defined_at_zero = false;
2492 rtx temp;
2493 rtx_insn *seq;
2495 if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2497 start_sequence ();
2499 temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2500 if (!temp)
2501 goto fail;
2503 defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2505 else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2507 start_sequence ();
2508 temp = expand_ctz (mode, op0, 0);
2509 if (!temp)
2510 goto fail;
2512 if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2514 defined_at_zero = true;
2515 val = (GET_MODE_PRECISION (mode) - 1) - val;
2518 else
2519 return 0;
2521 if (defined_at_zero && val == -1)
2522 /* No correction needed at zero. */;
2523 else
2525 /* We don't try to do anything clever with the situation found
2526 on some processors (e.g. Alpha) where ctz(0:mode) ==
2527 bitsize(mode). If someone can think of a way to send N to -1
2528 and leave alone all values in the range 0..N-1 (where N is a
2529 power of two), cheaper than this test-and-branch, please add it.
2531 The test-and-branch is done after the operation itself, in case
2532 the operation sets condition codes that can be recycled for this.
2533 (This is true on i386, for instance.) */
2535 rtx_code_label *nonzero_label = gen_label_rtx ();
2536 emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2537 mode, true, nonzero_label);
2539 convert_move (temp, GEN_INT (-1), false);
2540 emit_label (nonzero_label);
2543 /* temp now has a value in the range -1..bitsize-1. ffs is supposed
2544 to produce a value in the range 0..bitsize. */
2545 temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2546 target, false, OPTAB_DIRECT);
2547 if (!temp)
2548 goto fail;
2550 seq = get_insns ();
2551 end_sequence ();
2553 add_equal_note (seq, temp, FFS, op0, 0);
2554 emit_insn (seq);
2555 return temp;
2557 fail:
2558 end_sequence ();
2559 return 0;
2562 /* Extract the OMODE lowpart from VAL, which has IMODE. Under certain
2563 conditions, VAL may already be a SUBREG against which we cannot generate
2564 a further SUBREG. In this case, we expect forcing the value into a
2565 register will work around the situation. */
2567 static rtx
2568 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2569 machine_mode imode)
2571 rtx ret;
2572 ret = lowpart_subreg (omode, val, imode);
2573 if (ret == NULL)
2575 val = force_reg (imode, val);
2576 ret = lowpart_subreg (omode, val, imode);
2577 gcc_assert (ret != NULL);
2579 return ret;
2582 /* Expand a floating point absolute value or negation operation via a
2583 logical operation on the sign bit. */
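/* Sketch for IEEE single precision, where the sign occupies bit 31
   of the 32-bit image of the value:

       abs: bits & 0x7fffffff    clear the sign bit
       neg: bits ^ 0x80000000    flip the sign bit

   The AND/XOR choice below generalizes this to any format with a
   simple sign bit.  */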
2585 static rtx
2586 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2587 rtx op0, rtx target)
2589 const struct real_format *fmt;
2590 int bitpos, word, nwords, i;
2591 scalar_int_mode imode;
2592 rtx temp;
2593 rtx_insn *insns;
2595 /* The format has to have a simple sign bit. */
2596 fmt = REAL_MODE_FORMAT (mode);
2597 if (fmt == NULL)
2598 return NULL_RTX;
2600 bitpos = fmt->signbit_rw;
2601 if (bitpos < 0)
2602 return NULL_RTX;
2604 /* Don't create negative zeros if the format doesn't support them. */
2605 if (code == NEG && !fmt->has_signed_zero)
2606 return NULL_RTX;
2608 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2610 if (!int_mode_for_mode (mode).exists (&imode))
2611 return NULL_RTX;
2612 word = 0;
2613 nwords = 1;
2615 else
2617 imode = word_mode;
2619 if (FLOAT_WORDS_BIG_ENDIAN)
2620 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2621 else
2622 word = bitpos / BITS_PER_WORD;
2623 bitpos = bitpos % BITS_PER_WORD;
2624 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2627 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2628 if (code == ABS)
2629 mask = ~mask;
2631 if (target == 0
2632 || target == op0
2633 || (nwords > 1 && !valid_multiword_target_p (target)))
2634 target = gen_reg_rtx (mode);
2636 if (nwords > 1)
2638 start_sequence ();
2640 for (i = 0; i < nwords; ++i)
2642 rtx targ_piece = operand_subword (target, i, 1, mode);
2643 rtx op0_piece = operand_subword_force (op0, i, mode);
2645 if (i == word)
2647 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2648 op0_piece,
2649 immed_wide_int_const (mask, imode),
2650 targ_piece, 1, OPTAB_LIB_WIDEN);
2651 if (temp != targ_piece)
2652 emit_move_insn (targ_piece, temp);
2654 else
2655 emit_move_insn (targ_piece, op0_piece);
2658 insns = get_insns ();
2659 end_sequence ();
2661 emit_insn (insns);
2663 else
2665 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2666 gen_lowpart (imode, op0),
2667 immed_wide_int_const (mask, imode),
2668 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2669 target = lowpart_subreg_maybe_copy (mode, temp, imode);
2671 set_dst_reg_note (get_last_insn (), REG_EQUAL,
2672 gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2673 target);
2676 return target;
2679 /* As expand_unop, but will fail rather than attempt the operation in a
2680 different mode or with a libcall. */
2681 static rtx
2682 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2683 int unsignedp)
2685 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2687 struct expand_operand ops[2];
2688 enum insn_code icode = optab_handler (unoptab, mode);
2689 rtx_insn *last = get_last_insn ();
2690 rtx_insn *pat;
2692 create_output_operand (&ops[0], target, mode);
2693 create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2694 pat = maybe_gen_insn (icode, 2, ops);
2695 if (pat)
2697 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2698 && ! add_equal_note (pat, ops[0].value,
2699 optab_to_code (unoptab),
2700 ops[1].value, NULL_RTX))
2702 delete_insns_since (last);
2703 return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2706 emit_insn (pat);
2708 return ops[0].value;
2711 return 0;
2714 /* Generate code to perform an operation specified by UNOPTAB
2715 on operand OP0, with result having machine-mode MODE.
2717 UNSIGNEDP is for the case where we have to widen the operands
2718 to perform the operation. It says to use zero-extension.
2720 If TARGET is nonzero, the value
2721 is generated there, if it is convenient to do so.
2722 In all cases an rtx is returned for the locus of the value;
2723 this may or may not be TARGET. */
2726 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2727 int unsignedp)
2729 enum mode_class mclass = GET_MODE_CLASS (mode);
2730 machine_mode wider_mode;
2731 scalar_int_mode int_mode;
2732 scalar_float_mode float_mode;
2733 rtx temp;
2734 rtx libfunc;
2736 temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2737 if (temp)
2738 return temp;
2740 /* It can't be done in this mode. Can we open-code it in a wider mode? */
2742 /* Widening (or narrowing) clz needs special treatment. */
2743 if (unoptab == clz_optab)
2745 if (is_a <scalar_int_mode> (mode, &int_mode))
2747 temp = widen_leading (int_mode, op0, target, unoptab);
2748 if (temp)
2749 return temp;
2751 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2752 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2754 temp = expand_doubleword_clz (int_mode, op0, target);
2755 if (temp)
2756 return temp;
2760 goto try_libcall;
2763 if (unoptab == clrsb_optab)
2765 if (is_a <scalar_int_mode> (mode, &int_mode))
2767 temp = widen_leading (int_mode, op0, target, unoptab);
2768 if (temp)
2769 return temp;
2771 goto try_libcall;
2774 if (unoptab == popcount_optab
2775 && is_a <scalar_int_mode> (mode, &int_mode)
2776 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2777 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2778 && optimize_insn_for_speed_p ())
2780 temp = expand_doubleword_popcount (int_mode, op0, target);
2781 if (temp)
2782 return temp;
2785 if (unoptab == parity_optab
2786 && is_a <scalar_int_mode> (mode, &int_mode)
2787 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2788 && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2789 || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2790 && optimize_insn_for_speed_p ())
2792 temp = expand_doubleword_parity (int_mode, op0, target);
2793 if (temp)
2794 return temp;
2797 /* Widening (or narrowing) bswap needs special treatment. */
2798 if (unoptab == bswap_optab)
2800 /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2801 or ROTATERT. First try these directly; if this fails, then try the
2802 obvious pair of shifts with allowed widening, as this will probably
2803 always be more efficient than the other fallback methods. */
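/* Sketch for a hypothetical 16-bit x: rotating by 8 in either
   direction swaps the two bytes, and so does

       (x << 8) | (x >> 8)

   computed with logical shifts, which is the widening fallback tried
   after the rotates.  */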
2804 if (mode == HImode)
2806 rtx_insn *last;
2807 rtx temp1, temp2;
2809 if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2811 temp = expand_binop (mode, rotl_optab, op0,
2812 gen_int_shift_amount (mode, 8),
2813 target, unsignedp, OPTAB_DIRECT);
2814 if (temp)
2815 return temp;
2818 if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2820 temp = expand_binop (mode, rotr_optab, op0,
2821 gen_int_shift_amount (mode, 8),
2822 target, unsignedp, OPTAB_DIRECT);
2823 if (temp)
2824 return temp;
2827 last = get_last_insn ();
2829 temp1 = expand_binop (mode, ashl_optab, op0,
2830 gen_int_shift_amount (mode, 8), NULL_RTX,
2831 unsignedp, OPTAB_WIDEN);
2832 temp2 = expand_binop (mode, lshr_optab, op0,
2833 gen_int_shift_amount (mode, 8), NULL_RTX,
2834 unsignedp, OPTAB_WIDEN);
2835 if (temp1 && temp2)
2837 temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2838 unsignedp, OPTAB_WIDEN);
2839 if (temp)
2840 return temp;
2843 delete_insns_since (last);
2846 if (is_a <scalar_int_mode> (mode, &int_mode))
2848 temp = widen_bswap (int_mode, op0, target);
2849 if (temp)
2850 return temp;
2852 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2853 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2855 temp = expand_doubleword_bswap (mode, op0, target);
2856 if (temp)
2857 return temp;
2861 goto try_libcall;
2864 if (CLASS_HAS_WIDER_MODES_P (mclass))
2865 FOR_EACH_WIDER_MODE (wider_mode, mode)
2867 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2869 rtx xop0 = op0;
2870 rtx_insn *last = get_last_insn ();
2872 /* For certain operations, we need not actually extend
2873 the narrow operand, as long as we will truncate the
2874 results to the same narrowness. */
2876 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2877 (unoptab == neg_optab
2878 || unoptab == one_cmpl_optab)
2879 && mclass == MODE_INT);
2881 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2882 unsignedp);
2884 if (temp)
2886 if (mclass != MODE_INT
2887 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2889 if (target == 0)
2890 target = gen_reg_rtx (mode);
2891 convert_move (target, temp, 0);
2892 return target;
2894 else
2895 return gen_lowpart (mode, temp);
2897 else
2898 delete_insns_since (last);
2902 /* These can be done a word at a time. */
2903 if (unoptab == one_cmpl_optab
2904 && is_int_mode (mode, &int_mode)
2905 && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2906 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2908 int i;
2909 rtx_insn *insns;
2911 if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2912 target = gen_reg_rtx (int_mode);
2914 start_sequence ();
2916 /* Do the actual arithmetic. */
2917 for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2919 rtx target_piece = operand_subword (target, i, 1, int_mode);
2920 rtx x = expand_unop (word_mode, unoptab,
2921 operand_subword_force (op0, i, int_mode),
2922 target_piece, unsignedp);
2924 if (target_piece != x)
2925 emit_move_insn (target_piece, x);
2928 insns = get_insns ();
2929 end_sequence ();
2931 emit_insn (insns);
2932 return target;
2935 if (optab_to_code (unoptab) == NEG)
2937 /* Try negating floating point values by flipping the sign bit. */
2938 if (is_a <scalar_float_mode> (mode, &float_mode))
2940 temp = expand_absneg_bit (NEG, float_mode, op0, target);
2941 if (temp)
2942 return temp;
2945 /* If there is no negation pattern, and we have no negative zero,
2946 try subtracting from zero. */
2947 if (!HONOR_SIGNED_ZEROS (mode))
2949 temp = expand_binop (mode, (unoptab == negv_optab
2950 ? subv_optab : sub_optab),
2951 CONST0_RTX (mode), op0, target,
2952 unsignedp, OPTAB_DIRECT);
2953 if (temp)
2954 return temp;
2958 /* Try calculating parity (x) as popcount (x) % 2. */
2959 if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2961 temp = expand_parity (int_mode, op0, target);
2962 if (temp)
2963 return temp;
2966 /* Try implementing ffs (x) in terms of clz (x). */
2967 if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2969 temp = expand_ffs (int_mode, op0, target);
2970 if (temp)
2971 return temp;
2974 /* Try implementing ctz (x) in terms of clz (x). */
2975 if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2977 temp = expand_ctz (int_mode, op0, target);
2978 if (temp)
2979 return temp;
2982 try_libcall:
2983 /* Now try a library call in this mode. */
2984 libfunc = optab_libfunc (unoptab, mode);
2985 if (libfunc)
2987 rtx_insn *insns;
2988 rtx value;
2989 rtx eq_value;
2990 machine_mode outmode = mode;
2992 /* All of these functions return small values. Thus we choose to
2993 have them return something that isn't a double-word. */
2994 if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
2995 || unoptab == clrsb_optab || unoptab == popcount_optab
2996 || unoptab == parity_optab)
2997 outmode
2998 = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
2999 optab_libfunc (unoptab, mode)));
3001 start_sequence ();
3003 /* Pass 1 for NO_QUEUE so we don't lose any increments
3004 if the libcall is cse'd or moved. */
3005 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3006 op0, mode);
3007 insns = get_insns ();
3008 end_sequence ();
3010 target = gen_reg_rtx (outmode);
3011 bool trapv = trapv_unoptab_p (unoptab);
3012 if (trapv)
3013 eq_value = NULL_RTX;
3014 else
3016 eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3017 if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3018 eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3019 else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3020 eq_value = simplify_gen_unary (ZERO_EXTEND,
3021 outmode, eq_value, mode);
3023 emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3025 return target;
3028 /* It can't be done in this mode. Can we do it in a wider mode? */
3030 if (CLASS_HAS_WIDER_MODES_P (mclass))
3032 FOR_EACH_WIDER_MODE (wider_mode, mode)
3034 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3035 || optab_libfunc (unoptab, wider_mode))
3037 rtx xop0 = op0;
3038 rtx_insn *last = get_last_insn ();
3040 /* For certain operations, we need not actually extend
3041 the narrow operand, as long as we will truncate the
3042 results to the same narrowness. */
3043 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3044 (unoptab == neg_optab
3045 || unoptab == one_cmpl_optab
3046 || unoptab == bswap_optab)
3047 && mclass == MODE_INT);
3049 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3050 unsignedp);
3052 /* If we are generating clz using a wider mode, adjust the
3053 result. Similarly for clrsb. */
3054 if ((unoptab == clz_optab || unoptab == clrsb_optab)
3055 && temp != 0)
3057 scalar_int_mode wider_int_mode
3058 = as_a <scalar_int_mode> (wider_mode);
3059 int_mode = as_a <scalar_int_mode> (mode);
3060 temp = expand_binop
3061 (wider_mode, sub_optab, temp,
3062 gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3063 - GET_MODE_PRECISION (int_mode),
3064 wider_int_mode),
3065 target, true, OPTAB_DIRECT);
3068 /* Likewise for bswap. */
3069 if (unoptab == bswap_optab && temp != 0)
3071 scalar_int_mode wider_int_mode
3072 = as_a <scalar_int_mode> (wider_mode);
3073 int_mode = as_a <scalar_int_mode> (mode);
3074 gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3075 == GET_MODE_BITSIZE (wider_int_mode)
3076 && GET_MODE_PRECISION (int_mode)
3077 == GET_MODE_BITSIZE (int_mode));
3079 temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3080 GET_MODE_BITSIZE (wider_int_mode)
3081 - GET_MODE_BITSIZE (int_mode),
3082 NULL_RTX, true);
3085 if (temp)
3087 if (mclass != MODE_INT)
3089 if (target == 0)
3090 target = gen_reg_rtx (mode);
3091 convert_move (target, temp, 0);
3092 return target;
3094 else
3095 return gen_lowpart (mode, temp);
3097 else
3098 delete_insns_since (last);
3103 /* One final attempt at implementing negation via subtraction,
3104 this time allowing widening of the operand. */
3105 if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3107 rtx temp;
3108 temp = expand_binop (mode,
3109 unoptab == negv_optab ? subv_optab : sub_optab,
3110 CONST0_RTX (mode), op0,
3111 target, unsignedp, OPTAB_LIB_WIDEN);
3112 if (temp)
3113 return temp;
3116 return 0;
3119 /* Emit code to compute the absolute value of OP0, with result to
3120 TARGET if convenient. (TARGET may be 0.) The return value says
3121 where the result actually is to be found.
3123 MODE is the mode of the operand; the mode of the result is
3124 different but can be deduced from MODE.
3129 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3130 int result_unsignedp)
3132 rtx temp;
3134 if (GET_MODE_CLASS (mode) != MODE_INT
3135 || ! flag_trapv)
3136 result_unsignedp = 1;
3138 /* First try to do it with a special abs instruction. */
3139 temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3140 op0, target, 0);
3141 if (temp != 0)
3142 return temp;
3144 /* For floating point modes, try clearing the sign bit. */
3145 scalar_float_mode float_mode;
3146 if (is_a <scalar_float_mode> (mode, &float_mode))
3148 temp = expand_absneg_bit (ABS, float_mode, op0, target);
3149 if (temp)
3150 return temp;
3153 /* If we have a MAX insn, we can do this as MAX (x, -x). */
3154 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3155 && !HONOR_SIGNED_ZEROS (mode))
3157 rtx_insn *last = get_last_insn ();
3159 temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3160 op0, NULL_RTX, 0);
3161 if (temp != 0)
3162 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3163 OPTAB_WIDEN);
3165 if (temp != 0)
3166 return temp;
3168 delete_insns_since (last);
3171 /* If this machine has expensive jumps, we can do integer absolute
3172 value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3173 where W is the width of MODE. */
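/* Illustrative check of the identity (8-bit example): for x = -5,
   (signed) x >> 7 is -1, so (x ^ -1) - (-1) == ~x + 1 == 5; for
   x >= 0 the shift yields 0 and the expression reduces to x.  */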
3175 scalar_int_mode int_mode;
3176 if (is_int_mode (mode, &int_mode)
3177 && BRANCH_COST (optimize_insn_for_speed_p (),
3178 false) >= 2)
3180 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3181 GET_MODE_PRECISION (int_mode) - 1,
3182 NULL_RTX, 0);
3184 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3185 OPTAB_LIB_WIDEN);
3186 if (temp != 0)
3187 temp = expand_binop (int_mode,
3188 result_unsignedp ? sub_optab : subv_optab,
3189 temp, extended, target, 0, OPTAB_LIB_WIDEN);
3191 if (temp != 0)
3192 return temp;
3195 return NULL_RTX;
3199 expand_abs (machine_mode mode, rtx op0, rtx target,
3200 int result_unsignedp, int safe)
3202 rtx temp;
3203 rtx_code_label *op1;
3205 if (GET_MODE_CLASS (mode) != MODE_INT
3206 || ! flag_trapv)
3207 result_unsignedp = 1;
3209 temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3210 if (temp != 0)
3211 return temp;
3213 /* If that does not win, use conditional jump and negate. */
3215 /* It is safe to use the target if it is the same as the source,
3216 provided it is also a pseudo register. */
3217 if (op0 == target && REG_P (op0)
3218 && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3219 safe = 1;
3221 op1 = gen_label_rtx ();
3222 if (target == 0 || ! safe
3223 || GET_MODE (target) != mode
3224 || (MEM_P (target) && MEM_VOLATILE_P (target))
3225 || (REG_P (target)
3226 && REGNO (target) < FIRST_PSEUDO_REGISTER))
3227 target = gen_reg_rtx (mode);
3229 emit_move_insn (target, op0);
3230 NO_DEFER_POP;
3232 do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3233 NULL_RTX, NULL, op1,
3234 profile_probability::uninitialized ());
3236 op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3237 target, target, 0);
3238 if (op0 != target)
3239 emit_move_insn (target, op0);
3240 emit_label (op1);
3241 OK_DEFER_POP;
3242 return target;
3245 /* Emit code to compute the one's complement absolute value of OP0
3246 (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3247 (TARGET may be NULL_RTX.) The return value says where the result
3248 actually is to be found.
3250 MODE is the mode of the operand; the mode of the result is
3251 different but can be deduced from MODE. */
3254 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3256 rtx temp;
3258 /* Not applicable for floating point modes. */
3259 if (FLOAT_MODE_P (mode))
3260 return NULL_RTX;
3262 /* If we have a MAX insn, we can do this as MAX (x, ~x). */
3263 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3265 rtx_insn *last = get_last_insn ();
3267 temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3268 if (temp != 0)
3269 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3270 OPTAB_WIDEN);
3272 if (temp != 0)
3273 return temp;
3275 delete_insns_since (last);
3278 /* If this machine has expensive jumps, we can do one's complement
3279 absolute value of X as (((signed) x >> (W-1)) ^ x). */
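/* Illustrative check (8-bit example): for x = -5, (signed) x >> 7 is
   -1 and x ^ -1 == ~x == 4, the one's complement absolute value;
   for x >= 0 the shift yields 0 and x is returned unchanged.  */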
3281 scalar_int_mode int_mode;
3282 if (is_int_mode (mode, &int_mode)
3283 && BRANCH_COST (optimize_insn_for_speed_p (),
3284 false) >= 2)
3286 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3287 GET_MODE_PRECISION (int_mode) - 1,
3288 NULL_RTX, 0);
3290 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3291 OPTAB_LIB_WIDEN);
3293 if (temp != 0)
3294 return temp;
3297 return NULL_RTX;
3300 /* A subroutine of expand_copysign, perform the copysign operation using the
3301 abs and neg primitives advertised to exist on the target. The assumption
3302 is that we have a split register file, and leaving op0 in fp registers,
3303 and not playing with subregs so much, will help the register allocator. */
3305 static rtx
3306 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3307 int bitpos, bool op0_is_abs)
3309 scalar_int_mode imode;
3310 enum insn_code icode;
3311 rtx sign;
3312 rtx_code_label *label;
3314 if (target == op1)
3315 target = NULL_RTX;
3317 /* Check if the back end provides an insn that handles signbit for the
3318 argument's mode. */
3319 icode = optab_handler (signbit_optab, mode);
3320 if (icode != CODE_FOR_nothing)
3322 imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3323 sign = gen_reg_rtx (imode);
3324 emit_unop_insn (icode, sign, op1, UNKNOWN);
3326 else
3328 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3330 if (!int_mode_for_mode (mode).exists (&imode))
3331 return NULL_RTX;
3332 op1 = gen_lowpart (imode, op1);
3334 else
3336 int word;
3338 imode = word_mode;
3339 if (FLOAT_WORDS_BIG_ENDIAN)
3340 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3341 else
3342 word = bitpos / BITS_PER_WORD;
3343 bitpos = bitpos % BITS_PER_WORD;
3344 op1 = operand_subword_force (op1, word, mode);
3347 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3348 sign = expand_binop (imode, and_optab, op1,
3349 immed_wide_int_const (mask, imode),
3350 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3353 if (!op0_is_abs)
3355 op0 = expand_unop (mode, abs_optab, op0, target, 0);
3356 if (op0 == NULL)
3357 return NULL_RTX;
3358 target = op0;
3360 else
3362 if (target == NULL_RTX)
3363 target = copy_to_reg (op0);
3364 else
3365 emit_move_insn (target, op0);
3368 label = gen_label_rtx ();
3369 emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3371 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3372 op0 = simplify_unary_operation (NEG, mode, op0, mode);
3373 else
3374 op0 = expand_unop (mode, neg_optab, op0, target, 0);
3375 if (op0 != target)
3376 emit_move_insn (target, op0);
3378 emit_label (label);
3380 return target;
3384 /* A subroutine of expand_copysign, perform the entire copysign operation
3385 with integer bitmasks. BITPOS is the position of the sign bit; OP0_IS_ABS
3386 is true if op0 is known to have its sign bit clear. */
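/* Sketch for IEEE single precision, with bits0 and bits1 the integer
   images of op0 and op1 and the sign in bit 31:

       result = (bits0 & 0x7fffffff) | (bits1 & 0x80000000)

   The multiword loop below applies the same masks one word at a
   time.  */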
3388 static rtx
3389 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3390 int bitpos, bool op0_is_abs)
3392 scalar_int_mode imode;
3393 int word, nwords, i;
3394 rtx temp;
3395 rtx_insn *insns;
3397 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3399 if (!int_mode_for_mode (mode).exists (&imode))
3400 return NULL_RTX;
3401 word = 0;
3402 nwords = 1;
3404 else
3406 imode = word_mode;
3408 if (FLOAT_WORDS_BIG_ENDIAN)
3409 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3410 else
3411 word = bitpos / BITS_PER_WORD;
3412 bitpos = bitpos % BITS_PER_WORD;
3413 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3416 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3418 if (target == 0
3419 || target == op0
3420 || target == op1
3421 || (nwords > 1 && !valid_multiword_target_p (target)))
3422 target = gen_reg_rtx (mode);
3424 if (nwords > 1)
3426 start_sequence ();
3428 for (i = 0; i < nwords; ++i)
3430 rtx targ_piece = operand_subword (target, i, 1, mode);
3431 rtx op0_piece = operand_subword_force (op0, i, mode);
3433 if (i == word)
3435 if (!op0_is_abs)
3436 op0_piece
3437 = expand_binop (imode, and_optab, op0_piece,
3438 immed_wide_int_const (~mask, imode),
3439 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3440 op1 = expand_binop (imode, and_optab,
3441 operand_subword_force (op1, i, mode),
3442 immed_wide_int_const (mask, imode),
3443 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3445 temp = expand_binop (imode, ior_optab, op0_piece, op1,
3446 targ_piece, 1, OPTAB_LIB_WIDEN);
3447 if (temp != targ_piece)
3448 emit_move_insn (targ_piece, temp);
3450 else
3451 emit_move_insn (targ_piece, op0_piece);
3454 insns = get_insns ();
3455 end_sequence ();
3457 emit_insn (insns);
3459 else
3461 op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3462 immed_wide_int_const (mask, imode),
3463 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3465 op0 = gen_lowpart (imode, op0);
3466 if (!op0_is_abs)
3467 op0 = expand_binop (imode, and_optab, op0,
3468 immed_wide_int_const (~mask, imode),
3469 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3471 temp = expand_binop (imode, ior_optab, op0, op1,
3472 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3473 target = lowpart_subreg_maybe_copy (mode, temp, imode);
3476 return target;
3479 /* Expand the C99 copysign operation. OP0 and OP1 must have the same
3480 scalar floating point mode. Return NULL if we do not know how to
3481 expand the operation inline. */
3484 expand_copysign (rtx op0, rtx op1, rtx target)
3486 scalar_float_mode mode;
3487 const struct real_format *fmt;
3488 bool op0_is_abs;
3489 rtx temp;
3491 mode = as_a <scalar_float_mode> (GET_MODE (op0));
3492 gcc_assert (GET_MODE (op1) == mode);
3494 /* First try to do it with a special instruction. */
3495 temp = expand_binop (mode, copysign_optab, op0, op1,
3496 target, 0, OPTAB_DIRECT);
3497 if (temp)
3498 return temp;
3500 fmt = REAL_MODE_FORMAT (mode);
3501 if (fmt == NULL || !fmt->has_signed_zero)
3502 return NULL_RTX;
3504 op0_is_abs = false;
3505 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3507 if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3508 op0 = simplify_unary_operation (ABS, mode, op0, mode);
3509 op0_is_abs = true;
3512 if (fmt->signbit_ro >= 0
3513 && (CONST_DOUBLE_AS_FLOAT_P (op0)
3514 || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3515 && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3517 temp = expand_copysign_absneg (mode, op0, op1, target,
3518 fmt->signbit_ro, op0_is_abs);
3519 if (temp)
3520 return temp;
3523 if (fmt->signbit_rw < 0)
3524 return NULL_RTX;
3525 return expand_copysign_bit (mode, op0, op1, target,
3526 fmt->signbit_rw, op0_is_abs);
3529 /* Generate an instruction whose insn-code is INSN_CODE,
3530 with two operands: an output TARGET and an input OP0.
3531 TARGET *must* be nonzero, and the output is always stored there.
3532 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3533 the value that is stored into TARGET.
3535 Return false if expansion failed. */
3537 bool
3538 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3539 enum rtx_code code)
3541 struct expand_operand ops[2];
3542 rtx_insn *pat;
3544 create_output_operand (&ops[0], target, GET_MODE (target));
3545 create_input_operand (&ops[1], op0, GET_MODE (op0));
3546 pat = maybe_gen_insn (icode, 2, ops);
3547 if (!pat)
3548 return false;
3550 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3551 && code != UNKNOWN)
3552 add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3554 emit_insn (pat);
3556 if (ops[0].value != target)
3557 emit_move_insn (target, ops[0].value);
3558 return true;
3560 /* Generate an instruction whose insn-code is INSN_CODE,
3561 with two operands: an output TARGET and an input OP0.
3562 TARGET *must* be nonzero, and the output is always stored there.
3563 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3564 the value that is stored into TARGET. */
3566 void
3567 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3569 bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3570 gcc_assert (ok);
3573 struct no_conflict_data
3575 rtx target;
3576 rtx_insn *first, *insn;
3577 bool must_stay;
3580 /* Called via note_stores by emit_libcall_block. Set P->must_stay if
3581 the currently examined clobber / store has to stay in the list of
3582 insns that constitute the actual libcall block. */
3583 static void
3584 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3586 struct no_conflict_data *p= (struct no_conflict_data *) p0;
3588 /* If this insn directly contributes to setting the target, it must stay. */
3589 if (reg_overlap_mentioned_p (p->target, dest))
3590 p->must_stay = true;
3591 /* If we haven't committed to keeping any other insns in the list yet,
3592 there is nothing more to check. */
3593 else if (p->insn == p->first)
3594 return;
3595 /* If this insn sets / clobbers a register that feeds one of the insns
3596 already in the list, this insn has to stay too. */
3597 else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3598 || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3599 || reg_used_between_p (dest, p->first, p->insn)
3600 /* Likewise if this insn depends on a register set by a previous
3601 insn in the list, or if it sets a result (presumably a hard
3602 register) that is set or clobbered by a previous insn.
3603 N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3604 SET_DEST perform the former check on the address, and the latter
3605 check on the MEM. */
3606 || (GET_CODE (set) == SET
3607 && (modified_in_p (SET_SRC (set), p->first)
3608 || modified_in_p (SET_DEST (set), p->first)
3609 || modified_between_p (SET_SRC (set), p->first, p->insn)
3610 || modified_between_p (SET_DEST (set), p->first, p->insn))))
3611 p->must_stay = true;
3615 /* Emit code to make a call to a constant function or a library call.
3617 INSNS is a list containing all insns emitted in the call.
3618 These insns leave the result in RESULT. Our job is to copy RESULT
3619 to TARGET, which is logically equivalent to EQUIV.
3621 We first emit any insns that set a pseudo on the assumption that these are
3622 loading constants into registers; doing so allows them to be safely cse'ed
3623 between blocks. Then we emit all the other insns in the block, followed by
3624 an insn to move RESULT to TARGET. This last insn will have a REG_EQUAL
3625 note with an operand of EQUIV. */
3627 static void
3628 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3629 bool equiv_may_trap)
3631 rtx final_dest = target;
3632 rtx_insn *next, *last, *insn;
3634 /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3635 into a MEM later. Protect the libcall block from this change. */
3636 if (! REG_P (target) || REG_USERVAR_P (target))
3637 target = gen_reg_rtx (GET_MODE (target));
3639 /* If we're using non-call exceptions, a libcall corresponding to an
3640 operation that may trap may also trap. */
3641 /* ??? See the comment in front of make_reg_eh_region_note. */
3642 if (cfun->can_throw_non_call_exceptions
3643 && (equiv_may_trap || may_trap_p (equiv)))
3645 for (insn = insns; insn; insn = NEXT_INSN (insn))
3646 if (CALL_P (insn))
3648 rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3649 if (note)
3651 int lp_nr = INTVAL (XEXP (note, 0));
3652 if (lp_nr == 0 || lp_nr == INT_MIN)
3653 remove_note (insn, note);
3657 else
3659 /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3660 reg note to indicate that this call cannot throw or execute a nonlocal
3661 goto (unless there is already a REG_EH_REGION note, in which case
3662 we update it). */
3663 for (insn = insns; insn; insn = NEXT_INSN (insn))
3664 if (CALL_P (insn))
3665 make_reg_eh_region_note_nothrow_nononlocal (insn);
3668 /* First emit all insns that set pseudos. Remove them from the list as
3669 we go. Avoid insns that set pseudos which were referenced in previous
3670 insns. These can be generated by move_by_pieces, for example,
3671 to update an address. Similarly, avoid insns that reference things
3672 set in previous insns. */
3674 for (insn = insns; insn; insn = next)
3676 rtx set = single_set (insn);
3678 next = NEXT_INSN (insn);
3680 if (set != 0 && REG_P (SET_DEST (set))
3681 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3683 struct no_conflict_data data;
3685 data.target = const0_rtx;
3686 data.first = insns;
3687 data.insn = insn;
3688 data.must_stay = 0;
3689 note_stores (PATTERN (insn), no_conflict_move_test, &data);
3690 if (! data.must_stay)
3692 if (PREV_INSN (insn))
3693 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3694 else
3695 insns = next;
3697 if (next)
3698 SET_PREV_INSN (next) = PREV_INSN (insn);
3700 add_insn (insn);
3704 /* Some ports use a loop to copy large arguments onto the stack.
3705 Don't move anything outside such a loop. */
3706 if (LABEL_P (insn))
3707 break;
3710 /* Write the remaining insns followed by the final copy. */
3711 for (insn = insns; insn; insn = next)
3713 next = NEXT_INSN (insn);
3715 add_insn (insn);
3718 last = emit_move_insn (target, result);
3719 if (equiv)
3720 set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3722 if (final_dest != target)
3723 emit_move_insn (final_dest, target);
3726 void
3727 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3729 emit_libcall_block_1 (insns, target, result, equiv, false);
3732 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3733 PURPOSE describes how this comparison will be used. CODE is the rtx
3734 comparison code we will be using.
3736 ??? Actually, CODE is slightly weaker than that. A target is still
3737 required to implement all of the normal bcc operations, but not
3738 required to implement all (or any) of the unordered bcc operations. */
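/* Example (illustrative): can_compare_p (EQ, SImode, ccp_jump) asks
   whether some cbranch<mode>4 pattern, for SImode or a wider integer
   mode, accepts (eq (reg:SI) (reg:SI)); ccp_store_flag asks the same
   question of cstore<mode>4 instead.  */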
3741 can_compare_p (enum rtx_code code, machine_mode mode,
3742 enum can_compare_purpose purpose)
3744 rtx test;
3745 test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3748 enum insn_code icode;
3750 if (purpose == ccp_jump
3751 && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3752 && insn_operand_matches (icode, 0, test))
3753 return 1;
3754 if (purpose == ccp_store_flag
3755 && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3756 && insn_operand_matches (icode, 1, test))
3757 return 1;
3758 if (purpose == ccp_cmov
3759 && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3760 return 1;
3762 mode = GET_MODE_WIDER_MODE (mode).else_void ();
3763 PUT_MODE (test, mode);
3765 while (mode != VOIDmode);
3767 return 0;
3770 /* This function is called when we are going to emit a compare instruction that
3771 compares the values found in X and Y, using the rtl operator COMPARISON.
3773 If they have mode BLKmode, then SIZE specifies the size of both operands.
3775 UNSIGNEDP nonzero says that the operands are unsigned;
3776 this matters if they need to be widened (as given by METHODS).
3778 *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3779 if we failed to produce one.
3781 *PMODE is the mode of the inputs (in case they are const_int).
3783 This function performs all the setup necessary so that the caller only has
3784 to emit a single comparison insn. This setup can involve doing a BLKmode
3785 comparison or emitting a library call to perform the comparison if no insn
3786 is available to handle it.
3787 The values which are passed in through pointers can be modified; the caller
3788 should perform the comparison on the modified values. Constant
3789 comparisons must have already been folded. */
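/* Illustrative caller's view (assumed, not verbatim): after

       rtx test;
       machine_mode m = SImode;
       prepare_cmp_insn (a, b, GT, NULL_RTX, 0, OPTAB_LIB_WIDEN, &test, &m);

   *PTEST is something like (gt (reg:SI a') (reg:SI b')) whose operands
   already satisfy the cbranchsi4 predicates, and *PMODE is the mode in
   which the comparison was actually prepared.  */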
3791 static void
3792 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3793 int unsignedp, enum optab_methods methods,
3794 rtx *ptest, machine_mode *pmode)
3796 machine_mode mode = *pmode;
3797 rtx libfunc, test;
3798 machine_mode cmp_mode;
3799 enum mode_class mclass;
3801 /* The other methods are not needed. */
3802 gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3803 || methods == OPTAB_LIB_WIDEN);
3805 /* If we are optimizing, force expensive constants into a register. */
3806 if (CONSTANT_P (x) && optimize
3807 && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3808 > COSTS_N_INSNS (1)))
3809 x = force_reg (mode, x);
3811 if (CONSTANT_P (y) && optimize
3812 && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3813 > COSTS_N_INSNS (1)))
3814 y = force_reg (mode, y);
3816 #if HAVE_cc0
3817 /* Make sure we have a canonical comparison. The RTL
3818 documentation states that canonical comparisons are required only
3819 for targets which have cc0. */
3820 gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3821 #endif
3823 /* Don't let both operands fail to indicate the mode. */
3824 if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3825 x = force_reg (mode, x);
3826 if (mode == VOIDmode)
3827 mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3829 /* Handle all BLKmode compares. */
3831 if (mode == BLKmode)
3833 machine_mode result_mode;
3834 enum insn_code cmp_code;
3835 rtx result;
3836 rtx opalign
3837 = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3839 gcc_assert (size);
3841 /* Try to use a memory block compare insn - either cmpstr
3842 or cmpmem will do. */
3843 opt_scalar_int_mode cmp_mode_iter;
3844 FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3846 scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3847 cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3848 if (cmp_code == CODE_FOR_nothing)
3849 cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3850 if (cmp_code == CODE_FOR_nothing)
3851 cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3852 if (cmp_code == CODE_FOR_nothing)
3853 continue;
3855 /* Must make sure the size fits the insn's mode. */
3856 if (CONST_INT_P (size)
3857 ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3858 : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3859 > GET_MODE_BITSIZE (cmp_mode)))
3860 continue;
3862 result_mode = insn_data[cmp_code].operand[0].mode;
3863 result = gen_reg_rtx (result_mode);
3864 size = convert_to_mode (cmp_mode, size, 1);
3865 emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3867 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3868 *pmode = result_mode;
3869 return;
3872 if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3873 goto fail;
3875 /* Otherwise call a library function. */
3876 result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3878 x = result;
3879 y = const0_rtx;
3880 mode = TYPE_MODE (integer_type_node);
3881 methods = OPTAB_LIB_WIDEN;
3882 unsignedp = false;
3885 /* Don't allow operands to the compare to trap, as that can put the
3886 compare and branch in different basic blocks. */
3887 if (cfun->can_throw_non_call_exceptions)
3889 if (may_trap_p (x))
3890 x = copy_to_reg (x);
3891 if (may_trap_p (y))
3892 y = copy_to_reg (y);
3895 if (GET_MODE_CLASS (mode) == MODE_CC)
3897 enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3898 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3899 gcc_assert (icode != CODE_FOR_nothing
3900 && insn_operand_matches (icode, 0, test));
3901 *ptest = test;
3902 return;
3905 mclass = GET_MODE_CLASS (mode);
3906 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3907 FOR_EACH_MODE_FROM (cmp_mode, mode)
3909 enum insn_code icode;
3910 icode = optab_handler (cbranch_optab, cmp_mode);
3911 if (icode != CODE_FOR_nothing
3912 && insn_operand_matches (icode, 0, test))
3914 rtx_insn *last = get_last_insn ();
3915 rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3916 rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3917 if (op0 && op1
3918 && insn_operand_matches (icode, 1, op0)
3919 && insn_operand_matches (icode, 2, op1))
3921 XEXP (test, 0) = op0;
3922 XEXP (test, 1) = op1;
3923 *ptest = test;
3924 *pmode = cmp_mode;
3925 return;
3927 delete_insns_since (last);
3930 if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3931 break;
3934 if (methods != OPTAB_LIB_WIDEN)
3935 goto fail;
3937 if (!SCALAR_FLOAT_MODE_P (mode))
3939 rtx result;
3940 machine_mode ret_mode;
3942 /* Handle a libcall just for the mode we are using. */
3943 libfunc = optab_libfunc (cmp_optab, mode);
3944 gcc_assert (libfunc);
3946 /* If we want unsigned, and this mode has a distinct unsigned
3947 comparison routine, use that. */
3948 if (unsignedp)
3950 rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3951 if (ulibfunc)
3952 libfunc = ulibfunc;
3955 ret_mode = targetm.libgcc_cmp_return_mode ();
3956 result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3957 ret_mode, x, mode, y, mode);
3959 /* There are two kinds of comparison routines. Biased routines
3960 return 0/1/2, and unbiased routines return -1/0/1. Other parts
3961 of gcc expect that the comparison operation is equivalent
3962 to the modified comparison. For signed comparisons compare the
3963 result against 1 in the biased case, and zero in the unbiased
3964 case. For unsigned comparisons always compare against 1 after
3965 biasing the unbiased result by adding 1. This gives us a way to
3966 represent LTU.
3967 The comparisons in the fixed-point helper library are always
3968 biased. */
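/* Worked example (illustrative): libgcc's __ucmpdi2 is biased and
   returns 0/1/2 for less/equal/greater, so "x LTU y" becomes
   "__ucmpdi2 (x, y) LTU 1".  An unbiased routine returning -1/0/1
   first has 1 added to its result so that the same compare against 1
   applies; for signed comparisons the unbiased result is instead
   compared directly against 0.  */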
3969 x = result;
3970 y = const1_rtx;
3972 if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3974 if (unsignedp)
3975 x = plus_constant (ret_mode, result, 1);
3976 else
3977 y = const0_rtx;
3980 *pmode = ret_mode;
3981 prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
3982 ptest, pmode);
3984 else
3985 prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3987 return;
3989 fail:
3990 *ptest = NULL_RTX;
3993 /* Before emitting an insn with code ICODE, make sure that X, which is going
3994 to be used for operand OPNUM of the insn, is converted from mode MODE to
3995 WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
3996 that it is accepted by the operand predicate. Return the new value. */
3999 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4000 machine_mode wider_mode, int unsignedp)
4002 if (mode != wider_mode)
4003 x = convert_modes (wider_mode, mode, x, unsignedp);
4005 if (!insn_operand_matches (icode, opnum, x))
4007 machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4008 if (reload_completed)
4009 return NULL_RTX;
4010 if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4011 return NULL_RTX;
4012 x = copy_to_mode_reg (op_mode, x);
4015 return x;
4018 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4019 we can do the branch. */
4021 static void
4022 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4023 profile_probability prob)
4025 machine_mode optab_mode;
4026 enum mode_class mclass;
4027 enum insn_code icode;
4028 rtx_insn *insn;
4030 mclass = GET_MODE_CLASS (mode);
4031 optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4032 icode = optab_handler (cbranch_optab, optab_mode);
4034 gcc_assert (icode != CODE_FOR_nothing);
4035 gcc_assert (insn_operand_matches (icode, 0, test));
4036 insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4037 XEXP (test, 1), label));
4038 if (prob.initialized_p ()
4039 && profile_status_for_fn (cfun) != PROFILE_ABSENT
4040 && insn
4041 && JUMP_P (insn)
4042 && any_condjump_p (insn)
4043 && !find_reg_note (insn, REG_BR_PROB, 0))
4044 add_reg_br_prob_note (insn, prob);
4047 /* Generate code to compare X with Y so that the condition codes are
4048 set and to jump to LABEL if the condition is true. If X is a
4049 constant and Y is not a constant, then the comparison is swapped to
4050 ensure that the comparison RTL has the canonical form.
4052 UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4053 need to be widened. UNSIGNEDP is also used to select the proper
4054 branch condition code.
4056 If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4058 MODE is the mode of the inputs (in case they are const_int).
4060 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4061 It will be potentially converted into an unsigned variant based on
4062 UNSIGNEDP to select a proper jump instruction.
4064 PROB is the probability of jumping to LABEL. */
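/* Example use (illustrative): to branch to LABEL when A >= B as
   unsigned SImode values, a caller might write

       emit_cmp_and_jump_insns (a, b, GE, NULL_RTX, SImode, 1, label,
                                profile_probability::even ());

   with UNSIGNEDP == 1 turning GE into GEU before the jump is emitted.  */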
4066 void
4067 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4068 machine_mode mode, int unsignedp, rtx label,
4069 profile_probability prob)
4071 rtx op0 = x, op1 = y;
4072 rtx test;
4074 /* Swap operands and condition to ensure canonical RTL. */
4075 if (swap_commutative_operands_p (x, y)
4076 && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4078 op0 = y, op1 = x;
4079 comparison = swap_condition (comparison);
4082 /* If OP0 is still a constant, then both X and Y must be constants
4083 or the opposite comparison is not supported. Force X into a register
4084 to create canonical RTL. */
4085 if (CONSTANT_P (op0))
4086 op0 = force_reg (mode, op0);
4088 if (unsignedp)
4089 comparison = unsigned_condition (comparison);
4091 prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4092 &test, &mode);
4093 emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4097 /* Emit a library call comparison between floating point X and Y.
4098 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.). */
4100 static void
4101 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4102 rtx *ptest, machine_mode *pmode)
4104 enum rtx_code swapped = swap_condition (comparison);
4105 enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4106 machine_mode orig_mode = GET_MODE (x);
4107 machine_mode mode;
4108 rtx true_rtx, false_rtx;
4109 rtx value, target, equiv;
4110 rtx_insn *insns;
4111 rtx libfunc = 0;
4112 bool reversed_p = false;
4113 scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4115 FOR_EACH_MODE_FROM (mode, orig_mode)
4117 if (code_to_optab (comparison)
4118 && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4119 break;
4121 if (code_to_optab (swapped)
4122 && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4124 std::swap (x, y);
4125 comparison = swapped;
4126 break;
4129 if (code_to_optab (reversed)
4130 && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4132 comparison = reversed;
4133 reversed_p = true;
4134 break;
4138 gcc_assert (mode != VOIDmode);
4140 if (mode != orig_mode)
4142 x = convert_to_mode (mode, x, 0);
4143 y = convert_to_mode (mode, y, 0);
4146 /* Attach a REG_EQUAL note describing the semantics of the libcall to
4147 the RTL. This allows the RTL optimizers to delete the libcall if the
4148 condition can be determined at compile-time. */
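/* E.g. (illustrative): for "x > y" expanded through __gtdf2, EQUIV is
   roughly (if_then_else (gt x y) (const_int 1) (const_int 0)), so if
   X and Y later fold to constants the libcall can be deleted.  */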
4149 if (comparison == UNORDERED
4150 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4152 true_rtx = const_true_rtx;
4153 false_rtx = const0_rtx;
4155 else
4157 switch (comparison)
4159 case EQ:
4160 true_rtx = const0_rtx;
4161 false_rtx = const_true_rtx;
4162 break;
4164 case NE:
4165 true_rtx = const_true_rtx;
4166 false_rtx = const0_rtx;
4167 break;
4169 case GT:
4170 true_rtx = const1_rtx;
4171 false_rtx = const0_rtx;
4172 break;
4174 case GE:
4175 true_rtx = const0_rtx;
4176 false_rtx = constm1_rtx;
4177 break;
4179 case LT:
4180 true_rtx = constm1_rtx;
4181 false_rtx = const0_rtx;
4182 break;
4184 case LE:
4185 true_rtx = const0_rtx;
4186 false_rtx = const1_rtx;
4187 break;
4189 default:
4190 gcc_unreachable ();
4194 if (comparison == UNORDERED)
4196 rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4197 equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4198 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4199 temp, const_true_rtx, equiv);
4201 else
4203 equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4204 if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4205 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4206 equiv, true_rtx, false_rtx);
4209 start_sequence ();
4210 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4211 cmp_mode, x, mode, y, mode);
4212 insns = get_insns ();
4213 end_sequence ();
4215 target = gen_reg_rtx (cmp_mode);
4216 emit_libcall_block (insns, target, value, equiv);
4218 if (comparison == UNORDERED
4219 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4220 || reversed_p)
4221 *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4222 else
4223 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4225 *pmode = cmp_mode;
4228 /* Generate code to indirectly jump to a location given in the rtx LOC. */
4230 void
4231 emit_indirect_jump (rtx loc)
4233 if (!targetm.have_indirect_jump ())
4234 sorry ("indirect jumps are not available on this target");
4235 else
4237 struct expand_operand ops[1];
4238 create_address_operand (&ops[0], loc);
4239 expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4240 emit_barrier ();
4245 /* Emit a conditional move instruction if the machine supports one for that
4246 condition and machine mode.
4248 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4249 the mode to use should they be constants. If it is VOIDmode, they cannot
4250 both be constants.
4252 OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4253 should be stored there. MODE is the mode to use should they be constants.
4254 If it is VOIDmode, they cannot both be constants.
4256 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4257 is not supported. */
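/* Example use (illustrative): to expand "r = a < b ? c : d" in SImode
   a caller might write

       emit_conditional_move (r, LT, a, b, SImode, c, d, SImode, 0);

   which succeeds only when a movsicc pattern exists, and returns
   NULL_RTX otherwise so the caller can fall back to a branch.  */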
4260 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4261 machine_mode cmode, rtx op2, rtx op3,
4262 machine_mode mode, int unsignedp)
4264 rtx comparison;
4265 rtx_insn *last;
4266 enum insn_code icode;
4267 enum rtx_code reversed;
4269 /* If the two source operands are identical, that's just a move. */
4271 if (rtx_equal_p (op2, op3))
4273 if (!target)
4274 target = gen_reg_rtx (mode);
4276 emit_move_insn (target, op3);
4277 return target;
4280 /* If one operand is constant, make it the second one. Only do this
4281 if the other operand is not constant as well. */
4283 if (swap_commutative_operands_p (op0, op1))
4285 std::swap (op0, op1);
4286 code = swap_condition (code);
4289 /* get_condition will prefer to generate LT and GT even if the old
4290 comparison was against zero, so undo that canonicalization here since
4291 comparisons against zero are cheaper. */
4292 if (code == LT && op1 == const1_rtx)
4293 code = LE, op1 = const0_rtx;
4294 else if (code == GT && op1 == constm1_rtx)
4295 code = GE, op1 = const0_rtx;
4297 if (cmode == VOIDmode)
4298 cmode = GET_MODE (op0);
4300 enum rtx_code orig_code = code;
4301 bool swapped = false;
4302 if (swap_commutative_operands_p (op2, op3)
4303 && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4304 != UNKNOWN))
4306 std::swap (op2, op3);
4307 code = reversed;
4308 swapped = true;
4311 if (mode == VOIDmode)
4312 mode = GET_MODE (op2);
4314 icode = direct_optab_handler (movcc_optab, mode);
4316 if (icode == CODE_FOR_nothing)
4317 return NULL_RTX;
4319 if (!target)
4320 target = gen_reg_rtx (mode);
4322 for (int pass = 0; ; pass++)
4324 code = unsignedp ? unsigned_condition (code) : code;
4325 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4327 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4328 punt and let the caller figure out how best to deal with this
4329 situation. */
4330 if (COMPARISON_P (comparison))
4332 saved_pending_stack_adjust save;
4333 save_pending_stack_adjust (&save);
4334 last = get_last_insn ();
4335 do_pending_stack_adjust ();
4336 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4337 GET_CODE (comparison), NULL_RTX, unsignedp,
4338 OPTAB_WIDEN, &comparison, &cmode);
4339 if (comparison)
4341 struct expand_operand ops[4];
4343 create_output_operand (&ops[0], target, mode);
4344 create_fixed_operand (&ops[1], comparison);
4345 create_input_operand (&ops[2], op2, mode);
4346 create_input_operand (&ops[3], op3, mode);
4347 if (maybe_expand_insn (icode, 4, ops))
4349 if (ops[0].value != target)
4350 convert_move (target, ops[0].value, false);
4351 return target;
4354 delete_insns_since (last);
4355 restore_pending_stack_adjust (&save);
4358 if (pass == 1)
4359 return NULL_RTX;
4361 /* If the preferred op2/op3 order is not usable, retry with other
4362 operand order, perhaps it will expand successfully. */
4363 if (swapped)
4364 code = orig_code;
4365 else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4366 NULL))
4367 != UNKNOWN)
4368 code = reversed;
4369 else
4370 return NULL_RTX;
4371 std::swap (op2, op3);
4376 /* Emit a conditional negate or bitwise complement using the
4377 negcc or notcc optabs if available. Return NULL_RTX if such operations
4378 are not available. Otherwise return the RTX holding the result.
4379 TARGET is the desired destination of the result. COND is the comparison
4380 on which to negate. If COND is true, move into TARGET the negation
4381 or bitwise complement of OP1. Otherwise move OP2 into TARGET.
4382 CODE is either NEG or NOT. MODE is the machine mode in which the
4383 operation is performed. */
4386 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4387 machine_mode mode, rtx cond, rtx op1,
4388 rtx op2)
4390 optab op = unknown_optab;
4391 if (code == NEG)
4392 op = negcc_optab;
4393 else if (code == NOT)
4394 op = notcc_optab;
4395 else
4396 gcc_unreachable ();
4398 insn_code icode = direct_optab_handler (op, mode);
4400 if (icode == CODE_FOR_nothing)
4401 return NULL_RTX;
4403 if (!target)
4404 target = gen_reg_rtx (mode);
4406 rtx_insn *last = get_last_insn ();
4407 struct expand_operand ops[4];
4409 create_output_operand (&ops[0], target, mode);
4410 create_fixed_operand (&ops[1], cond);
4411 create_input_operand (&ops[2], op1, mode);
4412 create_input_operand (&ops[3], op2, mode);
4414 if (maybe_expand_insn (icode, 4, ops))
4416 if (ops[0].value != target)
4417 convert_move (target, ops[0].value, false);
4419 return target;
4421 delete_insns_since (last);
4422 return NULL_RTX;
4425 /* Emit a conditional addition instruction if the machine supports one for that
4426 condition and machine mode.
4428 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4429 the mode to use should they be constants. If it is VOIDmode, they cannot
4430 both be constants.
4432 OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4433 should be stored there. MODE is the mode to use should they be constants.
4434 If it is VOIDmode, they cannot both be constants.
4436 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4437 is not supported. */
4440 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4441 machine_mode cmode, rtx op2, rtx op3,
4442 machine_mode mode, int unsignedp)
4444 rtx comparison;
4445 rtx_insn *last;
4446 enum insn_code icode;
4448 /* If one operand is constant, make it the second one. Only do this
4449 if the other operand is not constant as well. */
4451 if (swap_commutative_operands_p (op0, op1))
4453 std::swap (op0, op1);
4454 code = swap_condition (code);
4457 /* get_condition will prefer to generate LT and GT even if the old
4458 comparison was against zero, so undo that canonicalization here since
4459 comparisons against zero are cheaper. */
4460 if (code == LT && op1 == const1_rtx)
4461 code = LE, op1 = const0_rtx;
4462 else if (code == GT && op1 == constm1_rtx)
4463 code = GE, op1 = const0_rtx;
4465 if (cmode == VOIDmode)
4466 cmode = GET_MODE (op0);
4468 if (mode == VOIDmode)
4469 mode = GET_MODE (op2);
4471 icode = optab_handler (addcc_optab, mode);
4473 if (icode == CODE_FOR_nothing)
4474 return 0;
4476 if (!target)
4477 target = gen_reg_rtx (mode);
4479 code = unsignedp ? unsigned_condition (code) : code;
4480 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4482 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4483 return NULL and let the caller figure out how best to deal with this
4484 situation. */
4485 if (!COMPARISON_P (comparison))
4486 return NULL_RTX;
4488 do_pending_stack_adjust ();
4489 last = get_last_insn ();
4490 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4491 GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4492 &comparison, &cmode);
4493 if (comparison)
4495 struct expand_operand ops[4];
4497 create_output_operand (&ops[0], target, mode);
4498 create_fixed_operand (&ops[1], comparison);
4499 create_input_operand (&ops[2], op2, mode);
4500 create_input_operand (&ops[3], op3, mode);
4501 if (maybe_expand_insn (icode, 4, ops))
4503 if (ops[0].value != target)
4504 convert_move (target, ops[0].value, false);
4505 return target;
4508 delete_insns_since (last);
4509 return NULL_RTX;
4512 /* These functions attempt to generate an insn body, rather than
4513 emitting the insn, but if the gen function already emits them, we
4514 make no attempt to turn them back into naked patterns. */
4516 /* Generate and return an insn body to add Y to X. */
4518 rtx_insn *
4519 gen_add2_insn (rtx x, rtx y)
4521 enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4523 gcc_assert (insn_operand_matches (icode, 0, x));
4524 gcc_assert (insn_operand_matches (icode, 1, x));
4525 gcc_assert (insn_operand_matches (icode, 2, y));
4527 return GEN_FCN (icode) (x, x, y);
4530 /* Generate and return an insn body to add r1 and c,
4531 storing the result in r0. */
4533 rtx_insn *
4534 gen_add3_insn (rtx r0, rtx r1, rtx c)
4536 enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4538 if (icode == CODE_FOR_nothing
4539 || !insn_operand_matches (icode, 0, r0)
4540 || !insn_operand_matches (icode, 1, r1)
4541 || !insn_operand_matches (icode, 2, c))
4542 return NULL;
4544 return GEN_FCN (icode) (r0, r1, c);
4548 have_add2_insn (rtx x, rtx y)
4550 enum insn_code icode;
4552 gcc_assert (GET_MODE (x) != VOIDmode);
4554 icode = optab_handler (add_optab, GET_MODE (x));
4556 if (icode == CODE_FOR_nothing)
4557 return 0;
4559 if (!insn_operand_matches (icode, 0, x)
4560 || !insn_operand_matches (icode, 1, x)
4561 || !insn_operand_matches (icode, 2, y))
4562 return 0;
4564 return 1;
4567 /* Generate and return an insn body to add Y and Z, storing the result in X. */
4569 rtx_insn *
4570 gen_addptr3_insn (rtx x, rtx y, rtx z)
4572 enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4574 gcc_assert (insn_operand_matches (icode, 0, x));
4575 gcc_assert (insn_operand_matches (icode, 1, y));
4576 gcc_assert (insn_operand_matches (icode, 2, z));
4578 return GEN_FCN (icode) (x, y, z);
4581 /* Return true if the target implements an addptr pattern and X, Y,
4582 and Z are valid for the pattern predicates. */
4585 have_addptr3_insn (rtx x, rtx y, rtx z)
4587 enum insn_code icode;
4589 gcc_assert (GET_MODE (x) != VOIDmode);
4591 icode = optab_handler (addptr3_optab, GET_MODE (x));
4593 if (icode == CODE_FOR_nothing)
4594 return 0;
4596 if (!insn_operand_matches (icode, 0, x)
4597 || !insn_operand_matches (icode, 1, y)
4598 || !insn_operand_matches (icode, 2, z))
4599 return 0;
4601 return 1;
4604 /* Generate and return an insn body to subtract Y from X. */
4606 rtx_insn *
4607 gen_sub2_insn (rtx x, rtx y)
4609 enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4611 gcc_assert (insn_operand_matches (icode, 0, x));
4612 gcc_assert (insn_operand_matches (icode, 1, x));
4613 gcc_assert (insn_operand_matches (icode, 2, y));
4615 return GEN_FCN (icode) (x, x, y);
4618 /* Generate and return an insn body to subtract c from r1,
4619 storing the result in r0. */
4621 rtx_insn *
4622 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4624 enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4626 if (icode == CODE_FOR_nothing
4627 || !insn_operand_matches (icode, 0, r0)
4628 || !insn_operand_matches (icode, 1, r1)
4629 || !insn_operand_matches (icode, 2, c))
4630 return NULL;
4632 return GEN_FCN (icode) (r0, r1, c);
4636 have_sub2_insn (rtx x, rtx y)
4638 enum insn_code icode;
4640 gcc_assert (GET_MODE (x) != VOIDmode);
4642 icode = optab_handler (sub_optab, GET_MODE (x));
4644 if (icode == CODE_FOR_nothing)
4645 return 0;
4647 if (!insn_operand_matches (icode, 0, x)
4648 || !insn_operand_matches (icode, 1, x)
4649 || !insn_operand_matches (icode, 2, y))
4650 return 0;
4652 return 1;
4655 /* Generate the body of an insn to extend Y (with mode MFROM)
4656 into X (with mode MTO). Do zero-extension if UNSIGNEDP is nonzero. */
4658 rtx_insn *
4659 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4660 machine_mode mfrom, int unsignedp)
4662 enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4663 return GEN_FCN (icode) (x, y);
4666 /* Generate code to convert FROM to floating point
4667 and store in TO. FROM must be fixed point and not VOIDmode.
4668 UNSIGNEDP nonzero means regard FROM as unsigned.
4669 Normally this is done by correcting the final value
4670 if it is negative. */
4672 void
4673 expand_float (rtx to, rtx from, int unsignedp)
4675 enum insn_code icode;
4676 rtx target = to;
4677 scalar_mode from_mode, to_mode;
4678 machine_mode fmode, imode;
4679 bool can_do_signed = false;
4681 /* Crash now, because we won't be able to decide which mode to use. */
4682 gcc_assert (GET_MODE (from) != VOIDmode);
4684 /* Look for an insn to do the conversion. Do it in the specified
4685 modes if possible; otherwise convert either input, output or both to
4686 wider mode. If the integer mode is wider than the mode of FROM,
4687 we can do the conversion signed even if the input is unsigned. */
4689 FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4690 FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4692 int doing_unsigned = unsignedp;
4694 if (fmode != GET_MODE (to)
4695 && (significand_size (fmode)
4696 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
4697 continue;
4699 icode = can_float_p (fmode, imode, unsignedp);
4700 if (icode == CODE_FOR_nothing && unsignedp)
4702 enum insn_code scode = can_float_p (fmode, imode, 0);
4703 if (scode != CODE_FOR_nothing)
4704 can_do_signed = true;
4705 if (imode != GET_MODE (from))
4706 icode = scode, doing_unsigned = 0;
4709 if (icode != CODE_FOR_nothing)
4711 if (imode != GET_MODE (from))
4712 from = convert_to_mode (imode, from, unsignedp);
4714 if (fmode != GET_MODE (to))
4715 target = gen_reg_rtx (fmode);
4717 emit_unop_insn (icode, target, from,
4718 doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4720 if (target != to)
4721 convert_move (to, target, 0);
4722 return;
4726 /* Unsigned integer, and no way to convert directly. Convert as signed,
4727 then unconditionally adjust the result. */
4728 if (unsignedp
4729 && can_do_signed
4730 && is_a <scalar_mode> (GET_MODE (to), &to_mode)
4731 && is_a <scalar_mode> (GET_MODE (from), &from_mode))
4733 opt_scalar_mode fmode_iter;
4734 rtx_code_label *label = gen_label_rtx ();
4735 rtx temp;
4736 REAL_VALUE_TYPE offset;
4738 /* Look for a usable floating mode FMODE wider than the source and at
4739 least as wide as the target. Using FMODE will avoid rounding woes
4740 with unsigned values greater than the signed maximum value. */
4742 FOR_EACH_MODE_FROM (fmode_iter, to_mode)
4744 scalar_mode fmode = fmode_iter.require ();
4745 if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
4746 && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
4747 break;
4750 if (!fmode_iter.exists (&fmode))
4752 /* There is no such mode. Pretend the target is wide enough. */
4753 fmode = to_mode;
4755 /* Avoid double-rounding when TO is narrower than FROM. */
4756 if ((significand_size (fmode) + 1)
4757 < GET_MODE_PRECISION (from_mode))
4759 rtx temp1;
4760 rtx_code_label *neglabel = gen_label_rtx ();
4762 /* Don't use TARGET if it isn't a register, is a hard register,
4763 or is the wrong mode. */
4764 if (!REG_P (target)
4765 || REGNO (target) < FIRST_PSEUDO_REGISTER
4766 || GET_MODE (target) != fmode)
4767 target = gen_reg_rtx (fmode);
4769 imode = from_mode;
4770 do_pending_stack_adjust ();
4772 /* Test whether the sign bit is set. */
4773 emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4774 0, neglabel);
4776 /* The sign bit is not set. Convert as signed. */
4777 expand_float (target, from, 0);
4778 emit_jump_insn (targetm.gen_jump (label));
4779 emit_barrier ();
4781 /* The sign bit is set.
4782 Convert to a usable (positive signed) value by shifting right
4783 one bit, while remembering if a nonzero bit was shifted
4784 out; i.e., compute (from & 1) | (from >> 1). */
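/* Numeric sketch (illustrative): for from = 0xffffffff in SImode,
   (from & 1) | (from >> 1) = 0x7fffffff, which is positive as a
   signed value; converting that and doubling yields the same result
   as a direct unsigned conversion would, because the or'ed-in low
   bit acts as a sticky bit for rounding.  */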
4786 emit_label (neglabel);
4787 temp = expand_binop (imode, and_optab, from, const1_rtx,
4788 NULL_RTX, 1, OPTAB_LIB_WIDEN);
4789 temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4790 temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4791 OPTAB_LIB_WIDEN);
4792 expand_float (target, temp, 0);
4794 /* Multiply by 2 to undo the shift above. */
4795 temp = expand_binop (fmode, add_optab, target, target,
4796 target, 0, OPTAB_LIB_WIDEN);
4797 if (temp != target)
4798 emit_move_insn (target, temp);
4800 do_pending_stack_adjust ();
4801 emit_label (label);
4802 goto done;
4806 /* If we are about to do some arithmetic to correct for an
4807 unsigned operand, do it in a pseudo-register. */
4809 if (to_mode != fmode
4810 || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4811 target = gen_reg_rtx (fmode);
4813 /* Convert as signed integer to floating. */
4814 expand_float (target, from, 0);
4816 /* If FROM is negative (and therefore TO is negative),
4817 correct its value by 2**bitwidth. */
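/* E.g. (illustrative): 32-bit 0xffffffff converts as signed to -1.0;
   adding 2**32 yields 4294967295.0, the desired unsigned value.  */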
4819 do_pending_stack_adjust ();
4820 emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
4821 0, label);
4824 real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
4825 temp = expand_binop (fmode, add_optab, target,
4826 const_double_from_real_value (offset, fmode),
4827 target, 0, OPTAB_LIB_WIDEN);
4828 if (temp != target)
4829 emit_move_insn (target, temp);
4831 do_pending_stack_adjust ();
4832 emit_label (label);
4833 goto done;
4836 /* No hardware instruction available; call a library routine. */
4838 rtx libfunc;
4839 rtx_insn *insns;
4840 rtx value;
4841 convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4843 if (is_narrower_int_mode (GET_MODE (from), SImode))
4844 from = convert_to_mode (SImode, from, unsignedp);
4846 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4847 gcc_assert (libfunc);
4849 start_sequence ();
4851 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4852 GET_MODE (to), from, GET_MODE (from));
4853 insns = get_insns ();
4854 end_sequence ();
4856 emit_libcall_block (insns, target, value,
4857 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4858 GET_MODE (to), from));
4861 done:
4863 /* Copy result to requested destination
4864 if we have been computing in a temp location. */
4866 if (target != to)
4868 if (GET_MODE (target) == GET_MODE (to))
4869 emit_move_insn (to, target);
4870 else
4871 convert_move (to, target, 0);
4875 /* Generate code to convert FROM to fixed point and store in TO. FROM
4876 must be floating point. */
4878 void
4879 expand_fix (rtx to, rtx from, int unsignedp)
4881 enum insn_code icode;
4882 rtx target = to;
4883 machine_mode fmode, imode;
4884 opt_scalar_mode fmode_iter;
4885 bool must_trunc = false;
4887 /* We first try to find a pair of modes, one real and one integer, at
4888 least as wide as FROM and TO, respectively, in which we can open-code
4889 this conversion. If the integer mode is wider than the mode of TO,
4890 we can do the conversion either signed or unsigned. */
4892 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4893 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4895 int doing_unsigned = unsignedp;
4897 icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4898 if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4899 icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4901 if (icode != CODE_FOR_nothing)
4903 rtx_insn *last = get_last_insn ();
4904 if (fmode != GET_MODE (from))
4905 from = convert_to_mode (fmode, from, 0);
4907 if (must_trunc)
4909 rtx temp = gen_reg_rtx (GET_MODE (from));
4910 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4911 temp, 0);
4914 if (imode != GET_MODE (to))
4915 target = gen_reg_rtx (imode);
4917 if (maybe_emit_unop_insn (icode, target, from,
4918 doing_unsigned ? UNSIGNED_FIX : FIX))
4920 if (target != to)
4921 convert_move (to, target, unsignedp);
4922 return;
4924 delete_insns_since (last);
4928 /* For an unsigned conversion, there is one more way to do it.
4929 If we have a signed conversion, we generate code that compares
4930 the real value to the largest representable positive number. If it
4931 is smaller, the conversion is done normally. Otherwise, subtract
4932 one plus the highest signed number, convert, and add it back.
4934 We only need to check all real modes, since we know we didn't find
4935 anything with a wider integer mode.
4937 This code used to extend the FP value into a mode wider than the destination.
4938 This is needed for decimal float modes which cannot accurately
4939 represent one plus the highest signed number of the same size, but
4940 not for binary modes. Consider, for instance conversion from SFmode
4941 into DImode.
4943 The hot path through the code is dealing with inputs smaller than 2^63
4944 and doing just the conversion, so there are no bits to lose.
4946 In the other path we know the value is positive in the range 2^63..2^64-1
4947 inclusive (for any other input, overflow happens and the result is undefined).
4948 So we know that the most significant bit set in the mantissa corresponds to
4949 2^63. The subtraction of 2^63 should not generate any rounding as it
4950 simply clears out that bit. The rest is trivial. */
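/* Numeric sketch (illustrative) for DFmode -> DImode: for x in
   [2^63, 2^64), compute t = (int64_t) (x - 0x1p63) and then
   t ^ 0x8000000000000000, which sets bit 63 back and so produces
   x as an unsigned 64-bit value; XOR is used because, unlike an
   add, it cannot overflow the signed type.  */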
4952 scalar_int_mode to_mode;
4953 if (unsignedp
4954 && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
4955 && HWI_COMPUTABLE_MODE_P (to_mode))
4956 FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
4958 scalar_mode fmode = fmode_iter.require ();
4959 if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
4960 0, &must_trunc)
4961 && (!DECIMAL_FLOAT_MODE_P (fmode)
4962 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
4964 int bitsize;
4965 REAL_VALUE_TYPE offset;
4966 rtx limit;
4967 rtx_code_label *lab1, *lab2;
4968 rtx_insn *insn;
4970 bitsize = GET_MODE_PRECISION (to_mode);
4971 real_2expN (&offset, bitsize - 1, fmode);
4972 limit = const_double_from_real_value (offset, fmode);
4973 lab1 = gen_label_rtx ();
4974 lab2 = gen_label_rtx ();
4976 if (fmode != GET_MODE (from))
4977 from = convert_to_mode (fmode, from, 0);
4979 /* See if we need to do the subtraction. */
4980 do_pending_stack_adjust ();
4981 emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
4982 GET_MODE (from), 0, lab1);
4984 /* If not, do the signed "fix" and branch around fixup code. */
4985 expand_fix (to, from, 0);
4986 emit_jump_insn (targetm.gen_jump (lab2));
4987 emit_barrier ();
4989 /* Otherwise, subtract 2**(N-1), convert to signed number,
4990 then add 2**(N-1). Do the addition using XOR since this
4991 will often generate better code. */
4992 emit_label (lab1);
4993 target = expand_binop (GET_MODE (from), sub_optab, from, limit,
4994 NULL_RTX, 0, OPTAB_LIB_WIDEN);
4995 expand_fix (to, target, 0);
4996 target = expand_binop (to_mode, xor_optab, to,
4997 gen_int_mode
4998 (HOST_WIDE_INT_1 << (bitsize - 1),
4999 to_mode),
5000 to, 1, OPTAB_LIB_WIDEN);
5002 if (target != to)
5003 emit_move_insn (to, target);
5005 emit_label (lab2);
5007 if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5009 /* Make a place for a REG_NOTE and add it. */
5010 insn = emit_move_insn (to, to);
5011 set_dst_reg_note (insn, REG_EQUAL,
5012 gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5013 copy_rtx (from)),
5014 to);
5017 return;
5021 /* We can't do it with an insn, so use a library call. But first ensure
5022 that the mode of TO is at least as wide as SImode, since those are the
5023 only library calls we know about. */
5025 if (is_narrower_int_mode (GET_MODE (to), SImode))
5027 target = gen_reg_rtx (SImode);
5029 expand_fix (target, from, unsignedp);
5031 else
5033 rtx_insn *insns;
5034 rtx value;
5035 rtx libfunc;
5037 convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5038 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5039 gcc_assert (libfunc);
5041 start_sequence ();
5043 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5044 GET_MODE (to), from, GET_MODE (from));
5045 insns = get_insns ();
5046 end_sequence ();
5048 emit_libcall_block (insns, target, value,
5049 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5050 GET_MODE (to), from));
5053 if (target != to)
5055 if (GET_MODE (to) == GET_MODE (target))
5056 emit_move_insn (to, target);
5057 else
5058 convert_move (to, target, 0);
5063 /* Promote integer arguments for a libcall if necessary.
5064 emit_library_call_value cannot do the promotion because it does not
5065 know if it should do a signed or unsigned promotion. This is because
5066 there are no tree types defined for libcalls. */
5068 static rtx
5069 prepare_libcall_arg (rtx arg, int uintp)
5071 scalar_int_mode mode;
5072 machine_mode arg_mode;
5073 if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5075 /* If we need to promote the integer function argument we need to do
5076 it here instead of inside emit_library_call_value because in
5077 emit_library_call_value we don't know if we should do a signed or
5078 unsigned promotion. */
5080 int unsigned_p = 0;
5081 arg_mode = promote_function_mode (NULL_TREE, mode,
5082 &unsigned_p, NULL_TREE, 0);
5083 if (arg_mode != mode)
5084 return convert_to_mode (arg_mode, arg, uintp);
5086 return arg;
5089 /* Generate code to convert FROM to TO, where at least one of them is fixed-point.
5090 If UINTP is true, either TO or FROM is an unsigned integer.
5091 If SATP is true, we need to saturate the result. */
5093 void
5094 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5096 machine_mode to_mode = GET_MODE (to);
5097 machine_mode from_mode = GET_MODE (from);
5098 convert_optab tab;
5099 enum rtx_code this_code;
5100 enum insn_code code;
5101 rtx_insn *insns;
5102 rtx value;
5103 rtx libfunc;
5105 if (to_mode == from_mode)
5107 emit_move_insn (to, from);
5108 return;
5111 if (uintp)
5113 tab = satp ? satfractuns_optab : fractuns_optab;
5114 this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5116 else
5118 tab = satp ? satfract_optab : fract_optab;
5119 this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5121 code = convert_optab_handler (tab, to_mode, from_mode);
5122 if (code != CODE_FOR_nothing)
5124 emit_unop_insn (code, to, from, this_code);
5125 return;
5128 libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5129 gcc_assert (libfunc);
5131 from = prepare_libcall_arg (from, uintp);
5132 from_mode = GET_MODE (from);
5134 start_sequence ();
5135 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5136 from, from_mode);
5137 insns = get_insns ();
5138 end_sequence ();
5140 emit_libcall_block (insns, to, value,
5141 gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5144 /* Generate code to convert FROM to fixed point and store in TO. FROM
5145 must be floating point, TO must be signed. Use the conversion optab
5146 TAB to do the conversion. */
5148 bool
5149 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5151 enum insn_code icode;
5152 rtx target = to;
5153 machine_mode fmode, imode;
5155 /* We first try to find a pair of modes, one real and one integer, at
5156 least as wide as FROM and TO, respectively, in which we can open-code
5157 this conversion. If the integer mode is wider than the mode of TO,
5158 we can do the conversion either signed or unsigned. */
5160 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5161 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5163 icode = convert_optab_handler (tab, imode, fmode);
5164 if (icode != CODE_FOR_nothing)
5166 rtx_insn *last = get_last_insn ();
5167 if (fmode != GET_MODE (from))
5168 from = convert_to_mode (fmode, from, 0);
5170 if (imode != GET_MODE (to))
5171 target = gen_reg_rtx (imode);
5173 if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5175 delete_insns_since (last);
5176 continue;
5178 if (target != to)
5179 convert_move (to, target, 0);
5180 return true;
5184 return false;
5187 /* Report whether we have an instruction to perform the operation
5188 specified by CODE on operands of mode MODE. */
5190 have_insn_for (enum rtx_code code, machine_mode mode)
5192 return (code_to_optab (code)
5193 && (optab_handler (code_to_optab (code), mode)
5194 != CODE_FOR_nothing));
5197 /* Print information about the current contents of the optabs on
5198 STDERR. */
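/* Typical lines of output (illustrative):

       plus SF: __addsf3
       fix SI DF: __fixdfsi

   i.e. rtx code name, mode name(s), then the libfunc symbol.  */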
5200 DEBUG_FUNCTION void
5201 debug_optab_libfuncs (void)
5203 int i, j, k;
5205 /* Dump the arithmetic optabs. */
5206 for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5207 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5209 rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5210 if (l)
5212 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5213 fprintf (stderr, "%s\t%s:\t%s\n",
5214 GET_RTX_NAME (optab_to_code ((optab) i)),
5215 GET_MODE_NAME (j),
5216 XSTR (l, 0));
5220 /* Dump the conversion optabs. */
5221 for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5222 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5223 for (k = 0; k < NUM_MACHINE_MODES; ++k)
5225 rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5226 (machine_mode) k);
5227 if (l)
5229 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5230 fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5231 GET_RTX_NAME (optab_to_code ((optab) i)),
5232 GET_MODE_NAME (j),
5233 GET_MODE_NAME (k),
5234 XSTR (l, 0));
5239 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5240 CODE. Return 0 on failure. */
5242 rtx_insn *
5243 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5245 machine_mode mode = GET_MODE (op1);
5246 enum insn_code icode;
5247 rtx_insn *insn;
5248 rtx trap_rtx;
5250 if (mode == VOIDmode)
5251 return 0;
5253 icode = optab_handler (ctrap_optab, mode);
5254 if (icode == CODE_FOR_nothing)
5255 return 0;
5257 /* Some targets only accept a zero trap code. */
5258 if (!insn_operand_matches (icode, 3, tcode))
5259 return 0;
5261 do_pending_stack_adjust ();
5262 start_sequence ();
5263 prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5264 &trap_rtx, &mode);
5265 if (!trap_rtx)
5266 insn = NULL;
5267 else
5268 insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5269 tcode);
5271 /* If that failed, then give up. */
5272 if (insn == 0)
5274 end_sequence ();
5275 return 0;
5278 emit_insn (insn);
5279 insn = get_insns ();
5280 end_sequence ();
5281 return insn;
5284 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5285 or unsigned operation code. */
5287 enum rtx_code
5288 get_rtx_code (enum tree_code tcode, bool unsignedp)
5290 enum rtx_code code;
5291 switch (tcode)
5293 case EQ_EXPR:
5294 code = EQ;
5295 break;
5296 case NE_EXPR:
5297 code = NE;
5298 break;
5299 case LT_EXPR:
5300 code = unsignedp ? LTU : LT;
5301 break;
5302 case LE_EXPR:
5303 code = unsignedp ? LEU : LE;
5304 break;
5305 case GT_EXPR:
5306 code = unsignedp ? GTU : GT;
5307 break;
5308 case GE_EXPR:
5309 code = unsignedp ? GEU : GE;
5310 break;
5312 case UNORDERED_EXPR:
5313 code = UNORDERED;
5314 break;
5315 case ORDERED_EXPR:
5316 code = ORDERED;
5317 break;
5318 case UNLT_EXPR:
5319 code = UNLT;
5320 break;
5321 case UNLE_EXPR:
5322 code = UNLE;
5323 break;
5324 case UNGT_EXPR:
5325 code = UNGT;
5326 break;
5327 case UNGE_EXPR:
5328 code = UNGE;
5329 break;
5330 case UNEQ_EXPR:
5331 code = UNEQ;
5332 break;
5333 case LTGT_EXPR:
5334 code = LTGT;
5335 break;
5337 case BIT_AND_EXPR:
5338 code = AND;
5339 break;
5341 case BIT_IOR_EXPR:
5342 code = IOR;
5343 break;
5345 default:
5346 gcc_unreachable ();
5348 return code;
5351 /* Return a comparison rtx of mode CMP_MODE for COND. Use UNSIGNEDP to
5352 select signed or unsigned operators. OPNO holds the index of the
5353 first comparison operand for insn ICODE. Do not generate the
5354 compare instruction itself. */
5356 static rtx
5357 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5358 tree t_op0, tree t_op1, bool unsignedp,
5359 enum insn_code icode, unsigned int opno)
5361 struct expand_operand ops[2];
5362 rtx rtx_op0, rtx_op1;
5363 machine_mode m0, m1;
5364 enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5366 gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5368 /* Expand operands. For vector types with scalar modes, e.g. where int64x1_t
5369 has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5370 cases, use the original mode. */
5371 rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5372 EXPAND_STACK_PARM);
5373 m0 = GET_MODE (rtx_op0);
5374 if (m0 == VOIDmode)
5375 m0 = TYPE_MODE (TREE_TYPE (t_op0));
5377 rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5378 EXPAND_STACK_PARM);
5379 m1 = GET_MODE (rtx_op1);
5380 if (m1 == VOIDmode)
5381 m1 = TYPE_MODE (TREE_TYPE (t_op1));
5383 create_input_operand (&ops[0], rtx_op0, m0);
5384 create_input_operand (&ops[1], rtx_op1, m1);
5385 if (!maybe_legitimize_operands (icode, opno, 2, ops))
5386 gcc_unreachable ();
5387 return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5390 /* Checks if vec_perm mask SEL is a constant equivalent to a shift of the first
5391 vec_perm operand, assuming the second operand is a constant vector of zeroes.
5392 Return the shift distance in bits if so, or NULL_RTX if the vec_perm is not a
5393 shift. */
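/* E.g. (illustrative): on V4SImode, SEL = {1, 2, 3, 4} with an
   all-zero second operand selects elements 1..3 of the first vector
   followed by one zero, i.e. a vec_shr by 1 element = 32 bits.  */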
5394 static rtx
5395 shift_amt_for_vec_perm_mask (rtx sel)
5397 unsigned int i, first, nelt = GET_MODE_NUNITS (GET_MODE (sel));
5398 unsigned int bitsize = GET_MODE_UNIT_BITSIZE (GET_MODE (sel));
5400 if (GET_CODE (sel) != CONST_VECTOR)
5401 return NULL_RTX;
5403 first = INTVAL (CONST_VECTOR_ELT (sel, 0));
5404 if (first >= nelt)
5405 return NULL_RTX;
5406 for (i = 1; i < nelt; i++)
5408 int idx = INTVAL (CONST_VECTOR_ELT (sel, i));
5409 unsigned int expected = i + first;
5410 /* Indices into the second vector are all equivalent. */
5411 if (idx < 0 || (MIN (nelt, (unsigned) idx) != MIN (nelt, expected)))
5412 return NULL_RTX;
5415 return gen_int_shift_amount (GET_MODE (sel), first * bitsize);
5418 /* A subroutine of expand_vec_perm for expanding one vec_perm insn. */
5420 static rtx
5421 expand_vec_perm_1 (enum insn_code icode, rtx target,
5422 rtx v0, rtx v1, rtx sel)
5424 machine_mode tmode = GET_MODE (target);
5425 machine_mode smode = GET_MODE (sel);
5426 struct expand_operand ops[4];
5428 create_output_operand (&ops[0], target, tmode);
5429 create_input_operand (&ops[3], sel, smode);
5431 /* Make an effort to preserve v0 == v1. The target expander is able to
5432 rely on this to determine if we're permuting a single input operand. */
5433 if (rtx_equal_p (v0, v1))
5435 if (!insn_operand_matches (icode, 1, v0))
5436 v0 = force_reg (tmode, v0);
5437 gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5438 gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5440 create_fixed_operand (&ops[1], v0);
5441 create_fixed_operand (&ops[2], v0);
5443 else
5445 create_input_operand (&ops[1], v0, tmode);
5446 create_input_operand (&ops[2], v1, tmode);
5449 if (maybe_expand_insn (icode, 4, ops))
5450 return ops[0].value;
5451 return NULL_RTX;
5454 /* Generate instructions for vec_perm optab given its mode
5455 and three operands. */
5458 expand_vec_perm (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5460 enum insn_code icode;
5461 machine_mode qimode;
5462 unsigned int i, w, e, u;
5463 rtx tmp, sel_qi = NULL;
5464 rtvec vec;
5466 if (!target || GET_MODE (target) != mode)
5467 target = gen_reg_rtx (mode);
5469 w = GET_MODE_SIZE (mode);
5470 e = GET_MODE_NUNITS (mode);
5471 u = GET_MODE_UNIT_SIZE (mode);
5473 /* Set QIMODE to a different vector mode with byte elements.
5474 If no such mode, or if MODE already has byte elements, use VOIDmode. */
5475 if (GET_MODE_INNER (mode) == QImode
5476 || !mode_for_vector (QImode, w).exists (&qimode)
5477 || !VECTOR_MODE_P (qimode))
5478 qimode = VOIDmode;
5480 /* If the input is a constant, expand it specially. */
5481 gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
5482 if (GET_CODE (sel) == CONST_VECTOR)
5484 /* See if this can be handled with a vec_shr. We only do this if the
5485 second vector is all zeroes. */
5486 enum insn_code shift_code = optab_handler (vec_shr_optab, mode);
5487 enum insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5488 ? optab_handler (vec_shr_optab, qimode)
5489 : CODE_FOR_nothing);
5490 rtx shift_amt = NULL_RTX;
5491 if (v1 == CONST0_RTX (GET_MODE (v1))
5492 && (shift_code != CODE_FOR_nothing
5493 || shift_code_qi != CODE_FOR_nothing))
5495 shift_amt = shift_amt_for_vec_perm_mask (sel);
5496 if (shift_amt)
5498 struct expand_operand ops[3];
5499 if (shift_code != CODE_FOR_nothing)
5501 create_output_operand (&ops[0], target, mode);
5502 create_input_operand (&ops[1], v0, mode);
5503 create_convert_operand_from_type (&ops[2], shift_amt,
5504 sizetype);
5505 if (maybe_expand_insn (shift_code, 3, ops))
5506 return ops[0].value;
5508 if (shift_code_qi != CODE_FOR_nothing)
5510 tmp = gen_reg_rtx (qimode);
5511 create_output_operand (&ops[0], tmp, qimode);
5512 create_input_operand (&ops[1], gen_lowpart (qimode, v0),
5513 qimode);
5514 create_convert_operand_from_type (&ops[2], shift_amt,
5515 sizetype);
5516 if (maybe_expand_insn (shift_code_qi, 3, ops))
5517 return gen_lowpart (mode, ops[0].value);
5522 icode = direct_optab_handler (vec_perm_const_optab, mode);
5523 if (icode != CODE_FOR_nothing)
5525 tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5526 if (tmp)
5527 return tmp;
5530 /* Fall back to a constant byte-based permutation. */
5531 if (qimode != VOIDmode)
5533 vec = rtvec_alloc (w);
5534 for (i = 0; i < e; ++i)
5536 unsigned int j, this_e;
5538 this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
5539 this_e &= 2 * e - 1;
5540 this_e *= u;
5542 for (j = 0; j < u; ++j)
5543 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
5545 sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
5547 icode = direct_optab_handler (vec_perm_const_optab, qimode);
5548 if (icode != CODE_FOR_nothing)
5550 tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5551 tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5552 gen_lowpart (qimode, v1), sel_qi);
5553 if (tmp)
5554 return gen_lowpart (mode, tmp);
5559 /* Otherwise expand as a fully variable permutation. */
5560 icode = direct_optab_handler (vec_perm_optab, mode);
5561 if (icode != CODE_FOR_nothing)
5563 tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5564 if (tmp)
5565 return tmp;
5568 /* As a special case to aid several targets, lower the element-based
5569 permutation to a byte-based permutation and try again. */
5570 if (qimode == VOIDmode)
5571 return NULL_RTX;
5572 icode = direct_optab_handler (vec_perm_optab, qimode);
5573 if (icode == CODE_FOR_nothing)
5574 return NULL_RTX;
5576 if (sel_qi == NULL)
5578 /* Multiply each element by its byte size. */
5579 machine_mode selmode = GET_MODE (sel);
5580 if (u == 2)
5581 sel = expand_simple_binop (selmode, PLUS, sel, sel,
5582 NULL, 0, OPTAB_DIRECT);
5583 else
5584 sel = expand_simple_binop (selmode, ASHIFT, sel,
5585 gen_int_shift_amount (selmode,
5586 exact_log2 (u)),
5587 NULL, 0, OPTAB_DIRECT);
5588 gcc_assert (sel != NULL);
5590 /* Broadcast the low byte of each element into each of its bytes. */
5591 vec = rtvec_alloc (w);
5592 for (i = 0; i < w; ++i)
5594 int this_e = i / u * u;
5595 if (BYTES_BIG_ENDIAN)
5596 this_e += u - 1;
5597 RTVEC_ELT (vec, i) = GEN_INT (this_e);
5599 tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5600 sel = gen_lowpart (qimode, sel);
5601 sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
5602 gcc_assert (sel != NULL);
5604 /* Add the byte offset to each byte element. */
5605 /* Note that the definition of the indices here is memory ordering,
5606 so there should be no difference between big and little endian. */
5607 vec = rtvec_alloc (w);
5608 for (i = 0; i < w; ++i)
5609 RTVEC_ELT (vec, i) = GEN_INT (i % u);
5610 tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5611 sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5612 sel, 0, OPTAB_DIRECT);
5613 gcc_assert (sel_qi != NULL);
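/* Worked example (illustrative), V4SI lowered to V16QI on a
   little-endian target: selector {2,0,3,1} scales by u = 4 to
   {8,0,12,4}, broadcasts to {8,8,8,8, 0,0,0,0, 12,12,12,12, 4,4,4,4},
   and adding {0,1,2,3, 0,1,2,3, ...} gives the byte selector
   {8,9,10,11, 0,1,2,3, 12,13,14,15, 4,5,6,7}.  */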
5616 tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5617 tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5618 gen_lowpart (qimode, v1), sel_qi);
5619 if (tmp)
5620 tmp = gen_lowpart (mode, tmp);
5621 return tmp;
5624 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5625 three operands. */
5628 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5629 rtx target)
5631 struct expand_operand ops[4];
5632 machine_mode mode = TYPE_MODE (vec_cond_type);
5633 machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5634 enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5635 rtx mask, rtx_op1, rtx_op2;
5637 if (icode == CODE_FOR_nothing)
5638 return 0;
5640 mask = expand_normal (op0);
5641 rtx_op1 = expand_normal (op1);
5642 rtx_op2 = expand_normal (op2);
5644 mask = force_reg (mask_mode, mask);
5645 rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5647 create_output_operand (&ops[0], target, mode);
5648 create_input_operand (&ops[1], rtx_op1, mode);
5649 create_input_operand (&ops[2], rtx_op2, mode);
5650 create_input_operand (&ops[3], mask, mask_mode);
5651 expand_insn (icode, 4, ops);
5653 return ops[0].value;
5656 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5657 three operands. */
5659 rtx
5660 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5661 rtx target)
5663 struct expand_operand ops[6];
5664 enum insn_code icode;
5665 rtx comparison, rtx_op1, rtx_op2;
5666 machine_mode mode = TYPE_MODE (vec_cond_type);
5667 machine_mode cmp_op_mode;
5668 bool unsignedp;
5669 tree op0a, op0b;
5670 enum tree_code tcode;
5672 if (COMPARISON_CLASS_P (op0))
5674 op0a = TREE_OPERAND (op0, 0);
5675 op0b = TREE_OPERAND (op0, 1);
5676 tcode = TREE_CODE (op0);
5678 else
5680 gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5681 if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5682 != CODE_FOR_nothing)
5683 return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5684 op2, target);
5685 /* Fake op0 < 0. */
5686 else
5688 gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5689 == MODE_VECTOR_INT);
5690 op0a = op0;
5691 op0b = build_zero_cst (TREE_TYPE (op0));
5692 tcode = LT_EXPR;
5695 cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5696 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5699 gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
5700 && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
5702 icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5703 if (icode == CODE_FOR_nothing)
5705 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5706 icode = get_vcond_eq_icode (mode, cmp_op_mode);
5707 if (icode == CODE_FOR_nothing)
5708 return 0;
5711 comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5712 icode, 4);
5713 rtx_op1 = expand_normal (op1);
5714 rtx_op2 = expand_normal (op2);
5716 create_output_operand (&ops[0], target, mode);
5717 create_input_operand (&ops[1], rtx_op1, mode);
5718 create_input_operand (&ops[2], rtx_op2, mode);
5719 create_fixed_operand (&ops[3], comparison);
5720 create_fixed_operand (&ops[4], XEXP (comparison, 0));
5721 create_fixed_operand (&ops[5], XEXP (comparison, 1));
5722 expand_insn (icode, 6, ops);
5723 return ops[0].value;
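/* For reference, the expansion above implements the element-wise
   selection sketched below (scalar pseudo-code, not compiler internals):

       for (i = 0; i < nunits; ++i)
         result[i] = (op0a[i] CMP op0b[i]) ? op1[i] : op2[i];

   The faked "op0 < 0" comparison for a mask operand works because
   vector booleans carried in MODE_VECTOR_INT represent true lanes
   with the sign bit set (typically all-ones), so "lane < 0" recovers
   the mask.  */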
5726 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
5727 Use TARGET for the result if nonnull and convenient. */
5729 rtx
5730 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
5732 struct expand_operand ops[3];
5733 enum insn_code icode;
5734 machine_mode emode = GET_MODE_INNER (vmode);
5736 icode = direct_optab_handler (vec_series_optab, vmode);
5737 gcc_assert (icode != CODE_FOR_nothing);
5739 create_output_operand (&ops[0], target, vmode);
5740 create_input_operand (&ops[1], op0, emode);
5741 create_input_operand (&ops[2], op1, emode);
5743 expand_insn (icode, 3, ops);
5744 return ops[0].value;
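/* For reference, VEC_SERIES_EXPR <OP0, OP1> denotes the linear series

       result[i] = op0 + i * op1

   so, for example, VEC_SERIES_EXPR <3, 2> in V4SI is {3, 5, 7, 9}.  */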
5747 /* Generate insns for a vector comparison into a mask. */
5749 rtx
5750 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5752 struct expand_operand ops[4];
5753 enum insn_code icode;
5754 rtx comparison;
5755 machine_mode mask_mode = TYPE_MODE (type);
5756 machine_mode vmode;
5757 bool unsignedp;
5758 tree op0a, op0b;
5759 enum tree_code tcode;
5761 op0a = TREE_OPERAND (exp, 0);
5762 op0b = TREE_OPERAND (exp, 1);
5763 tcode = TREE_CODE (exp);
5765 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5766 vmode = TYPE_MODE (TREE_TYPE (op0a));
5768 icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5769 if (icode == CODE_FOR_nothing)
5771 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5772 icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5773 if (icode == CODE_FOR_nothing)
5774 return 0;
5777 comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5778 unsignedp, icode, 2);
5779 create_output_operand (&ops[0], target, mask_mode);
5780 create_fixed_operand (&ops[1], comparison);
5781 create_fixed_operand (&ops[2], XEXP (comparison, 0));
5782 create_fixed_operand (&ops[3], XEXP (comparison, 1));
5783 expand_insn (icode, 4, ops);
5784 return ops[0].value;
5787 /* Expand a highpart multiply. */
5789 rtx
5790 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5791 rtx target, bool uns_p)
5793 struct expand_operand eops[3];
5794 enum insn_code icode;
5795 int method, i, nunits;
5796 machine_mode wmode;
5797 rtx m1, m2, perm;
5798 optab tab1, tab2;
5799 rtvec v;
5801 method = can_mult_highpart_p (mode, uns_p);
5802 switch (method)
5804 case 0:
5805 return NULL_RTX;
5806 case 1:
5807 tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5808 return expand_binop (mode, tab1, op0, op1, target, uns_p,
5809 OPTAB_LIB_WIDEN);
5810 case 2:
5811 tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5812 tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5813 break;
5814 case 3:
5815 tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5816 tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5817 if (BYTES_BIG_ENDIAN)
5818 std::swap (tab1, tab2);
5819 break;
5820 default:
5821 gcc_unreachable ();
5824 icode = optab_handler (tab1, mode);
5825 nunits = GET_MODE_NUNITS (mode);
5826 wmode = insn_data[icode].operand[0].mode;
5827 gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
5828 gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
5830 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5831 create_input_operand (&eops[1], op0, mode);
5832 create_input_operand (&eops[2], op1, mode);
5833 expand_insn (icode, 3, eops);
5834 m1 = gen_lowpart (mode, eops[0].value);
5836 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5837 create_input_operand (&eops[1], op0, mode);
5838 create_input_operand (&eops[2], op1, mode);
5839 expand_insn (optab_handler (tab2, mode), 3, eops);
5840 m2 = gen_lowpart (mode, eops[0].value);
5842 v = rtvec_alloc (nunits);
5843 if (method == 2)
5845 for (i = 0; i < nunits; ++i)
5846 RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
5847 + ((i & 1) ? nunits : 0));
5848 perm = gen_rtx_CONST_VECTOR (mode, v);
5850 else
5852 int base = BYTES_BIG_ENDIAN ? 0 : 1;
5853 perm = gen_const_vec_series (mode, GEN_INT (base), GEN_INT (2));
5856 return expand_vec_perm (mode, m1, m2, perm, target);
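/* A worked example of the interleaving above (illustrative): for a
   little-endian V8HI multiply using method 2, TAB1 yields the four
   even-lane products and TAB2 the four odd-lane products, each as a
   32-bit value in V4SI.  Viewed through gen_lowpart as V8HI, the high
   half of wide product K sits in narrow lane 2*K + 1, so the selector
   built above is

       {1, 9, 3, 11, 5, 13, 7, 15}

   with indices 8..15 referring to M2.  Method 3 widens the low and
   high halves instead, and the {1, 3, 5, ...} series (on little
   endian) picks the high half of each wide product in order.  */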
5859 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5860 pattern. */
5862 static void
5863 find_cc_set (rtx x, const_rtx pat, void *data)
5865 if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5866 && GET_CODE (pat) == SET)
5868 rtx *p_cc_reg = (rtx *) data;
5869 gcc_assert (!*p_cc_reg);
5870 *p_cc_reg = x;
5874 /* This is a helper function for the other atomic operations. This function
5875 emits a loop that contains SEQ that iterates until a compare-and-swap
5876 operation at the end succeeds. MEM is the memory to be modified. SEQ is
5877 a set of instructions that takes a value from OLD_REG as an input and
5878 produces a value in NEW_REG as an output. Before SEQ, OLD_REG will be
5879 set to the current contents of MEM. After SEQ, a compare-and-swap will
5880 attempt to update MEM with NEW_REG. The function returns true when the
5881 loop was generated successfully. */
5883 static bool
5884 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5886 machine_mode mode = GET_MODE (mem);
5887 rtx_code_label *label;
5888 rtx cmp_reg, success, oldval;
5890 /* The loop we want to generate looks like
5892 cmp_reg = mem;
5893 label:
5894 old_reg = cmp_reg;
5895 seq;
5896 (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5897 if (!success)
5898 goto label;
5900 Note that we only do the plain load from memory once. Subsequent
5901 iterations use the value loaded by the compare-and-swap pattern. */
5903 label = gen_label_rtx ();
5904 cmp_reg = gen_reg_rtx (mode);
5906 emit_move_insn (cmp_reg, mem);
5907 emit_label (label);
5908 emit_move_insn (old_reg, cmp_reg);
5909 if (seq)
5910 emit_insn (seq);
5912 success = NULL_RTX;
5913 oldval = cmp_reg;
5914 if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
5915 new_reg, false, MEMMODEL_SYNC_SEQ_CST,
5916 MEMMODEL_RELAXED))
5917 return false;
5919 if (oldval != cmp_reg)
5920 emit_move_insn (cmp_reg, oldval);
5922 /* Mark this jump predicted not taken. */
5923 emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
5924 GET_MODE (success), 1, label,
5925 profile_probability::guessed_never ());
5926 return true;
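/* For reference, the emitted loop corresponds to this C-level sketch,
   where OP stands for the caller-supplied SEQ (illustrative only):

       oldval = *mem;
       do
         newval = OP (oldval);
       while (!compare_and_swap (mem, &oldval, newval));

   A failed compare-and-swap deposits the fresh contents of *mem in
   OLDVAL (via CMP_REG above), so each retry starts from the value
   that caused the failure rather than reloading.  */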
5930 /* This function tries to emit an atomic_exchange instruction. VAL is written
5931 to *MEM using memory model MODEL. The previous contents of *MEM are returned,
5932 using TARGET if possible. */
5934 static rtx
5935 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
5937 machine_mode mode = GET_MODE (mem);
5938 enum insn_code icode;
5940 /* If the target supports the exchange directly, great. */
5941 icode = direct_optab_handler (atomic_exchange_optab, mode);
5942 if (icode != CODE_FOR_nothing)
5944 struct expand_operand ops[4];
5946 create_output_operand (&ops[0], target, mode);
5947 create_fixed_operand (&ops[1], mem);
5948 create_input_operand (&ops[2], val, mode);
5949 create_integer_operand (&ops[3], model);
5950 if (maybe_expand_insn (icode, 4, ops))
5951 return ops[0].value;
5954 return NULL_RTX;
5957 /* This function tries to implement an atomic exchange operation using
5958 __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
5959 The previous contents of *MEM are returned, using TARGET if possible.
5960 Since this instruction is an acquire barrier only, stronger memory
5961 models may require additional barriers to be emitted. */
5963 static rtx
5964 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
5965 enum memmodel model)
5967 machine_mode mode = GET_MODE (mem);
5968 enum insn_code icode;
5969 rtx_insn *last_insn = get_last_insn ();
5971 icode = optab_handler (sync_lock_test_and_set_optab, mode);
5973 /* Legacy sync_lock_test_and_set is an acquire barrier. If the pattern
5974 exists, and the memory model is stronger than acquire, add a release
5975 barrier before the instruction. */
5977 if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
5978 expand_mem_thread_fence (model);
5980 if (icode != CODE_FOR_nothing)
5982 struct expand_operand ops[3];
5983 create_output_operand (&ops[0], target, mode);
5984 create_fixed_operand (&ops[1], mem);
5985 create_input_operand (&ops[2], val, mode);
5986 if (maybe_expand_insn (icode, 3, ops))
5987 return ops[0].value;
5990 /* If an external test-and-set libcall is provided, use that instead of
5991 any external compare-and-swap that we might get from the compare-and-
5992 swap-loop expansion later. */
5993 if (!can_compare_and_swap_p (mode, false))
5995 rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
5996 if (libfunc != NULL)
5998 rtx addr;
6000 addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6001 return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6002 mode, addr, ptr_mode,
6003 val, mode);
6007 /* If the test_and_set can't be emitted, eliminate any barrier that might
6008 have been emitted. */
6009 delete_insns_since (last_insn);
6010 return NULL_RTX;
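/* Schematically, expanding a seq-cst exchange through the acquire-only
   __sync_lock_test_and_set pattern therefore emits (sketch only):

       mem_thread_fence (model);                  release side, above
       old = sync_lock_test_and_set (mem, val);   acquire side

   so the pair together provides the ordering the stronger model
   requires.  */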
6013 /* This function tries to implement an atomic exchange operation using a
6014 compare_and_swap loop. VAL is written to *MEM. The previous contents of
6015 *MEM are returned, using TARGET if possible. No memory model is required
6016 since a compare_and_swap loop is seq-cst. */
6018 static rtx
6019 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6021 machine_mode mode = GET_MODE (mem);
6023 if (can_compare_and_swap_p (mode, true))
6025 if (!target || !register_operand (target, mode))
6026 target = gen_reg_rtx (mode);
6027 if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6028 return target;
6031 return NULL_RTX;
6034 /* This function tries to implement an atomic test-and-set operation
6035 using the atomic_test_and_set instruction pattern. A boolean value
6036 is returned from the operation, using TARGET if possible. */
6038 static rtx
6039 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6041 machine_mode pat_bool_mode;
6042 struct expand_operand ops[3];
6044 if (!targetm.have_atomic_test_and_set ())
6045 return NULL_RTX;
6047 /* While we always get QImode from __atomic_test_and_set, we get
6048 other memory modes from __sync_lock_test_and_set. Note that we
6049 use no endian adjustment here. This matches the GCC 4.6 behavior
6050 in the SPARC backend. */
6051 enum insn_code icode = targetm.code_for_atomic_test_and_set;
6052 gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6053 if (GET_MODE (mem) != QImode)
6054 mem = adjust_address_nv (mem, QImode, 0);
6056 pat_bool_mode = insn_data[icode].operand[0].mode;
6057 create_output_operand (&ops[0], target, pat_bool_mode);
6058 create_fixed_operand (&ops[1], mem);
6059 create_integer_operand (&ops[2], model);
6061 if (maybe_expand_insn (icode, 3, ops))
6062 return ops[0].value;
6063 return NULL_RTX;
6066 /* This function expands the legacy __sync_lock_test_and_set operation, which
6067 is generally an atomic exchange. Some limited targets only allow the
6068 constant 1 to be stored. This is an ACQUIRE operation.
6070 TARGET is an optional place to stick the return value.
6071 MEM is where VAL is stored. */
6073 rtx
6074 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6076 rtx ret;
6078 /* Try an atomic_exchange first. */
6079 ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6080 if (ret)
6081 return ret;
6083 ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6084 MEMMODEL_SYNC_ACQUIRE);
6085 if (ret)
6086 return ret;
6088 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6089 if (ret)
6090 return ret;
6092 /* If there are no other options, try atomic_test_and_set if the value
6093 being stored is 1. */
6094 if (val == const1_rtx)
6095 ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6097 return ret;
6100 /* This function expands the atomic test_and_set operation:
6101 atomically store a boolean TRUE into MEM and return the previous value.
6103 MEMMODEL is the memory model variant to use.
6104 TARGET is an optional place to stick the return value. */
6106 rtx
6107 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6109 machine_mode mode = GET_MODE (mem);
6110 rtx ret, trueval, subtarget;
6112 ret = maybe_emit_atomic_test_and_set (target, mem, model);
6113 if (ret)
6114 return ret;
6116 /* Be binary compatible with non-default settings of trueval, and different
6117 cpu revisions. E.g. one revision may have atomic-test-and-set, but
6118 another only has atomic-exchange. */
6119 if (targetm.atomic_test_and_set_trueval == 1)
6121 trueval = const1_rtx;
6122 subtarget = target ? target : gen_reg_rtx (mode);
6124 else
6126 trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6127 subtarget = gen_reg_rtx (mode);
6130 /* Try the atomic-exchange optab... */
6131 ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6133 /* ... then an atomic-compare-and-swap loop ... */
6134 if (!ret)
6135 ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6137 /* ... before trying the vaguely defined legacy lock_test_and_set. */
6138 if (!ret)
6139 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6141 /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6142 things with the value 1. Thus we try again without trueval. */
6143 if (!ret && targetm.atomic_test_and_set_trueval != 1)
6144 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6146 /* Failing all else, assume a single threaded environment and simply
6147 perform the operation. */
6148 if (!ret)
6150 /* If the result is ignored, skip the move to target. */
6151 if (subtarget != const0_rtx)
6152 emit_move_insn (subtarget, mem);
6154 emit_move_insn (mem, trueval);
6155 ret = subtarget;
6158 /* Recall that we have to return a boolean value; rectify if trueval
6159 is not exactly one. */
6160 if (targetm.atomic_test_and_set_trueval != 1)
6161 ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6163 return ret;
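/* For example, on a target whose atomic_test_and_set_trueval is 0xff
   (a test-and-set that stores all-ones), the exchange-based fallback
   reads back either 0 or 0xff; the emit_store_flag_force call above
   then normalizes this to the 0/1 boolean the caller expects, i.e.
   ret = (ret != 0).  */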
6166 /* This function expands the atomic exchange operation:
6167 atomically store VAL in MEM and return the previous value in MEM.
6169 MEMMODEL is the memory model variant to use.
6170 TARGET is an optional place to stick the return value. */
6173 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6175 machine_mode mode = GET_MODE (mem);
6176 rtx ret;
6178 /* If loads are not atomic for the required size and we are not called to
6179 provide a __sync builtin, do not do anything so that we stay consistent
6180 with atomic loads of the same size. */
6181 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6182 return NULL_RTX;
6184 ret = maybe_emit_atomic_exchange (target, mem, val, model);
6186 /* Next try a compare-and-swap loop for the exchange. */
6187 if (!ret)
6188 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6190 return ret;
6193 /* This function expands the atomic compare exchange operation:
6195 *PTARGET_BOOL is an optional place to store the boolean success/failure.
6196 *PTARGET_OVAL is an optional place to store the old value from memory.
6197 Both target parameters may be NULL or const0_rtx to indicate that we do
6198 not care about that return value. Both target parameters are updated on
6199 success to the actual location of the corresponding result.
6201 MEMMODEL is the memory model variant to use.
6203 The return value of the function is true for success. */
6205 bool
6206 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6207 rtx mem, rtx expected, rtx desired,
6208 bool is_weak, enum memmodel succ_model,
6209 enum memmodel fail_model)
6211 machine_mode mode = GET_MODE (mem);
6212 struct expand_operand ops[8];
6213 enum insn_code icode;
6214 rtx target_oval, target_bool = NULL_RTX;
6215 rtx libfunc;
6217 /* If loads are not atomic for the required size and we are not called to
6218 provide a __sync builtin, do not do anything so that we stay consistent
6219 with atomic loads of the same size. */
6220 if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6221 return false;
6223 /* Load expected into a register for the compare and swap. */
6224 if (MEM_P (expected))
6225 expected = copy_to_reg (expected);
6227 /* Make sure we always have some place to put the return oldval.
6228 Further, make sure that place is distinct from the input expected,
6229 just in case we need that path down below. */
6230 if (ptarget_oval && *ptarget_oval == const0_rtx)
6231 ptarget_oval = NULL;
6233 if (ptarget_oval == NULL
6234 || (target_oval = *ptarget_oval) == NULL
6235 || reg_overlap_mentioned_p (expected, target_oval))
6236 target_oval = gen_reg_rtx (mode);
6238 icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6239 if (icode != CODE_FOR_nothing)
6241 machine_mode bool_mode = insn_data[icode].operand[0].mode;
6243 if (ptarget_bool && *ptarget_bool == const0_rtx)
6244 ptarget_bool = NULL;
6246 /* Make sure we always have a place for the bool operand. */
6247 if (ptarget_bool == NULL
6248 || (target_bool = *ptarget_bool) == NULL
6249 || GET_MODE (target_bool) != bool_mode)
6250 target_bool = gen_reg_rtx (bool_mode);
6252 /* Emit the compare_and_swap. */
6253 create_output_operand (&ops[0], target_bool, bool_mode);
6254 create_output_operand (&ops[1], target_oval, mode);
6255 create_fixed_operand (&ops[2], mem);
6256 create_input_operand (&ops[3], expected, mode);
6257 create_input_operand (&ops[4], desired, mode);
6258 create_integer_operand (&ops[5], is_weak);
6259 create_integer_operand (&ops[6], succ_model);
6260 create_integer_operand (&ops[7], fail_model);
6261 if (maybe_expand_insn (icode, 8, ops))
6263 /* Return success/failure. */
6264 target_bool = ops[0].value;
6265 target_oval = ops[1].value;
6266 goto success;
6270 /* Otherwise fall back to the original __sync_val_compare_and_swap
6271 which is always seq-cst. */
6272 icode = optab_handler (sync_compare_and_swap_optab, mode);
6273 if (icode != CODE_FOR_nothing)
6275 rtx cc_reg;
6277 create_output_operand (&ops[0], target_oval, mode);
6278 create_fixed_operand (&ops[1], mem);
6279 create_input_operand (&ops[2], expected, mode);
6280 create_input_operand (&ops[3], desired, mode);
6281 if (!maybe_expand_insn (icode, 4, ops))
6282 return false;
6284 target_oval = ops[0].value;
6286 /* If the caller isn't interested in the boolean return value,
6287 skip the computation of it. */
6288 if (ptarget_bool == NULL)
6289 goto success;
6291 /* Otherwise, work out if the compare-and-swap succeeded. */
6292 cc_reg = NULL_RTX;
6293 if (have_insn_for (COMPARE, CCmode))
6294 note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6295 if (cc_reg)
6297 target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6298 const0_rtx, VOIDmode, 0, 1);
6299 goto success;
6301 goto success_bool_from_val;
6304 /* Also check for library support for __sync_val_compare_and_swap. */
6305 libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6306 if (libfunc != NULL)
6308 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6309 rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6310 mode, addr, ptr_mode,
6311 expected, mode, desired, mode);
6312 emit_move_insn (target_oval, target);
6314 /* Compute the boolean return value only if requested. */
6315 if (ptarget_bool)
6316 goto success_bool_from_val;
6317 else
6318 goto success;
6321 /* Failure. */
6322 return false;
6324 success_bool_from_val:
6325 target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6326 expected, VOIDmode, 1, 1);
6327 success:
6328 /* Make sure that the oval output winds up where the caller asked. */
6329 if (ptarget_oval)
6330 *ptarget_oval = target_oval;
6331 if (ptarget_bool)
6332 *ptarget_bool = target_bool;
6333 return true;
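/* In the success_bool_from_val case the boolean result is derived
   purely from the returned value:

       target_bool = (target_oval == expected);

   which is correct because a strong compare-and-swap succeeds exactly
   when the value it read back equals EXPECTED.  */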
6336 /* Generate asm volatile("" : : : "memory") as the memory blockage. */
6338 static void
6339 expand_asm_memory_blockage (void)
6341 rtx asm_op, clob;
6343 asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6344 rtvec_alloc (0), rtvec_alloc (0),
6345 rtvec_alloc (0), UNKNOWN_LOCATION);
6346 MEM_VOLATILE_P (asm_op) = 1;
6348 clob = gen_rtx_SCRATCH (VOIDmode);
6349 clob = gen_rtx_MEM (BLKmode, clob);
6350 clob = gen_rtx_CLOBBER (VOIDmode, clob);
6352 emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6355 /* Do not propagate memory accesses across this point. */
6357 static void
6358 expand_memory_blockage (void)
6360 if (targetm.have_memory_blockage ())
6361 emit_insn (targetm.gen_memory_blockage ());
6362 else
6363 expand_asm_memory_blockage ();
6366 /* This routine will either emit the mem_thread_fence pattern or issue a
6367 sync_synchronize to generate a fence for memory model MEMMODEL. */
6369 void
6370 expand_mem_thread_fence (enum memmodel model)
6372 if (is_mm_relaxed (model))
6373 return;
6374 if (targetm.have_mem_thread_fence ())
6376 emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6377 expand_memory_blockage ();
6379 else if (targetm.have_memory_barrier ())
6380 emit_insn (targetm.gen_memory_barrier ());
6381 else if (synchronize_libfunc != NULL_RTX)
6382 emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
6383 else
6384 expand_memory_blockage ();
6387 /* Emit a signal fence with given memory model. */
6389 void
6390 expand_mem_signal_fence (enum memmodel model)
6392 /* No machine barrier is required to implement a signal fence, but
6393 a compiler memory barrier must be issued, except for relaxed MM. */
6394 if (!is_mm_relaxed (model))
6395 expand_memory_blockage ();
6398 /* This function expands the atomic load operation:
6399 return the atomically loaded value in MEM.
6401 MEMMODEL is the memory model variant to use.
6402 TARGET is an optional place to stick the return value. */
6404 rtx
6405 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6407 machine_mode mode = GET_MODE (mem);
6408 enum insn_code icode;
6410 /* If the target supports the load directly, great. */
6411 icode = direct_optab_handler (atomic_load_optab, mode);
6412 if (icode != CODE_FOR_nothing)
6414 struct expand_operand ops[3];
6415 rtx_insn *last = get_last_insn ();
6416 if (is_mm_seq_cst (model))
6417 expand_memory_blockage ();
6419 create_output_operand (&ops[0], target, mode);
6420 create_fixed_operand (&ops[1], mem);
6421 create_integer_operand (&ops[2], model);
6422 if (maybe_expand_insn (icode, 3, ops))
6424 if (!is_mm_relaxed (model))
6425 expand_memory_blockage ();
6426 return ops[0].value;
6428 delete_insns_since (last);
6431 /* If the size of the object is greater than word size on this target,
6432 then we assume that a load will not be atomic. We could try to
6433 emulate a load with a compare-and-swap operation, but the store this
6434 would entail could be incorrect if this is a volatile atomic load or
6435 the memory is mapped read-only. */
6436 if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6437 /* If there is no atomic load, leave the library call. */
6438 return NULL_RTX;
6440 /* Otherwise assume loads are atomic, and emit the proper barriers. */
6441 if (!target || target == const0_rtx)
6442 target = gen_reg_rtx (mode);
6444 /* For SEQ_CST, emit a barrier before the load. */
6445 if (is_mm_seq_cst (model))
6446 expand_mem_thread_fence (model);
6448 emit_move_insn (target, mem);
6450 /* Emit the appropriate barrier after the load. */
6451 expand_mem_thread_fence (model);
6453 return target;
6456 /* This function expands the atomic store operation:
6457 Atomically store VAL in MEM.
6458 MEMMODEL is the memory model variant to use.
6459 USE_RELEASE is true if __sync_lock_release can be used as a fallback.
6460 The function returns const0_rtx if a pattern was emitted. */
6462 rtx
6463 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6465 machine_mode mode = GET_MODE (mem);
6466 enum insn_code icode;
6467 struct expand_operand ops[3];
6469 /* If the target supports the store directly, great. */
6470 icode = direct_optab_handler (atomic_store_optab, mode);
6471 if (icode != CODE_FOR_nothing)
6473 rtx_insn *last = get_last_insn ();
6474 if (!is_mm_relaxed (model))
6475 expand_memory_blockage ();
6476 create_fixed_operand (&ops[0], mem);
6477 create_input_operand (&ops[1], val, mode);
6478 create_integer_operand (&ops[2], model);
6479 if (maybe_expand_insn (icode, 3, ops))
6481 if (is_mm_seq_cst (model))
6482 expand_memory_blockage ();
6483 return const0_rtx;
6485 delete_insns_since (last);
6488 /* If using __sync_lock_release is a viable alternative, try it.
6489 Note that this will not be set to true if we are expanding a generic
6490 __atomic_store_n. */
6491 if (use_release)
6493 icode = direct_optab_handler (sync_lock_release_optab, mode);
6494 if (icode != CODE_FOR_nothing)
6496 create_fixed_operand (&ops[0], mem);
6497 create_input_operand (&ops[1], const0_rtx, mode);
6498 if (maybe_expand_insn (icode, 2, ops))
6500 /* lock_release is only a release barrier. */
6501 if (is_mm_seq_cst (model))
6502 expand_mem_thread_fence (model);
6503 return const0_rtx;
6508 /* If the size of the object is greater than word size on this target,
6509 a default store will not be atomic. */
6510 if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6512 /* If loads are atomic or we are called to provide a __sync builtin,
6513 we can try an atomic_exchange and throw away the result. Otherwise,
6514 don't do anything so that we do not create an inconsistency between
6515 loads and stores. */
6516 if (can_atomic_load_p (mode) || is_mm_sync (model))
6518 rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6519 if (!target)
6520 target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6521 val);
6522 if (target)
6523 return const0_rtx;
6525 return NULL_RTX;
6528 /* Otherwise assume stores are atomic, and emit the proper barriers. */
6529 expand_mem_thread_fence (model);
6531 emit_move_insn (mem, val);
6533 /* For SEQ_CST, also emit a barrier after the store. */
6534 if (is_mm_seq_cst (model))
6535 expand_mem_thread_fence (model);
6537 return const0_rtx;
6541 /* Structure containing the pointers and values required to process the
6542 various forms of the atomic_fetch_op and atomic_op_fetch builtins. */
6544 struct atomic_op_functions
6546 direct_optab mem_fetch_before;
6547 direct_optab mem_fetch_after;
6548 direct_optab mem_no_result;
6549 optab fetch_before;
6550 optab fetch_after;
6551 direct_optab no_result;
6552 enum rtx_code reverse_code;
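/* REVERSE_CODE supports compensation between the two fetch flavors.
   The fetch-after result can always be rebuilt from fetch-before by
   reapplying the operation, e.g. for PLUS:

       newval = oldval + val;

   The opposite direction needs an inverse: MINUS undoes PLUS (and
   vice versa) and XOR undoes itself, but AND, IOR and NOT have no
   inverse, hence reverse_code == UNKNOWN for those.  */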
6556 /* Fill in structure pointed to by OP with the various optab entries for an
6557 operation of type CODE. */
6559 static void
6560 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6562 gcc_assert (op != NULL);
6564 /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6565 in the source code during compilation, and the optab entries are not
6566 computable until runtime. Fill in the values at runtime. */
6567 switch (code)
6569 case PLUS:
6570 op->mem_fetch_before = atomic_fetch_add_optab;
6571 op->mem_fetch_after = atomic_add_fetch_optab;
6572 op->mem_no_result = atomic_add_optab;
6573 op->fetch_before = sync_old_add_optab;
6574 op->fetch_after = sync_new_add_optab;
6575 op->no_result = sync_add_optab;
6576 op->reverse_code = MINUS;
6577 break;
6578 case MINUS:
6579 op->mem_fetch_before = atomic_fetch_sub_optab;
6580 op->mem_fetch_after = atomic_sub_fetch_optab;
6581 op->mem_no_result = atomic_sub_optab;
6582 op->fetch_before = sync_old_sub_optab;
6583 op->fetch_after = sync_new_sub_optab;
6584 op->no_result = sync_sub_optab;
6585 op->reverse_code = PLUS;
6586 break;
6587 case XOR:
6588 op->mem_fetch_before = atomic_fetch_xor_optab;
6589 op->mem_fetch_after = atomic_xor_fetch_optab;
6590 op->mem_no_result = atomic_xor_optab;
6591 op->fetch_before = sync_old_xor_optab;
6592 op->fetch_after = sync_new_xor_optab;
6593 op->no_result = sync_xor_optab;
6594 op->reverse_code = XOR;
6595 break;
6596 case AND:
6597 op->mem_fetch_before = atomic_fetch_and_optab;
6598 op->mem_fetch_after = atomic_and_fetch_optab;
6599 op->mem_no_result = atomic_and_optab;
6600 op->fetch_before = sync_old_and_optab;
6601 op->fetch_after = sync_new_and_optab;
6602 op->no_result = sync_and_optab;
6603 op->reverse_code = UNKNOWN;
6604 break;
6605 case IOR:
6606 op->mem_fetch_before = atomic_fetch_or_optab;
6607 op->mem_fetch_after = atomic_or_fetch_optab;
6608 op->mem_no_result = atomic_or_optab;
6609 op->fetch_before = sync_old_ior_optab;
6610 op->fetch_after = sync_new_ior_optab;
6611 op->no_result = sync_ior_optab;
6612 op->reverse_code = UNKNOWN;
6613 break;
6614 case NOT:
6615 op->mem_fetch_before = atomic_fetch_nand_optab;
6616 op->mem_fetch_after = atomic_nand_fetch_optab;
6617 op->mem_no_result = atomic_nand_optab;
6618 op->fetch_before = sync_old_nand_optab;
6619 op->fetch_after = sync_new_nand_optab;
6620 op->no_result = sync_nand_optab;
6621 op->reverse_code = UNKNOWN;
6622 break;
6623 default:
6624 gcc_unreachable ();
6628 /* See if there is a more efficient way to implement the operation "*MEM CODE VAL"
6629 using memory order MODEL. If AFTER is true the operation needs to return
6630 the value of *MEM after the operation, otherwise the previous value.
6631 TARGET is an optional place to put the result. The result is unused if
6632 it is const0_rtx.
6633 Return the result if there is a better sequence, otherwise NULL_RTX. */
6635 static rtx
6636 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6637 enum memmodel model, bool after)
6639 /* If the value is prefetched, or not used, it may be possible to replace
6640 the sequence with a native exchange operation. */
6641 if (!after || target == const0_rtx)
6643 /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m). */
6644 if (code == AND && val == const0_rtx)
6646 if (target == const0_rtx)
6647 target = gen_reg_rtx (GET_MODE (mem));
6648 return maybe_emit_atomic_exchange (target, mem, val, model);
6651 /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m). */
6652 if (code == IOR && val == constm1_rtx)
6654 if (target == const0_rtx)
6655 target = gen_reg_rtx (GET_MODE (mem));
6656 return maybe_emit_atomic_exchange (target, mem, val, model);
6660 return NULL_RTX;
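/* Both rewrites above rely on the result being independent of the
   previous contents: (x & 0) == 0 and (x | -1) == -1 for every x, so
   the value left in memory is known in advance and an atomic exchange
   of that constant is semantically equivalent (and usually cheaper
   than a read-modify-write).  */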
6663 /* Try to emit an instruction for a specific operation variation.
6664 OPTAB contains the OP functions.
6665 TARGET is an optional place to return the result. const0_rtx means unused.
6666 MEM is the memory location to operate on.
6667 VAL is the value to use in the operation.
6668 USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6669 MODEL is the memory model, if used.
6670 AFTER is true if the returned result is the value after the operation. */
6672 static rtx
6673 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6674 rtx val, bool use_memmodel, enum memmodel model, bool after)
6676 machine_mode mode = GET_MODE (mem);
6677 struct expand_operand ops[4];
6678 enum insn_code icode;
6679 int op_counter = 0;
6680 int num_ops;
6682 /* Check to see if there is a result returned. */
6683 if (target == const0_rtx)
6685 if (use_memmodel)
6687 icode = direct_optab_handler (optab->mem_no_result, mode);
6688 create_integer_operand (&ops[2], model);
6689 num_ops = 3;
6691 else
6693 icode = direct_optab_handler (optab->no_result, mode);
6694 num_ops = 2;
6697 /* Otherwise, we need to generate a result. */
6698 else
6700 if (use_memmodel)
6702 icode = direct_optab_handler (after ? optab->mem_fetch_after
6703 : optab->mem_fetch_before, mode);
6704 create_integer_operand (&ops[3], model);
6705 num_ops = 4;
6707 else
6709 icode = optab_handler (after ? optab->fetch_after
6710 : optab->fetch_before, mode);
6711 num_ops = 3;
6713 create_output_operand (&ops[op_counter++], target, mode);
6715 if (icode == CODE_FOR_nothing)
6716 return NULL_RTX;
6718 create_fixed_operand (&ops[op_counter++], mem);
6719 /* VAL may have been promoted to a wider mode. Shrink it if so. */
6720 create_convert_operand_to (&ops[op_counter++], val, mode, true);
6722 if (maybe_expand_insn (icode, num_ops, ops))
6723 return (target == const0_rtx ? const0_rtx : ops[0].value);
6725 return NULL_RTX;
6729 /* This function expands an atomic fetch_OP or OP_fetch operation:
6730 TARGET is an optional place to stick the return value. const0_rtx indicates
6731 the result is unused.
6732 Atomically fetch the value in MEM, perform the operation with VAL, and store the result back to MEM.
6733 CODE is the operation being performed (OP).
6734 MEMMODEL is the memory model variant to use.
6735 AFTER is true to return the result of the operation (OP_fetch).
6736 AFTER is false to return the value before the operation (fetch_OP).
6738 This function will *only* generate instructions if there is a direct
6739 optab. No compare and swap loops or libcalls will be generated. */
6741 static rtx
6742 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6743 enum rtx_code code, enum memmodel model,
6744 bool after)
6746 machine_mode mode = GET_MODE (mem);
6747 struct atomic_op_functions optab;
6748 rtx result;
6749 bool unused_result = (target == const0_rtx);
6751 get_atomic_op_for_code (&optab, code);
6753 /* Check to see if there are any better instructions. */
6754 result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6755 if (result)
6756 return result;
6758 /* Check for the case where the result isn't used and try those patterns. */
6759 if (unused_result)
6761 /* Try the memory model variant first. */
6762 result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6763 if (result)
6764 return result;
6766 /* Next try the old style without a memory model. */
6767 result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6768 if (result)
6769 return result;
6771 /* There is no no-result pattern, so try patterns with a result. */
6772 target = NULL_RTX;
6775 /* Try the __atomic version. */
6776 result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6777 if (result)
6778 return result;
6780 /* Try the older __sync version. */
6781 result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6782 if (result)
6783 return result;
6785 /* If the fetch value can be calculated from the other variation of fetch,
6786 try that operation. */
6787 if (after || unused_result || optab.reverse_code != UNKNOWN)
6789 /* Try the __atomic version, then the older __sync version. */
6790 result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6791 if (!result)
6792 result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6794 if (result)
6796 /* If the result isn't used, no need to do compensation code. */
6797 if (unused_result)
6798 return result;
6800 /* Issue compensation code. Fetch_after == fetch_before OP val.
6801 Fetch_before == fetch_after REVERSE_OP val. */
6802 if (!after)
6803 code = optab.reverse_code;
6804 if (code == NOT)
6806 result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6807 true, OPTAB_LIB_WIDEN);
6808 result = expand_simple_unop (mode, NOT, result, target, true);
6810 else
6811 result = expand_simple_binop (mode, code, result, val, target,
6812 true, OPTAB_LIB_WIDEN);
6813 return result;
6817 /* No direct opcode can be generated. */
6818 return NULL_RTX;
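/* A worked example of the compensation path for NOT (i.e. nand):
   if only the fetch-before pattern exists, oldval = fetch_nand (mem,
   val) leaves *mem == ~(oldval & val), so the fetch-after result is
   rebuilt from the returned value just as the code above does:

       result = ~(result & val);

   expressed as an AND followed by a NOT because there is no single
   nand rtx code to hand to expand_simple_binop.  */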
6823 /* This function expands an atomic fetch_OP or OP_fetch operation:
6824 TARGET is an optional place to stick the return value. const0_rtx indicates
6825 the result is unused.
6826 Atomically fetch the value in MEM, perform the operation with VAL, and store the result back to MEM.
6827 CODE is the operation being performed (OP).
6828 MEMMODEL is the memory model variant to use.
6829 AFTER is true to return the result of the operation (OP_fetch).
6830 AFTER is false to return the value before the operation (fetch_OP). */
6831 rtx
6832 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6833 enum memmodel model, bool after)
6835 machine_mode mode = GET_MODE (mem);
6836 rtx result;
6837 bool unused_result = (target == const0_rtx);
6839 /* If loads are not atomic for the required size and we are not called to
6840 provide a __sync builtin, do not do anything so that we stay consistent
6841 with atomic loads of the same size. */
6842 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6843 return NULL_RTX;
6845 result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6846 after);
6848 if (result)
6849 return result;
6851 /* Add/sub can be implemented by doing the reverse operation with -(val). */
6852 if (code == PLUS || code == MINUS)
6854 rtx tmp;
6855 enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6857 start_sequence ();
6858 tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6859 result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6860 model, after);
6861 if (result)
6863 /* The reverse operation worked, so emit the insns and return. */
6864 tmp = get_insns ();
6865 end_sequence ();
6866 emit_insn (tmp);
6867 return result;
6870 /* The reverse operation did not work, so throw away the negation code and continue. */
6871 end_sequence ();
6874 /* Try the __sync libcalls only if we can't do compare-and-swap inline. */
6875 if (!can_compare_and_swap_p (mode, false))
6877 rtx libfunc;
6878 bool fixup = false;
6879 enum rtx_code orig_code = code;
6880 struct atomic_op_functions optab;
6882 get_atomic_op_for_code (&optab, code);
6883 libfunc = optab_libfunc (after ? optab.fetch_after
6884 : optab.fetch_before, mode);
6885 if (libfunc == NULL
6886 && (after || unused_result || optab.reverse_code != UNKNOWN))
6888 fixup = true;
6889 if (!after)
6890 code = optab.reverse_code;
6891 libfunc = optab_libfunc (after ? optab.fetch_before
6892 : optab.fetch_after, mode);
6894 if (libfunc != NULL)
6896 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6897 result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6898 addr, ptr_mode, val, mode);
6900 if (!unused_result && fixup)
6901 result = expand_simple_binop (mode, code, result, val, target,
6902 true, OPTAB_LIB_WIDEN);
6903 return result;
6906 /* We need the original code for any further attempts. */
6907 code = orig_code;
6910 /* If nothing else has succeeded, default to a compare and swap loop. */
6911 if (can_compare_and_swap_p (mode, true))
6913 rtx_insn *insn;
6914 rtx t0 = gen_reg_rtx (mode), t1;
6916 start_sequence ();
6918 /* If the result is used, get a register for it. */
6919 if (!unused_result)
6921 if (!target || !register_operand (target, mode))
6922 target = gen_reg_rtx (mode);
6923 /* If fetch_before, copy the value now. */
6924 if (!after)
6925 emit_move_insn (target, t0);
6927 else
6928 target = const0_rtx;
6930 t1 = t0;
6931 if (code == NOT)
6933 t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
6934 true, OPTAB_LIB_WIDEN);
6935 t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
6937 else
6938 t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
6939 OPTAB_LIB_WIDEN);
6941 /* For after, copy the value now. */
6942 if (!unused_result && after)
6943 emit_move_insn (target, t1);
6944 insn = get_insns ();
6945 end_sequence ();
6947 if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
6948 return target;
6951 return NULL_RTX;
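/* For example, a target that only provides an atomic add pattern can
   still expand a subtraction this way (sketch):

       atomic_fetch_sub (mem, val)  ==  atomic_fetch_add (mem, -val)

   which is why the negation sequence above is built inside
   start_sequence/end_sequence and simply dropped if the reversed
   operation cannot be expanded either.  */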
6954 /* Return true if OPERAND is suitable for operand number OPNO of
6955 instruction ICODE. */
6957 bool
6958 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
6960 return (!insn_data[(int) icode].operand[opno].predicate
6961 || (insn_data[(int) icode].operand[opno].predicate
6962 (operand, insn_data[(int) icode].operand[opno].mode)));
6965 /* TARGET is a target of a multiword operation that we are going to
6966 implement as a series of word-mode operations. Return true if
6967 TARGET is suitable for this purpose. */
6969 bool
6970 valid_multiword_target_p (rtx target)
6972 machine_mode mode;
6973 int i;
6975 mode = GET_MODE (target);
6976 for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
6977 if (!validate_subreg (word_mode, mode, target, i))
6978 return false;
6979 return true;
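/* For example, on a 32-bit target a DImode TARGET is checked as two
   word_mode pieces: validate_subreg is queried at byte offsets 0 and
   4, and TARGET is rejected if either word-sized subreg could not be
   formed.  */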
6982 /* Make OP describe an input operand that has value INTVAL and that has
6983 no inherent mode. This function should only be used for operands that
6984 are always expand-time constants. The backend may request that INTVAL
6985 be copied into a different kind of rtx, but it must specify the mode
6986 of that rtx if so. */
6988 void
6989 create_integer_operand (struct expand_operand *op, poly_int64 intval)
6991 create_expand_operand (op, EXPAND_INTEGER,
6992 gen_int_mode (intval, MAX_MODE_INT),
6993 VOIDmode, false, intval);
6996 /* Like maybe_legitimize_operand, but do not change the code of the
6997 current rtx value. */
6999 static bool
7000 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7001 struct expand_operand *op)
7003 /* See if the operand matches in its current form. */
7004 if (insn_operand_matches (icode, opno, op->value))
7005 return true;
7007 /* If the operand is a memory whose address has no side effects,
7008 try forcing the address into a non-virtual pseudo register.
7009 The check for side effects is important because copy_to_mode_reg
7010 cannot handle things like auto-modified addresses. */
7011 if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7013 rtx addr, mem;
7015 mem = op->value;
7016 addr = XEXP (mem, 0);
7017 if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7018 && !side_effects_p (addr))
7020 rtx_insn *last;
7021 machine_mode mode;
7023 last = get_last_insn ();
7024 mode = get_address_mode (mem);
7025 mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
7026 if (insn_operand_matches (icode, opno, mem))
7028 op->value = mem;
7029 return true;
7031 delete_insns_since (last);
7035 return false;
7038 /* Try to make OP match operand OPNO of instruction ICODE. Return true
7039 on success, storing the new operand value back in OP. */
7041 static bool
7042 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
7043 struct expand_operand *op)
7045 machine_mode mode, imode;
7046 bool old_volatile_ok, result;
7048 mode = op->mode;
7049 switch (op->type)
7051 case EXPAND_FIXED:
7052 old_volatile_ok = volatile_ok;
7053 volatile_ok = true;
7054 result = maybe_legitimize_operand_same_code (icode, opno, op);
7055 volatile_ok = old_volatile_ok;
7056 return result;
7058 case EXPAND_OUTPUT:
7059 gcc_assert (mode != VOIDmode);
7060 if (op->value
7061 && op->value != const0_rtx
7062 && GET_MODE (op->value) == mode
7063 && maybe_legitimize_operand_same_code (icode, opno, op))
7064 return true;
7066 op->value = gen_reg_rtx (mode);
7067 op->target = 0;
7068 break;
7070 case EXPAND_INPUT:
7071 input:
7072 gcc_assert (mode != VOIDmode);
7073 gcc_assert (GET_MODE (op->value) == VOIDmode
7074 || GET_MODE (op->value) == mode);
7075 if (maybe_legitimize_operand_same_code (icode, opno, op))
7076 return true;
7078 op->value = copy_to_mode_reg (mode, op->value);
7079 break;
7081 case EXPAND_CONVERT_TO:
7082 gcc_assert (mode != VOIDmode);
7083 op->value = convert_to_mode (mode, op->value, op->unsigned_p);
7084 goto input;
7086 case EXPAND_CONVERT_FROM:
7087 if (GET_MODE (op->value) != VOIDmode)
7088 mode = GET_MODE (op->value);
7089 else
7090 /* The caller must tell us what mode this value has. */
7091 gcc_assert (mode != VOIDmode);
7093 imode = insn_data[(int) icode].operand[opno].mode;
7094 if (imode != VOIDmode && imode != mode)
7096 op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
7097 mode = imode;
7099 goto input;
7101 case EXPAND_ADDRESS:
7102 op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
7103 op->value);
7104 goto input;
7106 case EXPAND_INTEGER:
7107 mode = insn_data[(int) icode].operand[opno].mode;
7108 if (mode != VOIDmode
7109 && known_eq (trunc_int_for_mode (op->int_value, mode),
7110 op->int_value))
7112 op->value = gen_int_mode (op->int_value, mode);
7113 goto input;
7115 break;
7117 return insn_operand_matches (icode, opno, op->value);
7120 /* Make OP describe an input operand that should have the same value
7121 as VALUE, after any mode conversion that the target might request.
7122 TYPE is the type of VALUE. */
7124 void
7125 create_convert_operand_from_type (struct expand_operand *op,
7126 rtx value, tree type)
7128 create_convert_operand_from (op, value, TYPE_MODE (type),
7129 TYPE_UNSIGNED (type));
7132 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
7133 of instruction ICODE. Return true on success, leaving the new operand
7134 values in the OPS themselves. Emit no code on failure. */
7136 bool
7137 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7138 unsigned int nops, struct expand_operand *ops)
7140 rtx_insn *last;
7141 unsigned int i;
7143 last = get_last_insn ();
7144 for (i = 0; i < nops; i++)
7145 if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
7147 delete_insns_since (last);
7148 return false;
7150 return true;
7153 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7154 as its operands. Return the instruction pattern on success,
7155 and emit any necessary set-up code. Return null and emit no
7156 code on failure. */
7158 rtx_insn *
7159 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7160 struct expand_operand *ops)
7162 gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7163 if (!maybe_legitimize_operands (icode, 0, nops, ops))
7164 return NULL;
7166 switch (nops)
7168 case 1:
7169 return GEN_FCN (icode) (ops[0].value);
7170 case 2:
7171 return GEN_FCN (icode) (ops[0].value, ops[1].value);
7172 case 3:
7173 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7174 case 4:
7175 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7176 ops[3].value);
7177 case 5:
7178 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7179 ops[3].value, ops[4].value);
7180 case 6:
7181 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7182 ops[3].value, ops[4].value, ops[5].value);
7183 case 7:
7184 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7185 ops[3].value, ops[4].value, ops[5].value,
7186 ops[6].value);
7187 case 8:
7188 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7189 ops[3].value, ops[4].value, ops[5].value,
7190 ops[6].value, ops[7].value);
7191 case 9:
7192 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7193 ops[3].value, ops[4].value, ops[5].value,
7194 ops[6].value, ops[7].value, ops[8].value);
7196 gcc_unreachable ();
7199 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7200 as its operands. Return true on success and emit no code on failure. */
7202 bool
7203 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7204 struct expand_operand *ops)
7206 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7207 if (pat)
7209 emit_insn (pat);
7210 return true;
7212 return false;
7215 /* Like maybe_expand_insn, but for jumps. */
7217 bool
7218 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7219 struct expand_operand *ops)
7221 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7222 if (pat)
7224 emit_jump_insn (pat);
7225 return true;
7227 return false;
7230 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7231 as its operands. */
7233 void
7234 expand_insn (enum insn_code icode, unsigned int nops,
7235 struct expand_operand *ops)
7237 if (!maybe_expand_insn (icode, nops, ops))
7238 gcc_unreachable ();
7241 /* Like expand_insn, but for jumps. */
7243 void
7244 expand_jump_insn (enum insn_code icode, unsigned int nops,
7245 struct expand_operand *ops)
7247 if (!maybe_expand_jump_insn (icode, nops, ops))
7248 gcc_unreachable ();