gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2018 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "memmodel.h"
  29 #include "predict.h"
  30 #include "tm_p.h"
  31 #include "expmed.h"
  32 #include "optabs.h"
  33 #include "emit-rtl.h"
  34 #include "recog.h"
  35 #include "diagnostic-core.h"
  36 #include "rtx-vector-builder.h"
  37
  38 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  39    is properly defined.  */
  40 #include "stor-layout.h"
  41 #include "except.h"
  42 #include "dojump.h"
  43 #include "explow.h"
  44 #include "expr.h"
  45 #include "optabs-tree.h"
  46 #include "libfuncs.h"
  47
  48 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  49                                    machine_mode *);
  50 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  51 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  52
  53 /* Debug facility for use in GDB.  */
  54 void debug_optab_libfuncs (void);
  55 \f
  56 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
  57    the result of operation CODE applied to OP0 (and OP1 if it is a binary
  58    operation).
  59
  60    If the last insn does not set TARGET, don't do anything, but return 1.
  61
  62    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
  63    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
  64    try again, ensuring that TARGET is not one of the operands.  */
  65
  66 static int
  67 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
  68 {
  69   rtx_insn *last_insn;
  70   rtx set;
  71   rtx note;
  72
  73   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
  74
  75   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
  76       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
  77       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
  78       && GET_RTX_CLASS (code) != RTX_COMPARE
  79       && GET_RTX_CLASS (code) != RTX_UNARY)
  80     return 1;
  81
  82   if (GET_CODE (target) == ZERO_EXTRACT)
  83     return 1;
  84
  85   for (last_insn = insns;
  86        NEXT_INSN (last_insn) != NULL_RTX;
  87        last_insn = NEXT_INSN (last_insn))
  88     ;
  89
  90   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
  91      a value changing in the insn, so the note would be invalid for CSE.  */
  92   if (reg_overlap_mentioned_p (target, op0)
  93       || (op1 && reg_overlap_mentioned_p (target, op1)))
  94     {
  95       if (MEM_P (target)
  96           && (rtx_equal_p (target, op0)
  97               || (op1 && rtx_equal_p (target, op1))))
  98         {
  99           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 100              over expanding it as temp = MEM op X, MEM = temp.  If the target
 101              supports MEM = MEM op X instructions, it is sometimes too hard
 102              to reconstruct that form later, especially if X is also a memory,
 103              and due to multiple occurrences of addresses the address might
 104              be forced into register unnecessarily.
 105              Note that not emitting the REG_EQUIV note might inhibit
 106              CSE in some cases.  */
 107           set = single_set (last_insn);
 108           if (set
 109               && GET_CODE (SET_SRC (set)) == code
 110               && MEM_P (SET_DEST (set))
 111               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 112                   || (op1 && rtx_equal_p (SET_DEST (set),
 113                                           XEXP (SET_SRC (set), 1)))))
 114             return 1;
 115         }
 116       return 0;
 117     }
 118
 119   set = set_for_reg_notes (last_insn);
 120   if (set == NULL_RTX)
 121     return 1;
 122
 123   if (! rtx_equal_p (SET_DEST (set), target)
 124       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 125       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 126           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 127     return 1;
 128
 129   if (GET_RTX_CLASS (code) == RTX_UNARY)
 130     switch (code)
 131       {
 132       case FFS:
 133       case CLZ:
 134       case CTZ:
 135       case CLRSB:
 136       case POPCOUNT:
 137       case PARITY:
 138       case BSWAP:
 139         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 140           {
 141             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 142             if (GET_MODE_UNIT_SIZE (GET_MODE (op0))
 143                 > GET_MODE_UNIT_SIZE (GET_MODE (target)))
 144               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 145                                          note, GET_MODE (op0));
 146             else
 147               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 148                                          note, GET_MODE (op0));
 149             break;
 150           }
 151         /* FALLTHRU */
 152       default:
 153         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 154         break;
 155       }
 156   else
 157     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 158
 159   set_unique_reg_note (last_insn, REG_EQUAL, note);
 160
 161   return 1;
 162 }
 163 \f
 164 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 165    for a widening operation would be.  In most cases this would be OP0, but if
 166    that's a constant it'll be VOIDmode, which isn't useful.  */
 167
 168 static machine_mode
 169 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 170 {
 171   machine_mode m0 = GET_MODE (op0);
 172   machine_mode m1 = GET_MODE (op1);
 173   machine_mode result;
 174
 175   if (m0 == VOIDmode && m1 == VOIDmode)
 176     return to_mode;
 177   else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
 178     result = m1;
 179   else
 180     result = m0;
 181
 182   if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
 183     return to_mode;
 184
 185   return result;
 186 }
 187 \f
 188 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 189    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 190    not actually do a sign-extend or zero-extend, but can leave the
 191    higher-order bits of the result rtx undefined, for example, in the case
 192    of logical operations, but not right shifts.  */
 193
 194 static rtx
 195 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 196                int unsignedp, int no_extend)
 197 {
 198   rtx result;
 199   scalar_int_mode int_mode;
 200
 201   /* If we don't have to extend and this is a constant, return it.  */
 202   if (no_extend && GET_MODE (op) == VOIDmode)
 203     return op;
 204
 205   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 206      extend since it will be more efficient to do so unless the signedness of
 207      a promoted object differs from our extension.  */
 208   if (! no_extend
 209       || !is_a <scalar_int_mode> (mode, &int_mode)
 210       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 211           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 212     return convert_modes (mode, oldmode, op, unsignedp);
 213
 214   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 215      SUBREG.  */
 216   if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
 217     return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));
 218
 219   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 220      part to OP.  */
 221
 222   result = gen_reg_rtx (int_mode);
 223   emit_clobber (result);
 224   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 225   return result;
 226 }
 227 \f
 228 /* Expand vector widening operations.
 229
 230    There are two different classes of operations handled here:
 231    1) Operations whose result is wider than all the arguments to the operation.
 232       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 233       In this case OP0 and optionally OP1 would be initialized,
 234       but WIDE_OP wouldn't (not relevant for this case).
 235    2) Operations whose result is of the same size as the last argument to the
 236       operation, but wider than all the other arguments to the operation.
 237       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 238       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 239
 240    E.g, when called to expand the following operations, this is how
 241    the arguments will be initialized:
 242                                 nops    OP0     OP1     WIDE_OP
 243    widening-sum                 2       oprnd0  -       oprnd1
 244    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 245    widening-mult                2       oprnd0  oprnd1  -
 246    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 247
 248 rtx
 249 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 250                            rtx target, int unsignedp)
 251 {
 252   struct expand_operand eops[4];
 253   tree oprnd0, oprnd1, oprnd2;
 254   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 255   optab widen_pattern_optab;
 256   enum insn_code icode;
 257   int nops = TREE_CODE_LENGTH (ops->code);
 258   int op;
 259
 260   oprnd0 = ops->op0;
 261   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 262   if (ops->code == VEC_UNPACK_FIX_TRUNC_HI_EXPR
 263       || ops->code == VEC_UNPACK_FIX_TRUNC_LO_EXPR)
 264     /* The sign is from the result type rather than operand's type
 265        for these ops.  */
 266     widen_pattern_optab
 267       = optab_for_tree_code (ops->code, ops->type, optab_default);
 268   else
 269     widen_pattern_optab
 270       = optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 271   if (ops->code == WIDEN_MULT_PLUS_EXPR
 272       || ops->code == WIDEN_MULT_MINUS_EXPR)
 273     icode = find_widening_optab_handler (widen_pattern_optab,
 274                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 275                                          tmode0);
 276   else
 277     icode = optab_handler (widen_pattern_optab, tmode0);
 278   gcc_assert (icode != CODE_FOR_nothing);
 279
 280   if (nops >= 2)
 281     {
 282       oprnd1 = ops->op1;
 283       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 284     }
 285
 286   /* The last operand is of a wider mode than the rest of the operands.  */
 287   if (nops == 2)
 288     wmode = tmode1;
 289   else if (nops == 3)
 290     {
 291       gcc_assert (tmode1 == tmode0);
 292       gcc_assert (op1);
 293       oprnd2 = ops->op2;
 294       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 295     }
 296
 297   op = 0;
 298   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 299   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 300   if (op1)
 301     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 302   if (wide_op)
 303     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 304   expand_insn (icode, op, eops);
 305   return eops[0].value;
 306 }
 307
 308 /* Generate code to perform an operation specified by TERNARY_OPTAB
 309    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 310
 311    UNSIGNEDP is for the case where we have to widen the operands
 312    to perform the operation.  It says to use zero-extension.
 313
 314    If TARGET is nonzero, the value
 315    is generated there, if it is convenient to do so.
 316    In all cases an rtx is returned for the locus of the value;
 317    this may or may not be TARGET.  */
 318
 319 rtx
 320 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 321                    rtx op1, rtx op2, rtx target, int unsignedp)
 322 {
 323   struct expand_operand ops[4];
 324   enum insn_code icode = optab_handler (ternary_optab, mode);
 325
 326   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 327
 328   create_output_operand (&ops[0], target, mode);
 329   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 330   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 331   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 332   expand_insn (icode, 4, ops);
 333   return ops[0].value;
 334 }
 335
 336
 337 /* Like expand_binop, but return a constant rtx if the result can be
 338    calculated at compile time.  The arguments and return value are
 339    otherwise the same as for expand_binop.  */
 340
 341 rtx
 342 simplify_expand_binop (machine_mode mode, optab binoptab,
 343                        rtx op0, rtx op1, rtx target, int unsignedp,
 344                        enum optab_methods methods)
 345 {
 346   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 347     {
 348       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 349                                          mode, op0, op1);
 350       if (x)
 351         return x;
 352     }
 353
 354   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 355 }
 356
 357 /* Like simplify_expand_binop, but always put the result in TARGET.
 358    Return true if the expansion succeeded.  */
 359
 360 bool
 361 force_expand_binop (machine_mode mode, optab binoptab,
 362                     rtx op0, rtx op1, rtx target, int unsignedp,
 363                     enum optab_methods methods)
 364 {
 365   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 366                                  target, unsignedp, methods);
 367   if (x == 0)
 368     return false;
 369   if (x != target)
 370     emit_move_insn (target, x);
 371   return true;
 372 }
 373
 374 /* Create a new vector value in VMODE with all elements set to OP.  The
 375    mode of OP must be the element mode of VMODE.  If OP is a constant,
 376    then the return value will be a constant.  */
 377
 378 rtx
 379 expand_vector_broadcast (machine_mode vmode, rtx op)
 380 {
 381   int n;
 382   rtvec vec;
 383
 384   gcc_checking_assert (VECTOR_MODE_P (vmode));
 385
 386   if (valid_for_const_vector_p (vmode, op))
 387     return gen_const_vec_duplicate (vmode, op);
 388
 389   insn_code icode = optab_handler (vec_duplicate_optab, vmode);
 390   if (icode != CODE_FOR_nothing)
 391     {
 392       struct expand_operand ops[2];
 393       create_output_operand (&ops[0], NULL_RTX, vmode);
 394       create_input_operand (&ops[1], op, GET_MODE (op));
 395       expand_insn (icode, 2, ops);
 396       return ops[0].value;
 397     }
 398
 399   if (!GET_MODE_NUNITS (vmode).is_constant (&n))
 400     return NULL;
 401
 402   /* ??? If the target doesn't have a vec_init, then we have no easy way
 403      of performing this operation.  Most of this sort of generic support
 404      is hidden away in the vector lowering support in gimple.  */
 405   icode = convert_optab_handler (vec_init_optab, vmode,
 406                                  GET_MODE_INNER (vmode));
 407   if (icode == CODE_FOR_nothing)
 408     return NULL;
 409
 410   vec = rtvec_alloc (n);
 411   for (int i = 0; i < n; ++i)
 412     RTVEC_ELT (vec, i) = op;
 413   rtx ret = gen_reg_rtx (vmode);
 414   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 415
 416   return ret;
 417 }
 418
 419 /* This subroutine of expand_doubleword_shift handles the cases in which
 420    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 421    value are the same as for the parent routine, except that SUPERWORD_OP1
 422    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 423    INTO_TARGET may be null if the caller has decided to calculate it.  */
 424
 425 static bool
 426 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 427                         rtx outof_target, rtx into_target,
 428                         int unsignedp, enum optab_methods methods)
 429 {
 430   if (into_target != 0)
 431     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 432                              into_target, unsignedp, methods))
 433       return false;
 434
 435   if (outof_target != 0)
 436     {
 437       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 438          of the sign bit, otherwise we must fill it with zeros.  */
 439       if (binoptab != ashr_optab)
 440         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 441       else
 442         if (!force_expand_binop (word_mode, binoptab, outof_input,
 443                                  gen_int_shift_amount (word_mode,
 444                                                        BITS_PER_WORD - 1),
 445                                  outof_target, unsignedp, methods))
 446           return false;
 447     }
 448   return true;
 449 }
 450
 451 /* This subroutine of expand_doubleword_shift handles the cases in which
 452    the effective shift value is < BITS_PER_WORD.  The arguments and return
 453    value are the same as for the parent routine.  */
 454
 455 static bool
 456 expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
 457                       rtx outof_input, rtx into_input, rtx op1,
 458                       rtx outof_target, rtx into_target,
 459                       int unsignedp, enum optab_methods methods,
 460                       unsigned HOST_WIDE_INT shift_mask)
 461 {
 462   optab reverse_unsigned_shift, unsigned_shift;
 463   rtx tmp, carries;
 464
 465   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 466   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 467
 468   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 469      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 470      the opposite direction to BINOPTAB.  */
 471   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 472     {
 473       carries = outof_input;
 474       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 475                                             op1_mode), op1_mode);
 476       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 477                                    0, true, methods);
 478     }
 479   else
 480     {
 481       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 482          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 483          has unknown behavior.  Do a single shift first, then shift by the
 484          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 485          are truncated to the mode size.  */
 486       carries = expand_binop (word_mode, reverse_unsigned_shift,
 487                               outof_input, const1_rtx, 0, unsignedp, methods);
 488       if (shift_mask == BITS_PER_WORD - 1)
 489         {
 490           tmp = immed_wide_int_const
 491             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 492           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 493                                        0, true, methods);
 494         }
 495       else
 496         {
 497           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 498                                                 op1_mode), op1_mode);
 499           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 500                                        0, true, methods);
 501         }
 502     }
 503   if (tmp == 0 || carries == 0)
 504     return false;
 505   carries = expand_binop (word_mode, reverse_unsigned_shift,
 506                           carries, tmp, 0, unsignedp, methods);
 507   if (carries == 0)
 508     return false;
 509
 510   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 511      so the result can go directly into INTO_TARGET if convenient.  */
 512   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 513                       into_target, unsignedp, methods);
 514   if (tmp == 0)
 515     return false;
 516
 517   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 518   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 519                            into_target, unsignedp, methods))
 520     return false;
 521
 522   /* Use a standard word_mode shift for the out-of half.  */
 523   if (outof_target != 0)
 524     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 525                              outof_target, unsignedp, methods))
 526       return false;
 527
 528   return true;
 529 }
 530
 531
 532 /* Try implementing expand_doubleword_shift using conditional moves.
 533    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 534    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 535    are the shift counts to use in the former and latter case.  All other
 536    arguments are the same as the parent routine.  */
 537
 538 static bool
 539 expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
 540                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 541                                   rtx outof_input, rtx into_input,
 542                                   rtx subword_op1, rtx superword_op1,
 543                                   rtx outof_target, rtx into_target,
 544                                   int unsignedp, enum optab_methods methods,
 545                                   unsigned HOST_WIDE_INT shift_mask)
 546 {
 547   rtx outof_superword, into_superword;
 548
 549   /* Put the superword version of the output into OUTOF_SUPERWORD and
 550      INTO_SUPERWORD.  */
 551   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 552   if (outof_target != 0 && subword_op1 == superword_op1)
 553     {
 554       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 555          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 556       into_superword = outof_target;
 557       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 558                                    outof_superword, 0, unsignedp, methods))
 559         return false;
 560     }
 561   else
 562     {
 563       into_superword = gen_reg_rtx (word_mode);
 564       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 565                                    outof_superword, into_superword,
 566                                    unsignedp, methods))
 567         return false;
 568     }
 569
 570   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 571   if (!expand_subword_shift (op1_mode, binoptab,
 572                              outof_input, into_input, subword_op1,
 573                              outof_target, into_target,
 574                              unsignedp, methods, shift_mask))
 575     return false;
 576
 577   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 578      might be the current value of OUTOF_TARGET.  */
 579   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 580                               into_target, into_superword, word_mode, false))
 581     return false;
 582
 583   if (outof_target != 0)
 584     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 585                                 outof_target, outof_superword,
 586                                 word_mode, false))
 587       return false;
 588
 589   return true;
 590 }
 591
 592 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 593    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 594    input operand; the shift moves bits in the direction OUTOF_INPUT->
 595    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 596    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 597    If OP1 is constant, it will have been truncated as appropriate
 598    and is known to be nonzero.
 599
 600    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 601    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 602    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 603
 604    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 605    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 606    fill with zeros or sign bits as appropriate.
 607
 608    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 609    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 610    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 611    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 612    are undefined.
 613
 614    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
 615    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
 616    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
 617    function wants to calculate it itself.
 618
 619    Return true if the shift could be successfully synthesized.  */
 620
 621 static bool
 622 expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
 623                          rtx outof_input, rtx into_input, rtx op1,
 624                          rtx outof_target, rtx into_target,
 625                          int unsignedp, enum optab_methods methods,
 626                          unsigned HOST_WIDE_INT shift_mask)
 627 {
 628   rtx superword_op1, tmp, cmp1, cmp2;
 629   enum rtx_code cmp_code;
 630
 631   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
 632      fill the result with sign or zero bits as appropriate.  If so, the value
 633      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
 634      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
 635      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
 636
 637      This isn't worthwhile for constant shifts since the optimizers will
 638      cope better with in-range shift counts.  */
 639   if (shift_mask >= BITS_PER_WORD
 640       && outof_target != 0
 641       && !CONSTANT_P (op1))
 642     {
 643       if (!expand_doubleword_shift (op1_mode, binoptab,
 644                                     outof_input, into_input, op1,
 645                                     0, into_target,
 646                                     unsignedp, methods, shift_mask))
 647         return false;
 648       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 649                                outof_target, unsignedp, methods))
 650         return false;
 651       return true;
 652     }
 653
 654   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
 655      is true when the effective shift value is less than BITS_PER_WORD.
 656      Set SUPERWORD_OP1 to the shift count that should be used to shift
 657      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
 658   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
 659   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
 660     {
 661       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
 662          is a subword shift count.  */
 663       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
 664                                     0, true, methods);
 665       cmp2 = CONST0_RTX (op1_mode);
 666       cmp_code = EQ;
 667       superword_op1 = op1;
 668     }
 669   else
 670     {
 671       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
 672       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
 673                                     0, true, methods);
 674       cmp2 = CONST0_RTX (op1_mode);
 675       cmp_code = LT;
 676       superword_op1 = cmp1;
 677     }
 678   if (cmp1 == 0)
 679     return false;
 680
 681   /* If we can compute the condition at compile time, pick the
 682      appropriate subroutine.  */
 683   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
 684   if (tmp != 0 && CONST_INT_P (tmp))
 685     {
 686       if (tmp == const0_rtx)
 687         return expand_superword_shift (binoptab, outof_input, superword_op1,
 688                                        outof_target, into_target,
 689                                        unsignedp, methods);
 690       else
 691         return expand_subword_shift (op1_mode, binoptab,
 692                                      outof_input, into_input, op1,
 693                                      outof_target, into_target,
 694                                      unsignedp, methods, shift_mask);
 695     }
 696
 697   /* Try using conditional moves to generate straight-line code.  */
 698   if (HAVE_conditional_move)
 699     {
 700       rtx_insn *start = get_last_insn ();
 701       if (expand_doubleword_shift_condmove (op1_mode, binoptab,
 702                                             cmp_code, cmp1, cmp2,
 703                                             outof_input, into_input,
 704                                             op1, superword_op1,
 705                                             outof_target, into_target,
 706                                             unsignedp, methods, shift_mask))
 707         return true;
 708       delete_insns_since (start);
 709     }
 710
 711   /* As a last resort, use branches to select the correct alternative.  */
 712   rtx_code_label *subword_label = gen_label_rtx ();
 713   rtx_code_label *done_label = gen_label_rtx ();
 714
 715   NO_DEFER_POP;
 716   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
 717                            0, 0, subword_label,
 718                            profile_probability::uninitialized ());
 719   OK_DEFER_POP;
 720
 721   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 722                                outof_target, into_target,
 723                                unsignedp, methods))
 724     return false;
 725
 726   emit_jump_insn (targetm.gen_jump (done_label));
 727   emit_barrier ();
 728   emit_label (subword_label);
 729
 730   if (!expand_subword_shift (op1_mode, binoptab,
 731                              outof_input, into_input, op1,
 732                              outof_target, into_target,
 733                              unsignedp, methods, shift_mask))
 734     return false;
 735
 736   emit_label (done_label);
 737   return true;
 738 }
 739 \f
 740 /* Subroutine of expand_binop.  Perform a double word multiplication of
 741    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
 742    as the target's word_mode.  This function return NULL_RTX if anything
 743    goes wrong, in which case it may have already emitted instructions
 744    which need to be deleted.
 745
 746    If we want to multiply two two-word values and have normal and widening
 747    multiplies of single-word values, we can do this with three smaller
 748    multiplications.
 749
 750    The multiplication proceeds as follows:
 751                                  _______________________
 752                                 [__op0_high_|__op0_low__]
 753                                  _______________________
 754         *                       [__op1_high_|__op1_low__]
 755         _______________________________________________
 756                                  _______________________
 757     (1)                         [__op0_low__*__op1_low__]
 758                      _______________________
 759     (2a)            [__op0_low__*__op1_high_]
 760                      _______________________
 761     (2b)            [__op0_high_*__op1_low__]
 762          _______________________
 763     (3) [__op0_high_*__op1_high_]
 764
 765
 766   This gives a 4-word result.  Since we are only interested in the
 767   lower 2 words, partial result (3) and the upper words of (2a) and
 768   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
 769   calculated using non-widening multiplication.
 770
 771   (1), however, needs to be calculated with an unsigned widening
 772   multiplication.  If this operation is not directly supported we
 773   try using a signed widening multiplication and adjust the result.
 774   This adjustment works as follows:
 775
 776       If both operands are positive then no adjustment is needed.
 777
 778       If the operands have different signs, for example op0_low < 0 and
 779       op1_low >= 0, the instruction treats the most significant bit of
 780       op0_low as a sign bit instead of a bit with significance
 781       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
 782       with 2**BITS_PER_WORD - op0_low, and two's complements the
 783       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
 784       the result.
 785
 786       Similarly, if both operands are negative, we need to add
 787       (op0_low + op1_low) * 2**BITS_PER_WORD.
 788
 789       We use a trick to adjust quickly.  We logically shift op0_low right
 790       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
 791       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
 792       logical shift exists, we do an arithmetic right shift and subtract
 793       the 0 or -1.  */
 794
 795 static rtx
 796 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
 797                        bool umulp, enum optab_methods methods)
 798 {
 799   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
 800   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
 801   rtx wordm1 = (umulp ? NULL_RTX
 802                 : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
 803   rtx product, adjust, product_high, temp;
 804
 805   rtx op0_high = operand_subword_force (op0, high, mode);
 806   rtx op0_low = operand_subword_force (op0, low, mode);
 807   rtx op1_high = operand_subword_force (op1, high, mode);
 808   rtx op1_low = operand_subword_force (op1, low, mode);
 809
 810   /* If we're using an unsigned multiply to directly compute the product
 811      of the low-order words of the operands and perform any required
 812      adjustments of the operands, we begin by trying two more multiplications
 813      and then computing the appropriate sum.
 814
 815      We have checked above that the required addition is provided.
 816      Full-word addition will normally always succeed, especially if
 817      it is provided at all, so we don't worry about its failure.  The
 818      multiplication may well fail, however, so we do handle that.  */
 819
 820   if (!umulp)
 821     {
 822       /* ??? This could be done with emit_store_flag where available.  */
 823       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
 824                            NULL_RTX, 1, methods);
 825       if (temp)
 826         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
 827                                  NULL_RTX, 0, OPTAB_DIRECT);
 828       else
 829         {
 830           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
 831                                NULL_RTX, 0, methods);
 832           if (!temp)
 833             return NULL_RTX;
 834           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
 835                                    NULL_RTX, 0, OPTAB_DIRECT);
 836         }
 837
 838       if (!op0_high)
 839         return NULL_RTX;
 840     }
 841
 842   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
 843                          NULL_RTX, 0, OPTAB_DIRECT);
 844   if (!adjust)
 845     return NULL_RTX;
 846
 847   /* OP0_HIGH should now be dead.  */
 848
 849   if (!umulp)
 850     {
 851       /* ??? This could be done with emit_store_flag where available.  */
 852       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
 853                            NULL_RTX, 1, methods);
 854       if (temp)
 855         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
 856                                  NULL_RTX, 0, OPTAB_DIRECT);
 857       else
 858         {
 859           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
 860                                NULL_RTX, 0, methods);
 861           if (!temp)
 862             return NULL_RTX;
 863           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
 864                                    NULL_RTX, 0, OPTAB_DIRECT);
 865         }
 866
 867       if (!op1_high)
 868         return NULL_RTX;
 869     }
 870
 871   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
 872                        NULL_RTX, 0, OPTAB_DIRECT);
 873   if (!temp)
 874     return NULL_RTX;
 875
 876   /* OP1_HIGH should now be dead.  */
 877
 878   adjust = expand_binop (word_mode, add_optab, adjust, temp,
 879                          NULL_RTX, 0, OPTAB_DIRECT);
 880
 881   if (target && !REG_P (target))
 882     target = NULL_RTX;
 883
 884   /* *_widen_optab needs to determine operand mode, make sure at least
 885      one operand has non-VOID mode.  */
 886   if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
 887     op0_low = force_reg (word_mode, op0_low);
 888
 889   if (umulp)
 890     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
 891                             target, 1, OPTAB_DIRECT);
 892   else
 893     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
 894                             target, 1, OPTAB_DIRECT);
 895
 896   if (!product)
 897     return NULL_RTX;
 898
 899   product_high = operand_subword (product, high, 1, mode);
 900   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
 901                          NULL_RTX, 0, OPTAB_DIRECT);
 902   emit_move_insn (product_high, adjust);
 903   return product;
 904 }
 905 \f
 906 /* Wrapper around expand_binop which takes an rtx code to specify
 907    the operation to perform, not an optab pointer.  All other
 908    arguments are the same.  */
 909 rtx
 910 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
 911                      rtx op1, rtx target, int unsignedp,
 912                      enum optab_methods methods)
 913 {
 914   optab binop = code_to_optab (code);
 915   gcc_assert (binop);
 916
 917   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
 918 }
 919
 920 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
 921    binop.  Order them according to commutative_operand_precedence and, if
 922    possible, try to put TARGET or a pseudo first.  */
 923 static bool
 924 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
 925 {
 926   int op0_prec = commutative_operand_precedence (op0);
 927   int op1_prec = commutative_operand_precedence (op1);
 928
 929   if (op0_prec < op1_prec)
 930     return true;
 931
 932   if (op0_prec > op1_prec)
 933     return false;
 934
 935   /* With equal precedence, both orders are ok, but it is better if the
 936      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
 937   if (target == 0 || REG_P (target))
 938     return (REG_P (op1) && !REG_P (op0)) || target == op1;
 939   else
 940     return rtx_equal_p (op1, target);
 941 }
 942
 943 /* Return true if BINOPTAB implements a shift operation.  */
 944
 945 static bool
 946 shift_optab_p (optab binoptab)
 947 {
 948   switch (optab_to_code (binoptab))
 949     {
 950     case ASHIFT:
 951     case SS_ASHIFT:
 952     case US_ASHIFT:
 953     case ASHIFTRT:
 954     case LSHIFTRT:
 955     case ROTATE:
 956     case ROTATERT:
 957       return true;
 958
 959     default:
 960       return false;
 961     }
 962 }
 963
 964 /* Return true if BINOPTAB implements a commutative binary operation.  */
 965
 966 static bool
 967 commutative_optab_p (optab binoptab)
 968 {
 969   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
 970           || binoptab == smul_widen_optab
 971           || binoptab == umul_widen_optab
 972           || binoptab == smul_highpart_optab
 973           || binoptab == umul_highpart_optab);
 974 }
 975
 976 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
 977    optimizing, and if the operand is a constant that costs more than
 978    1 instruction, force the constant into a register and return that
 979    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
 980
 981 static rtx
 982 avoid_expensive_constant (machine_mode mode, optab binoptab,
 983                           int opn, rtx x, bool unsignedp)
 984 {
 985   bool speed = optimize_insn_for_speed_p ();
 986
 987   if (mode != VOIDmode
 988       && optimize
 989       && CONSTANT_P (x)
 990       && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
 991           > set_src_cost (x, mode, speed)))
 992     {
 993       if (CONST_INT_P (x))
 994         {
 995           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
 996           if (intval != INTVAL (x))
 997             x = GEN_INT (intval);
 998         }
 999       else
1000         x = convert_modes (mode, VOIDmode, x, unsignedp);
1001       x = force_reg (mode, x);
1002     }
1003   return x;
1004 }
1005
1006 /* Helper function for expand_binop: handle the case where there
1007    is an insn ICODE that directly implements the indicated operation.
1008    Returns null if this is not possible.  */
1009 static rtx
1010 expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
1011                        rtx op0, rtx op1,
1012                        rtx target, int unsignedp, enum optab_methods methods,
1013                        rtx_insn *last)
1014 {
1015   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1016   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1017   machine_mode mode0, mode1, tmp_mode;
1018   struct expand_operand ops[3];
1019   bool commutative_p;
1020   rtx_insn *pat;
1021   rtx xop0 = op0, xop1 = op1;
1022   bool canonicalize_op1 = false;
1023
1024   /* If it is a commutative operator and the modes would match
1025      if we would swap the operands, we can save the conversions.  */
1026   commutative_p = commutative_optab_p (binoptab);
1027   if (commutative_p
1028       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1029       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1030     std::swap (xop0, xop1);
1031
1032   /* If we are optimizing, force expensive constants into a register.  */
1033   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1034   if (!shift_optab_p (binoptab))
1035     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1036   else
1037     /* Shifts and rotates often use a different mode for op1 from op0;
1038        for VOIDmode constants we don't know the mode, so force it
1039        to be canonicalized using convert_modes.  */
1040     canonicalize_op1 = true;
1041
1042   /* In case the insn wants input operands in modes different from
1043      those of the actual operands, convert the operands.  It would
1044      seem that we don't need to convert CONST_INTs, but we do, so
1045      that they're properly zero-extended, sign-extended or truncated
1046      for their mode.  */
1047
1048   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1049   if (xmode0 != VOIDmode && xmode0 != mode0)
1050     {
1051       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1052       mode0 = xmode0;
1053     }
1054
1055   mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
1056            ? GET_MODE (xop1) : mode);
1057   if (xmode1 != VOIDmode && xmode1 != mode1)
1058     {
1059       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1060       mode1 = xmode1;
1061     }
1062
1063   /* If operation is commutative,
1064      try to make the first operand a register.
1065      Even better, try to make it the same as the target.
1066      Also try to make the last operand a constant.  */
1067   if (commutative_p
1068       && swap_commutative_operands_with_target (target, xop0, xop1))
1069     std::swap (xop0, xop1);
1070
1071   /* Now, if insn's predicates don't allow our operands, put them into
1072      pseudo regs.  */
1073
1074   if (binoptab == vec_pack_trunc_optab
1075       || binoptab == vec_pack_usat_optab
1076       || binoptab == vec_pack_ssat_optab
1077       || binoptab == vec_pack_ufix_trunc_optab
1078       || binoptab == vec_pack_sfix_trunc_optab
1079       || binoptab == vec_packu_float_optab
1080       || binoptab == vec_packs_float_optab)
1081     {
1082       /* The mode of the result is different then the mode of the
1083          arguments.  */
1084       tmp_mode = insn_data[(int) icode].operand[0].mode;
1085       if (VECTOR_MODE_P (mode)
1086           && maybe_ne (GET_MODE_NUNITS (tmp_mode), 2 * GET_MODE_NUNITS (mode)))
1087         {
1088           delete_insns_since (last);
1089           return NULL_RTX;
1090         }
1091     }
1092   else
1093     tmp_mode = mode;
1094
1095   create_output_operand (&ops[0], target, tmp_mode);
1096   create_input_operand (&ops[1], xop0, mode0);
1097   create_input_operand (&ops[2], xop1, mode1);
1098   pat = maybe_gen_insn (icode, 3, ops);
1099   if (pat)
1100     {
1101       /* If PAT is composed of more than one insn, try to add an appropriate
1102          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1103          operand, call expand_binop again, this time without a target.  */
1104       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1105           && ! add_equal_note (pat, ops[0].value,
1106                                optab_to_code (binoptab),
1107                                ops[1].value, ops[2].value))
1108         {
1109           delete_insns_since (last);
1110           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1111                                unsignedp, methods);
1112         }
1113
1114       emit_insn (pat);
1115       return ops[0].value;
1116     }
1117   delete_insns_since (last);
1118   return NULL_RTX;
1119 }
1120
1121 /* Generate code to perform an operation specified by BINOPTAB
1122    on operands OP0 and OP1, with result having machine-mode MODE.
1123
1124    UNSIGNEDP is for the case where we have to widen the operands
1125    to perform the operation.  It says to use zero-extension.
1126
1127    If TARGET is nonzero, the value
1128    is generated there, if it is convenient to do so.
1129    In all cases an rtx is returned for the locus of the value;
1130    this may or may not be TARGET.  */
1131
1132 rtx
1133 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1134               rtx target, int unsignedp, enum optab_methods methods)
1135 {
1136   enum optab_methods next_methods
1137     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1138        ? OPTAB_WIDEN : methods);
1139   enum mode_class mclass;
1140   enum insn_code icode;
1141   machine_mode wider_mode;
1142   scalar_int_mode int_mode;
1143   rtx libfunc;
1144   rtx temp;
1145   rtx_insn *entry_last = get_last_insn ();
1146   rtx_insn *last;
1147
1148   mclass = GET_MODE_CLASS (mode);
1149
1150   /* If subtracting an integer constant, convert this into an addition of
1151      the negated constant.  */
1152
1153   if (binoptab == sub_optab && CONST_INT_P (op1))
1154     {
1155       op1 = negate_rtx (mode, op1);
1156       binoptab = add_optab;
1157     }
1158   /* For shifts, constant invalid op1 might be expanded from different
1159      mode than MODE.  As those are invalid, force them to a register
1160      to avoid further problems during expansion.  */
1161   else if (CONST_INT_P (op1)
1162            && shift_optab_p (binoptab)
1163            && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
1164     {
1165       op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
1166       op1 = force_reg (GET_MODE_INNER (mode), op1);
1167     }
1168
1169   /* Record where to delete back to if we backtrack.  */
1170   last = get_last_insn ();
1171
1172   /* If we can do it with a three-operand insn, do so.  */
1173
1174   if (methods != OPTAB_MUST_WIDEN)
1175     {
1176       if (convert_optab_p (binoptab))
1177         {
1178           machine_mode from_mode = widened_mode (mode, op0, op1);
1179           icode = find_widening_optab_handler (binoptab, mode, from_mode);
1180         }
1181       else
1182         icode = optab_handler (binoptab, mode);
1183       if (icode != CODE_FOR_nothing)
1184         {
1185           temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
1186                                         target, unsignedp, methods, last);
1187           if (temp)
1188             return temp;
1189         }
1190     }
1191
1192   /* If we were trying to rotate, and that didn't work, try rotating
1193      the other direction before falling back to shifts and bitwise-or.  */
1194   if (((binoptab == rotl_optab
1195         && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
1196        || (binoptab == rotr_optab
1197            && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
1198       && is_int_mode (mode, &int_mode))
1199     {
1200       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1201       rtx newop1;
1202       unsigned int bits = GET_MODE_PRECISION (int_mode);
1203
1204       if (CONST_INT_P (op1))
1205         newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
1206       else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
1207         newop1 = negate_rtx (GET_MODE (op1), op1);
1208       else
1209         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1210                                gen_int_mode (bits, GET_MODE (op1)), op1,
1211                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1212
1213       temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
1214                                     target, unsignedp, methods, last);
1215       if (temp)
1216         return temp;
1217     }
1218
1219   /* If this is a multiply, see if we can do a widening operation that
1220      takes operands of this mode and makes a wider mode.  */
1221
1222   if (binoptab == smul_optab
1223       && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
1224       && (convert_optab_handler ((unsignedp
1225                                   ? umul_widen_optab
1226                                   : smul_widen_optab),
1227                                  wider_mode, mode) != CODE_FOR_nothing))
1228     {
1229       /* *_widen_optab needs to determine operand mode, make sure at least
1230          one operand has non-VOID mode.  */
1231       if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
1232         op0 = force_reg (mode, op0);
1233       temp = expand_binop (wider_mode,
1234                            unsignedp ? umul_widen_optab : smul_widen_optab,
1235                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1236
1237       if (temp != 0)
1238         {
1239           if (GET_MODE_CLASS (mode) == MODE_INT
1240               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1241             return gen_lowpart (mode, temp);
1242           else
1243             return convert_to_mode (mode, temp, unsignedp);
1244         }
1245     }
1246
1247   /* If this is a vector shift by a scalar, see if we can do a vector
1248      shift by a vector.  If so, broadcast the scalar into a vector.  */
1249   if (mclass == MODE_VECTOR_INT)
1250     {
1251       optab otheroptab = unknown_optab;
1252
1253       if (binoptab == ashl_optab)
1254         otheroptab = vashl_optab;
1255       else if (binoptab == ashr_optab)
1256         otheroptab = vashr_optab;
1257       else if (binoptab == lshr_optab)
1258         otheroptab = vlshr_optab;
1259       else if (binoptab == rotl_optab)
1260         otheroptab = vrotl_optab;
1261       else if (binoptab == rotr_optab)
1262         otheroptab = vrotr_optab;
1263
1264       if (otheroptab
1265           && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
1266         {
1267           /* The scalar may have been extended to be too wide.  Truncate
1268              it back to the proper size to fit in the broadcast vector.  */
1269           scalar_mode inner_mode = GET_MODE_INNER (mode);
1270           if (!CONST_INT_P (op1)
1271               && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
1272                   > GET_MODE_BITSIZE (inner_mode)))
1273             op1 = force_reg (inner_mode,
1274                              simplify_gen_unary (TRUNCATE, inner_mode, op1,
1275                                                  GET_MODE (op1)));
1276           rtx vop1 = expand_vector_broadcast (mode, op1);
1277           if (vop1)
1278             {
1279               temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
1280                                             target, unsignedp, methods, last);
1281               if (temp)
1282                 return temp;
1283             }
1284         }
1285     }
1286
1287   /* Look for a wider mode of the same class for which we think we
1288      can open-code the operation.  Check for a widening multiply at the
1289      wider mode as well.  */
1290
1291   if (CLASS_HAS_WIDER_MODES_P (mclass)
1292       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1293     FOR_EACH_WIDER_MODE (wider_mode, mode)
1294       {
1295         machine_mode next_mode;
1296         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1297             || (binoptab == smul_optab
1298                 && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
1299                 && (find_widening_optab_handler ((unsignedp
1300                                                   ? umul_widen_optab
1301                                                   : smul_widen_optab),
1302                                                  next_mode, mode)
1303                     != CODE_FOR_nothing)))
1304           {
1305             rtx xop0 = op0, xop1 = op1;
1306             int no_extend = 0;
1307
1308             /* For certain integer operations, we need not actually extend
1309                the narrow operands, as long as we will truncate
1310                the results to the same narrowness.  */
1311
1312             if ((binoptab == ior_optab || binoptab == and_optab
1313                  || binoptab == xor_optab
1314                  || binoptab == add_optab || binoptab == sub_optab
1315                  || binoptab == smul_optab || binoptab == ashl_optab)
1316                 && mclass == MODE_INT)
1317               {
1318                 no_extend = 1;
1319                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1320                                                  xop0, unsignedp);
1321                 if (binoptab != ashl_optab)
1322                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1323                                                    xop1, unsignedp);
1324               }
1325
1326             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1327
1328             /* The second operand of a shift must always be extended.  */
1329             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1330                                   no_extend && binoptab != ashl_optab);
1331
1332             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1333                                  unsignedp, OPTAB_DIRECT);
1334             if (temp)
1335               {
1336                 if (mclass != MODE_INT
1337                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1338                   {
1339                     if (target == 0)
1340                       target = gen_reg_rtx (mode);
1341                     convert_move (target, temp, 0);
1342                     return target;
1343                   }
1344                 else
1345                   return gen_lowpart (mode, temp);
1346               }
1347             else
1348               delete_insns_since (last);
1349           }
1350       }
1351
1352   /* If operation is commutative,
1353      try to make the first operand a register.
1354      Even better, try to make it the same as the target.
1355      Also try to make the last operand a constant.  */
1356   if (commutative_optab_p (binoptab)
1357       && swap_commutative_operands_with_target (target, op0, op1))
1358     std::swap (op0, op1);
1359
1360   /* These can be done a word at a time.  */
1361   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1362       && is_int_mode (mode, &int_mode)
1363       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
1364       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1365     {
1366       int i;
1367       rtx_insn *insns;
1368
1369       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1370          won't be accurate, so use a new target.  */
1371       if (target == 0
1372           || target == op0
1373           || target == op1
1374           || !valid_multiword_target_p (target))
1375         target = gen_reg_rtx (int_mode);
1376
1377       start_sequence ();
1378
1379       /* Do the actual arithmetic.  */
1380       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
1381         {
1382           rtx target_piece = operand_subword (target, i, 1, int_mode);
1383           rtx x = expand_binop (word_mode, binoptab,
1384                                 operand_subword_force (op0, i, int_mode),
1385                                 operand_subword_force (op1, i, int_mode),
1386                                 target_piece, unsignedp, next_methods);
1387
1388           if (x == 0)
1389             break;
1390
1391           if (target_piece != x)
1392             emit_move_insn (target_piece, x);
1393         }
1394
1395       insns = get_insns ();
1396       end_sequence ();
1397
1398       if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
1399         {
1400           emit_insn (insns);
1401           return target;
1402         }
1403     }
1404
1405   /* Synthesize double word shifts from single word shifts.  */
1406   if ((binoptab == lshr_optab || binoptab == ashl_optab
1407        || binoptab == ashr_optab)
1408       && is_int_mode (mode, &int_mode)
1409       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1410       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1411       && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
1412       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1413       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1414       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1415     {
1416       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1417       scalar_int_mode op1_mode;
1418
1419       double_shift_mask = targetm.shift_truncation_mask (int_mode);
1420       shift_mask = targetm.shift_truncation_mask (word_mode);
1421       op1_mode = (GET_MODE (op1) != VOIDmode
1422                   ? as_a <scalar_int_mode> (GET_MODE (op1))
1423                   : word_mode);
1424
1425       /* Apply the truncation to constant shifts.  */
1426       if (double_shift_mask > 0 && CONST_INT_P (op1))
1427         op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);
1428
1429       if (op1 == CONST0_RTX (op1_mode))
1430         return op0;
1431
1432       /* Make sure that this is a combination that expand_doubleword_shift
1433          can handle.  See the comments there for details.  */
1434       if (double_shift_mask == 0
1435           || (shift_mask == BITS_PER_WORD - 1
1436               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1437         {
1438           rtx_insn *insns;
1439           rtx into_target, outof_target;
1440           rtx into_input, outof_input;
1441           int left_shift, outof_word;
1442
1443           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1444              won't be accurate, so use a new target.  */
1445           if (target == 0
1446               || target == op0
1447               || target == op1
1448               || !valid_multiword_target_p (target))
1449             target = gen_reg_rtx (int_mode);
1450
1451           start_sequence ();
1452
1453           /* OUTOF_* is the word we are shifting bits away from, and
1454              INTO_* is the word that we are shifting bits towards, thus
1455              they differ depending on the direction of the shift and
1456              WORDS_BIG_ENDIAN.  */
1457
1458           left_shift = binoptab == ashl_optab;
1459           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1460
1461           outof_target = operand_subword (target, outof_word, 1, int_mode);
1462           into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1463
1464           outof_input = operand_subword_force (op0, outof_word, int_mode);
1465           into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1466
1467           if (expand_doubleword_shift (op1_mode, binoptab,
1468                                        outof_input, into_input, op1,
1469                                        outof_target, into_target,
1470                                        unsignedp, next_methods, shift_mask))
1471             {
1472               insns = get_insns ();
1473               end_sequence ();
1474
1475               emit_insn (insns);
1476               return target;
1477             }
1478           end_sequence ();
1479         }
1480     }
1481
1482   /* Synthesize double word rotates from single word shifts.  */
1483   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1484       && is_int_mode (mode, &int_mode)
1485       && CONST_INT_P (op1)
1486       && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
1487       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1488       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1489     {
1490       rtx_insn *insns;
1491       rtx into_target, outof_target;
1492       rtx into_input, outof_input;
1493       rtx inter;
1494       int shift_count, left_shift, outof_word;
1495
1496       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1497          won't be accurate, so use a new target. Do this also if target is not
1498          a REG, first because having a register instead may open optimization
1499          opportunities, and second because if target and op0 happen to be MEMs
1500          designating the same location, we would risk clobbering it too early
1501          in the code sequence we generate below.  */
1502       if (target == 0
1503           || target == op0
1504           || target == op1
1505           || !REG_P (target)
1506           || !valid_multiword_target_p (target))
1507         target = gen_reg_rtx (int_mode);
1508
1509       start_sequence ();
1510
1511       shift_count = INTVAL (op1);
1512
1513       /* OUTOF_* is the word we are shifting bits away from, and
1514          INTO_* is the word that we are shifting bits towards, thus
1515          they differ depending on the direction of the shift and
1516          WORDS_BIG_ENDIAN.  */
1517
1518       left_shift = (binoptab == rotl_optab);
1519       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1520
1521       outof_target = operand_subword (target, outof_word, 1, int_mode);
1522       into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1523
1524       outof_input = operand_subword_force (op0, outof_word, int_mode);
1525       into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1526
1527       if (shift_count == BITS_PER_WORD)
1528         {
1529           /* This is just a word swap.  */
1530           emit_move_insn (outof_target, into_input);
1531           emit_move_insn (into_target, outof_input);
1532           inter = const0_rtx;
1533         }
1534       else
1535         {
1536           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1537           HOST_WIDE_INT first_shift_count, second_shift_count;
1538           optab reverse_unsigned_shift, unsigned_shift;
1539
1540           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1541                                     ? lshr_optab : ashl_optab);
1542
1543           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1544                             ? ashl_optab : lshr_optab);
1545
1546           if (shift_count > BITS_PER_WORD)
1547             {
1548               first_shift_count = shift_count - BITS_PER_WORD;
1549               second_shift_count = 2 * BITS_PER_WORD - shift_count;
1550             }
1551           else
1552             {
1553               first_shift_count = BITS_PER_WORD - shift_count;
1554               second_shift_count = shift_count;
1555             }
1556           rtx first_shift_count_rtx
1557             = gen_int_shift_amount (word_mode, first_shift_count);
1558           rtx second_shift_count_rtx
1559             = gen_int_shift_amount (word_mode, second_shift_count);
1560
1561           into_temp1 = expand_binop (word_mode, unsigned_shift,
1562                                      outof_input, first_shift_count_rtx,
1563                                      NULL_RTX, unsignedp, next_methods);
1564           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1565                                      into_input, second_shift_count_rtx,
1566                                      NULL_RTX, unsignedp, next_methods);
1567
1568           if (into_temp1 != 0 && into_temp2 != 0)
1569             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1570                                   into_target, unsignedp, next_methods);
1571           else
1572             inter = 0;
1573
1574           if (inter != 0 && inter != into_target)
1575             emit_move_insn (into_target, inter);
1576
1577           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1578                                       into_input, first_shift_count_rtx,
1579                                       NULL_RTX, unsignedp, next_methods);
1580           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1581                                       outof_input, second_shift_count_rtx,
1582                                       NULL_RTX, unsignedp, next_methods);
1583
1584           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1585             inter = expand_binop (word_mode, ior_optab,
1586                                   outof_temp1, outof_temp2,
1587                                   outof_target, unsignedp, next_methods);
1588
1589           if (inter != 0 && inter != outof_target)
1590             emit_move_insn (outof_target, inter);
1591         }
1592
1593       insns = get_insns ();
1594       end_sequence ();
1595
1596       if (inter != 0)
1597         {
1598           emit_insn (insns);
1599           return target;
1600         }
1601     }
1602
1603   /* These can be done a word at a time by propagating carries.  */
1604   if ((binoptab == add_optab || binoptab == sub_optab)
1605       && is_int_mode (mode, &int_mode)
1606       && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
1607       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1608     {
1609       unsigned int i;
1610       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1611       const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
1612       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1613       rtx xop0, xop1, xtarget;
1614
1615       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1616          value is one of those, use it.  Otherwise, use 1 since it is the
1617          one easiest to get.  */
1618 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1619       int normalizep = STORE_FLAG_VALUE;
1620 #else
1621       int normalizep = 1;
1622 #endif
1623
1624       /* Prepare the operands.  */
1625       xop0 = force_reg (int_mode, op0);
1626       xop1 = force_reg (int_mode, op1);
1627
1628       xtarget = gen_reg_rtx (int_mode);
1629
1630       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1631         target = xtarget;
1632
1633       /* Indicate for flow that the entire target reg is being set.  */
1634       if (REG_P (target))
1635         emit_clobber (xtarget);
1636
1637       /* Do the actual arithmetic.  */
1638       for (i = 0; i < nwords; i++)
1639         {
1640           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1641           rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
1642           rtx op0_piece = operand_subword_force (xop0, index, int_mode);
1643           rtx op1_piece = operand_subword_force (xop1, index, int_mode);
1644           rtx x;
1645
1646           /* Main add/subtract of the input operands.  */
1647           x = expand_binop (word_mode, binoptab,
1648                             op0_piece, op1_piece,
1649                             target_piece, unsignedp, next_methods);
1650           if (x == 0)
1651             break;
1652
1653           if (i + 1 < nwords)
1654             {
1655               /* Store carry from main add/subtract.  */
1656               carry_out = gen_reg_rtx (word_mode);
1657               carry_out = emit_store_flag_force (carry_out,
1658                                                  (binoptab == add_optab
1659                                                   ? LT : GT),
1660                                                  x, op0_piece,
1661                                                  word_mode, 1, normalizep);
1662             }
1663
1664           if (i > 0)
1665             {
1666               rtx newx;
1667
1668               /* Add/subtract previous carry to main result.  */
1669               newx = expand_binop (word_mode,
1670                                    normalizep == 1 ? binoptab : otheroptab,
1671                                    x, carry_in,
1672                                    NULL_RTX, 1, next_methods);
1673
1674               if (i + 1 < nwords)
1675                 {
1676                   /* Get out carry from adding/subtracting carry in.  */
1677                   rtx carry_tmp = gen_reg_rtx (word_mode);
1678                   carry_tmp = emit_store_flag_force (carry_tmp,
1679                                                      (binoptab == add_optab
1680                                                       ? LT : GT),
1681                                                      newx, x,
1682                                                      word_mode, 1, normalizep);
1683
1684                   /* Logical-ior the two poss. carry together.  */
1685                   carry_out = expand_binop (word_mode, ior_optab,
1686                                             carry_out, carry_tmp,
1687                                             carry_out, 0, next_methods);
1688                   if (carry_out == 0)
1689                     break;
1690                 }
1691               emit_move_insn (target_piece, newx);
1692             }
1693           else
1694             {
1695               if (x != target_piece)
1696                 emit_move_insn (target_piece, x);
1697             }
1698
1699           carry_in = carry_out;
1700         }
1701
1702       if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
1703         {
1704           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
1705               || ! rtx_equal_p (target, xtarget))
1706             {
1707               rtx_insn *temp = emit_move_insn (target, xtarget);
1708
1709               set_dst_reg_note (temp, REG_EQUAL,
1710                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
1711                                                 int_mode, copy_rtx (xop0),
1712                                                 copy_rtx (xop1)),
1713                                 target);
1714             }
1715           else
1716             target = xtarget;
1717
1718           return target;
1719         }
1720
1721       else
1722         delete_insns_since (last);
1723     }
1724
1725   /* Attempt to synthesize double word multiplies using a sequence of word
1726      mode multiplications.  We first attempt to generate a sequence using a
1727      more efficient unsigned widening multiply, and if that fails we then
1728      try using a signed widening multiply.  */
1729
1730   if (binoptab == smul_optab
1731       && is_int_mode (mode, &int_mode)
1732       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1733       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1734       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1735     {
1736       rtx product = NULL_RTX;
1737       if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
1738           != CODE_FOR_nothing)
1739         {
1740           product = expand_doubleword_mult (int_mode, op0, op1, target,
1741                                             true, methods);
1742           if (!product)
1743             delete_insns_since (last);
1744         }
1745
1746       if (product == NULL_RTX
1747           && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
1748               != CODE_FOR_nothing))
1749         {
1750           product = expand_doubleword_mult (int_mode, op0, op1, target,
1751                                             false, methods);
1752           if (!product)
1753             delete_insns_since (last);
1754         }
1755
1756       if (product != NULL_RTX)
1757         {
1758           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1759             {
1760               rtx_insn *move = emit_move_insn (target ? target : product,
1761                                                product);
1762               set_dst_reg_note (move,
1763                                 REG_EQUAL,
1764                                 gen_rtx_fmt_ee (MULT, int_mode,
1765                                                 copy_rtx (op0),
1766                                                 copy_rtx (op1)),
1767                                 target ? target : product);
1768             }
1769           return product;
1770         }
1771     }
1772
1773   /* It can't be open-coded in this mode.
1774      Use a library call if one is available and caller says that's ok.  */
1775
1776   libfunc = optab_libfunc (binoptab, mode);
1777   if (libfunc
1778       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1779     {
1780       rtx_insn *insns;
1781       rtx op1x = op1;
1782       machine_mode op1_mode = mode;
1783       rtx value;
1784
1785       start_sequence ();
1786
1787       if (shift_optab_p (binoptab))
1788         {
1789           op1_mode = targetm.libgcc_shift_count_mode ();
1790           /* Specify unsigned here,
1791              since negative shift counts are meaningless.  */
1792           op1x = convert_to_mode (op1_mode, op1, 1);
1793         }
1794
1795       if (GET_MODE (op0) != VOIDmode
1796           && GET_MODE (op0) != mode)
1797         op0 = convert_to_mode (mode, op0, unsignedp);
1798
1799       /* Pass 1 for NO_QUEUE so we don't lose any increments
1800          if the libcall is cse'd or moved.  */
1801       value = emit_library_call_value (libfunc,
1802                                        NULL_RTX, LCT_CONST, mode,
1803                                        op0, mode, op1x, op1_mode);
1804
1805       insns = get_insns ();
1806       end_sequence ();
1807
1808       bool trapv = trapv_binoptab_p (binoptab);
1809       target = gen_reg_rtx (mode);
1810       emit_libcall_block_1 (insns, target, value,
1811                             trapv ? NULL_RTX
1812                             : gen_rtx_fmt_ee (optab_to_code (binoptab),
1813                                               mode, op0, op1), trapv);
1814
1815       return target;
1816     }
1817
1818   delete_insns_since (last);
1819
1820   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1821
1822   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1823          || methods == OPTAB_MUST_WIDEN))
1824     {
1825       /* Caller says, don't even try.  */
1826       delete_insns_since (entry_last);
1827       return 0;
1828     }
1829
1830   /* Compute the value of METHODS to pass to recursive calls.
1831      Don't allow widening to be tried recursively.  */
1832
1833   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1834
1835   /* Look for a wider mode of the same class for which it appears we can do
1836      the operation.  */
1837
1838   if (CLASS_HAS_WIDER_MODES_P (mclass))
1839     {
1840       /* This code doesn't make sense for conversion optabs, since we
1841          wouldn't then want to extend the operands to be the same size
1842          as the result.  */
1843       gcc_assert (!convert_optab_p (binoptab));
1844       FOR_EACH_WIDER_MODE (wider_mode, mode)
1845         {
1846           if (optab_handler (binoptab, wider_mode)
1847               || (methods == OPTAB_LIB
1848                   && optab_libfunc (binoptab, wider_mode)))
1849             {
1850               rtx xop0 = op0, xop1 = op1;
1851               int no_extend = 0;
1852
1853               /* For certain integer operations, we need not actually extend
1854                  the narrow operands, as long as we will truncate
1855                  the results to the same narrowness.  */
1856
1857               if ((binoptab == ior_optab || binoptab == and_optab
1858                    || binoptab == xor_optab
1859                    || binoptab == add_optab || binoptab == sub_optab
1860                    || binoptab == smul_optab || binoptab == ashl_optab)
1861                   && mclass == MODE_INT)
1862                 no_extend = 1;
1863
1864               xop0 = widen_operand (xop0, wider_mode, mode,
1865                                     unsignedp, no_extend);
1866
1867               /* The second operand of a shift must always be extended.  */
1868               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1869                                     no_extend && binoptab != ashl_optab);
1870
1871               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1872                                    unsignedp, methods);
1873               if (temp)
1874                 {
1875                   if (mclass != MODE_INT
1876                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1877                     {
1878                       if (target == 0)
1879                         target = gen_reg_rtx (mode);
1880                       convert_move (target, temp, 0);
1881                       return target;
1882                     }
1883                   else
1884                     return gen_lowpart (mode, temp);
1885                 }
1886               else
1887                 delete_insns_since (last);
1888             }
1889         }
1890     }
1891
1892   delete_insns_since (entry_last);
1893   return 0;
1894 }
1895 \f
1896 /* Expand a binary operator which has both signed and unsigned forms.
1897    UOPTAB is the optab for unsigned operations, and SOPTAB is for
1898    signed operations.
1899
1900    If we widen unsigned operands, we may use a signed wider operation instead
1901    of an unsigned wider operation, since the result would be the same.  */
1902
1903 rtx
1904 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1905                    rtx op0, rtx op1, rtx target, int unsignedp,
1906                    enum optab_methods methods)
1907 {
1908   rtx temp;
1909   optab direct_optab = unsignedp ? uoptab : soptab;
1910   bool save_enable;
1911
1912   /* Do it without widening, if possible.  */
1913   temp = expand_binop (mode, direct_optab, op0, op1, target,
1914                        unsignedp, OPTAB_DIRECT);
1915   if (temp || methods == OPTAB_DIRECT)
1916     return temp;
1917
1918   /* Try widening to a signed int.  Disable any direct use of any
1919      signed insn in the current mode.  */
1920   save_enable = swap_optab_enable (soptab, mode, false);
1921
1922   temp = expand_binop (mode, soptab, op0, op1, target,
1923                        unsignedp, OPTAB_WIDEN);
1924
1925   /* For unsigned operands, try widening to an unsigned int.  */
1926   if (!temp && unsignedp)
1927     temp = expand_binop (mode, uoptab, op0, op1, target,
1928                          unsignedp, OPTAB_WIDEN);
1929   if (temp || methods == OPTAB_WIDEN)
1930     goto egress;
1931
1932   /* Use the right width libcall if that exists.  */
1933   temp = expand_binop (mode, direct_optab, op0, op1, target,
1934                        unsignedp, OPTAB_LIB);
1935   if (temp || methods == OPTAB_LIB)
1936     goto egress;
1937
1938   /* Must widen and use a libcall, use either signed or unsigned.  */
1939   temp = expand_binop (mode, soptab, op0, op1, target,
1940                        unsignedp, methods);
1941   if (!temp && unsignedp)
1942     temp = expand_binop (mode, uoptab, op0, op1, target,
1943                          unsignedp, methods);
1944
1945  egress:
1946   /* Undo the fiddling above.  */
1947   if (save_enable)
1948     swap_optab_enable (soptab, mode, true);
1949   return temp;
1950 }
1951 \f
1952 /* Generate code to perform an operation specified by UNOPPTAB
1953    on operand OP0, with two results to TARG0 and TARG1.
1954    We assume that the order of the operands for the instruction
1955    is TARG0, TARG1, OP0.
1956
1957    Either TARG0 or TARG1 may be zero, but what that means is that
1958    the result is not actually wanted.  We will generate it into
1959    a dummy pseudo-reg and discard it.  They may not both be zero.
1960
1961    Returns 1 if this operation can be performed; 0 if not.  */
1962
1963 int
1964 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1965                     int unsignedp)
1966 {
1967   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1968   enum mode_class mclass;
1969   machine_mode wider_mode;
1970   rtx_insn *entry_last = get_last_insn ();
1971   rtx_insn *last;
1972
1973   mclass = GET_MODE_CLASS (mode);
1974
1975   if (!targ0)
1976     targ0 = gen_reg_rtx (mode);
1977   if (!targ1)
1978     targ1 = gen_reg_rtx (mode);
1979
1980   /* Record where to go back to if we fail.  */
1981   last = get_last_insn ();
1982
1983   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1984     {
1985       struct expand_operand ops[3];
1986       enum insn_code icode = optab_handler (unoptab, mode);
1987
1988       create_fixed_operand (&ops[0], targ0);
1989       create_fixed_operand (&ops[1], targ1);
1990       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1991       if (maybe_expand_insn (icode, 3, ops))
1992         return 1;
1993     }
1994
1995   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1996
1997   if (CLASS_HAS_WIDER_MODES_P (mclass))
1998     {
1999       FOR_EACH_WIDER_MODE (wider_mode, mode)
2000         {
2001           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2002             {
2003               rtx t0 = gen_reg_rtx (wider_mode);
2004               rtx t1 = gen_reg_rtx (wider_mode);
2005               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2006
2007               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2008                 {
2009                   convert_move (targ0, t0, unsignedp);
2010                   convert_move (targ1, t1, unsignedp);
2011                   return 1;
2012                 }
2013               else
2014                 delete_insns_since (last);
2015             }
2016         }
2017     }
2018
2019   delete_insns_since (entry_last);
2020   return 0;
2021 }
2022 \f
2023 /* Generate code to perform an operation specified by BINOPTAB
2024    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2025    We assume that the order of the operands for the instruction
2026    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2027    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2028
2029    Either TARG0 or TARG1 may be zero, but what that means is that
2030    the result is not actually wanted.  We will generate it into
2031    a dummy pseudo-reg and discard it.  They may not both be zero.
2032
2033    Returns 1 if this operation can be performed; 0 if not.  */
2034
2035 int
2036 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2037                      int unsignedp)
2038 {
2039   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2040   enum mode_class mclass;
2041   machine_mode wider_mode;
2042   rtx_insn *entry_last = get_last_insn ();
2043   rtx_insn *last;
2044
2045   mclass = GET_MODE_CLASS (mode);
2046
2047   if (!targ0)
2048     targ0 = gen_reg_rtx (mode);
2049   if (!targ1)
2050     targ1 = gen_reg_rtx (mode);
2051
2052   /* Record where to go back to if we fail.  */
2053   last = get_last_insn ();
2054
2055   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2056     {
2057       struct expand_operand ops[4];
2058       enum insn_code icode = optab_handler (binoptab, mode);
2059       machine_mode mode0 = insn_data[icode].operand[1].mode;
2060       machine_mode mode1 = insn_data[icode].operand[2].mode;
2061       rtx xop0 = op0, xop1 = op1;
2062
2063       /* If we are optimizing, force expensive constants into a register.  */
2064       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2065       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2066
2067       create_fixed_operand (&ops[0], targ0);
2068       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2069       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2070       create_fixed_operand (&ops[3], targ1);
2071       if (maybe_expand_insn (icode, 4, ops))
2072         return 1;
2073       delete_insns_since (last);
2074     }
2075
2076   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2077
2078   if (CLASS_HAS_WIDER_MODES_P (mclass))
2079     {
2080       FOR_EACH_WIDER_MODE (wider_mode, mode)
2081         {
2082           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2083             {
2084               rtx t0 = gen_reg_rtx (wider_mode);
2085               rtx t1 = gen_reg_rtx (wider_mode);
2086               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2087               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2088
2089               if (expand_twoval_binop (binoptab, cop0, cop1,
2090                                        t0, t1, unsignedp))
2091                 {
2092                   convert_move (targ0, t0, unsignedp);
2093                   convert_move (targ1, t1, unsignedp);
2094                   return 1;
2095                 }
2096               else
2097                 delete_insns_since (last);
2098             }
2099         }
2100     }
2101
2102   delete_insns_since (entry_last);
2103   return 0;
2104 }
2105
2106 /* Expand the two-valued library call indicated by BINOPTAB, but
2107    preserve only one of the values.  If TARG0 is non-NULL, the first
2108    value is placed into TARG0; otherwise the second value is placed
2109    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2110    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2111    This routine assumes that the value returned by the library call is
2112    as if the return value was of an integral mode twice as wide as the
2113    mode of OP0.  Returns 1 if the call was successful.  */
2114
2115 bool
2116 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2117                              rtx targ0, rtx targ1, enum rtx_code code)
2118 {
2119   machine_mode mode;
2120   machine_mode libval_mode;
2121   rtx libval;
2122   rtx_insn *insns;
2123   rtx libfunc;
2124
2125   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2126   gcc_assert (!targ0 != !targ1);
2127
2128   mode = GET_MODE (op0);
2129   libfunc = optab_libfunc (binoptab, mode);
2130   if (!libfunc)
2131     return false;
2132
2133   /* The value returned by the library function will have twice as
2134      many bits as the nominal MODE.  */
2135   libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2136   start_sequence ();
2137   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2138                                     libval_mode,
2139                                     op0, mode,
2140                                     op1, mode);
2141   /* Get the part of VAL containing the value that we want.  */
2142   libval = simplify_gen_subreg (mode, libval, libval_mode,
2143                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2144   insns = get_insns ();
2145   end_sequence ();
2146   /* Move the into the desired location.  */
2147   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2148                       gen_rtx_fmt_ee (code, mode, op0, op1));
2149
2150   return true;
2151 }
2152
2153 \f
2154 /* Wrapper around expand_unop which takes an rtx code to specify
2155    the operation to perform, not an optab pointer.  All other
2156    arguments are the same.  */
2157 rtx
2158 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2159                     rtx target, int unsignedp)
2160 {
2161   optab unop = code_to_optab (code);
2162   gcc_assert (unop);
2163
2164   return expand_unop (mode, unop, op0, target, unsignedp);
2165 }
2166
2167 /* Try calculating
2168         (clz:narrow x)
2169    as
2170         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2171
2172    A similar operation can be used for clrsb.  UNOPTAB says which operation
2173    we are trying to expand.  */
2174 static rtx
2175 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2176 {
2177   opt_scalar_int_mode wider_mode_iter;
2178   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2179     {
2180       scalar_int_mode wider_mode = wider_mode_iter.require ();
2181       if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2182         {
2183           rtx xop0, temp;
2184           rtx_insn *last;
2185
2186           last = get_last_insn ();
2187
2188           if (target == 0)
2189             target = gen_reg_rtx (mode);
2190           xop0 = widen_operand (op0, wider_mode, mode,
2191                                 unoptab != clrsb_optab, false);
2192           temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2193                               unoptab != clrsb_optab);
2194           if (temp != 0)
2195             temp = expand_binop
2196               (wider_mode, sub_optab, temp,
2197                gen_int_mode (GET_MODE_PRECISION (wider_mode)
2198                              - GET_MODE_PRECISION (mode),
2199                              wider_mode),
2200                target, true, OPTAB_DIRECT);
2201           if (temp == 0)
2202             delete_insns_since (last);
2203
2204           return temp;
2205         }
2206     }
2207   return 0;
2208 }
2209
2210 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2211    quantities, choosing which based on whether the high word is nonzero.  */
2212 static rtx
2213 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2214 {
2215   rtx xop0 = force_reg (mode, op0);
2216   rtx subhi = gen_highpart (word_mode, xop0);
2217   rtx sublo = gen_lowpart (word_mode, xop0);
2218   rtx_code_label *hi0_label = gen_label_rtx ();
2219   rtx_code_label *after_label = gen_label_rtx ();
2220   rtx_insn *seq;
2221   rtx temp, result;
2222
2223   /* If we were not given a target, use a word_mode register, not a
2224      'mode' register.  The result will fit, and nobody is expecting
2225      anything bigger (the return type of __builtin_clz* is int).  */
2226   if (!target)
2227     target = gen_reg_rtx (word_mode);
2228
2229   /* In any case, write to a word_mode scratch in both branches of the
2230      conditional, so we can ensure there is a single move insn setting
2231      'target' to tag a REG_EQUAL note on.  */
2232   result = gen_reg_rtx (word_mode);
2233
2234   start_sequence ();
2235
2236   /* If the high word is not equal to zero,
2237      then clz of the full value is clz of the high word.  */
2238   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2239                            word_mode, true, hi0_label);
2240
2241   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2242   if (!temp)
2243     goto fail;
2244
2245   if (temp != result)
2246     convert_move (result, temp, true);
2247
2248   emit_jump_insn (targetm.gen_jump (after_label));
2249   emit_barrier ();
2250
2251   /* Else clz of the full value is clz of the low word plus the number
2252      of bits in the high word.  */
2253   emit_label (hi0_label);
2254
2255   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2256   if (!temp)
2257     goto fail;
2258   temp = expand_binop (word_mode, add_optab, temp,
2259                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2260                        result, true, OPTAB_DIRECT);
2261   if (!temp)
2262     goto fail;
2263   if (temp != result)
2264     convert_move (result, temp, true);
2265
2266   emit_label (after_label);
2267   convert_move (target, result, true);
2268
2269   seq = get_insns ();
2270   end_sequence ();
2271
2272   add_equal_note (seq, target, CLZ, xop0, 0);
2273   emit_insn (seq);
2274   return target;
2275
2276  fail:
2277   end_sequence ();
2278   return 0;
2279 }
2280
2281 /* Try calculating popcount of a double-word quantity as two popcount's of
2282    word-sized quantities and summing up the results.  */
2283 static rtx
2284 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2285 {
2286   rtx t0, t1, t;
2287   rtx_insn *seq;
2288
2289   start_sequence ();
2290
2291   t0 = expand_unop_direct (word_mode, popcount_optab,
2292                            operand_subword_force (op0, 0, mode), NULL_RTX,
2293                            true);
2294   t1 = expand_unop_direct (word_mode, popcount_optab,
2295                            operand_subword_force (op0, 1, mode), NULL_RTX,
2296                            true);
2297   if (!t0 || !t1)
2298     {
2299       end_sequence ();
2300       return NULL_RTX;
2301     }
2302
2303   /* If we were not given a target, use a word_mode register, not a
2304      'mode' register.  The result will fit, and nobody is expecting
2305      anything bigger (the return type of __builtin_popcount* is int).  */
2306   if (!target)
2307     target = gen_reg_rtx (word_mode);
2308
2309   t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2310
2311   seq = get_insns ();
2312   end_sequence ();
2313
2314   add_equal_note (seq, t, POPCOUNT, op0, 0);
2315   emit_insn (seq);
2316   return t;
2317 }
2318
2319 /* Try calculating
2320         (parity:wide x)
2321    as
2322         (parity:narrow (low (x) ^ high (x))) */
2323 static rtx
2324 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2325 {
2326   rtx t = expand_binop (word_mode, xor_optab,
2327                         operand_subword_force (op0, 0, mode),
2328                         operand_subword_force (op0, 1, mode),
2329                         NULL_RTX, 0, OPTAB_DIRECT);
2330   return expand_unop (word_mode, parity_optab, t, target, true);
2331 }
2332
2333 /* Try calculating
2334         (bswap:narrow x)
2335    as
2336         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2337 static rtx
2338 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2339 {
2340   rtx x;
2341   rtx_insn *last;
2342   opt_scalar_int_mode wider_mode_iter;
2343
2344   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2345     if (optab_handler (bswap_optab, wider_mode_iter.require ())
2346         != CODE_FOR_nothing)
2347       break;
2348
2349   if (!wider_mode_iter.exists ())
2350     return NULL_RTX;
2351
2352   scalar_int_mode wider_mode = wider_mode_iter.require ();
2353   last = get_last_insn ();
2354
2355   x = widen_operand (op0, wider_mode, mode, true, true);
2356   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2357
2358   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2359               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2360   if (x != 0)
2361     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2362                       GET_MODE_BITSIZE (wider_mode)
2363                       - GET_MODE_BITSIZE (mode),
2364                       NULL_RTX, true);
2365
2366   if (x != 0)
2367     {
2368       if (target == 0)
2369         target = gen_reg_rtx (mode);
2370       emit_move_insn (target, gen_lowpart (mode, x));
2371     }
2372   else
2373     delete_insns_since (last);
2374
2375   return target;
2376 }
2377
2378 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2379
2380 static rtx
2381 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2382 {
2383   rtx t0, t1;
2384
2385   t1 = expand_unop (word_mode, bswap_optab,
2386                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2387   t0 = expand_unop (word_mode, bswap_optab,
2388                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2389
2390   if (target == 0 || !valid_multiword_target_p (target))
2391     target = gen_reg_rtx (mode);
2392   if (REG_P (target))
2393     emit_clobber (target);
2394   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2395   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2396
2397   return target;
2398 }
2399
2400 /* Try calculating (parity x) as (and (popcount x) 1), where
2401    popcount can also be done in a wider mode.  */
2402 static rtx
2403 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2404 {
2405   enum mode_class mclass = GET_MODE_CLASS (mode);
2406   opt_scalar_int_mode wider_mode_iter;
2407   FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2408     {
2409       scalar_int_mode wider_mode = wider_mode_iter.require ();
2410       if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2411         {
2412           rtx xop0, temp;
2413           rtx_insn *last;
2414
2415           last = get_last_insn ();
2416
2417           if (target == 0 || GET_MODE (target) != wider_mode)
2418             target = gen_reg_rtx (wider_mode);
2419
2420           xop0 = widen_operand (op0, wider_mode, mode, true, false);
2421           temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2422                               true);
2423           if (temp != 0)
2424             temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2425                                  target, true, OPTAB_DIRECT);
2426
2427           if (temp)
2428             {
2429               if (mclass != MODE_INT
2430                   || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2431                 return convert_to_mode (mode, temp, 0);
2432               else
2433                 return gen_lowpart (mode, temp);
2434             }
2435           else
2436             delete_insns_since (last);
2437         }
2438     }
2439   return 0;
2440 }
2441
2442 /* Try calculating ctz(x) as K - clz(x & -x) ,
2443    where K is GET_MODE_PRECISION(mode) - 1.
2444
2445    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2446    don't have to worry about what the hardware does in that case.  (If
2447    the clz instruction produces the usual value at 0, which is K, the
2448    result of this code sequence will be -1; expand_ffs, below, relies
2449    on this.  It might be nice to have it be K instead, for consistency
2450    with the (very few) processors that provide a ctz with a defined
2451    value, but that would take one more instruction, and it would be
2452    less convenient for expand_ffs anyway.  */
2453
2454 static rtx
2455 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2456 {
2457   rtx_insn *seq;
2458   rtx temp;
2459
2460   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2461     return 0;
2462
2463   start_sequence ();
2464
2465   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2466   if (temp)
2467     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2468                          true, OPTAB_DIRECT);
2469   if (temp)
2470     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2471   if (temp)
2472     temp = expand_binop (mode, sub_optab,
2473                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2474                          temp, target,
2475                          true, OPTAB_DIRECT);
2476   if (temp == 0)
2477     {
2478       end_sequence ();
2479       return 0;
2480     }
2481
2482   seq = get_insns ();
2483   end_sequence ();
2484
2485   add_equal_note (seq, temp, CTZ, op0, 0);
2486   emit_insn (seq);
2487   return temp;
2488 }
2489
2490
2491 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2492    else with the sequence used by expand_clz.
2493
2494    The ffs builtin promises to return zero for a zero value and ctz/clz
2495    may have an undefined value in that case.  If they do not give us a
2496    convenient value, we have to generate a test and branch.  */
2497 static rtx
2498 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2499 {
2500   HOST_WIDE_INT val = 0;
2501   bool defined_at_zero = false;
2502   rtx temp;
2503   rtx_insn *seq;
2504
2505   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2506     {
2507       start_sequence ();
2508
2509       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2510       if (!temp)
2511         goto fail;
2512
2513       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2514     }
2515   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2516     {
2517       start_sequence ();
2518       temp = expand_ctz (mode, op0, 0);
2519       if (!temp)
2520         goto fail;
2521
2522       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2523         {
2524           defined_at_zero = true;
2525           val = (GET_MODE_PRECISION (mode) - 1) - val;
2526         }
2527     }
2528   else
2529     return 0;
2530
2531   if (defined_at_zero && val == -1)
2532     /* No correction needed at zero.  */;
2533   else
2534     {
2535       /* We don't try to do anything clever with the situation found
2536          on some processors (eg Alpha) where ctz(0:mode) ==
2537          bitsize(mode).  If someone can think of a way to send N to -1
2538          and leave alone all values in the range 0..N-1 (where N is a
2539          power of two), cheaper than this test-and-branch, please add it.
2540
2541          The test-and-branch is done after the operation itself, in case
2542          the operation sets condition codes that can be recycled for this.
2543          (This is true on i386, for instance.)  */
2544
2545       rtx_code_label *nonzero_label = gen_label_rtx ();
2546       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2547                                mode, true, nonzero_label);
2548
2549       convert_move (temp, GEN_INT (-1), false);
2550       emit_label (nonzero_label);
2551     }
2552
2553   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2554      to produce a value in the range 0..bitsize.  */
2555   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2556                        target, false, OPTAB_DIRECT);
2557   if (!temp)
2558     goto fail;
2559
2560   seq = get_insns ();
2561   end_sequence ();
2562
2563   add_equal_note (seq, temp, FFS, op0, 0);
2564   emit_insn (seq);
2565   return temp;
2566
2567  fail:
2568   end_sequence ();
2569   return 0;
2570 }
2571
2572 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2573    conditions, VAL may already be a SUBREG against which we cannot generate
2574    a further SUBREG.  In this case, we expect forcing the value into a
2575    register will work around the situation.  */
2576
2577 static rtx
2578 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2579                            machine_mode imode)
2580 {
2581   rtx ret;
2582   ret = lowpart_subreg (omode, val, imode);
2583   if (ret == NULL)
2584     {
2585       val = force_reg (imode, val);
2586       ret = lowpart_subreg (omode, val, imode);
2587       gcc_assert (ret != NULL);
2588     }
2589   return ret;
2590 }
2591
2592 /* Expand a floating point absolute value or negation operation via a
2593    logical operation on the sign bit.  */
2594
2595 static rtx
2596 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2597                    rtx op0, rtx target)
2598 {
2599   const struct real_format *fmt;
2600   int bitpos, word, nwords, i;
2601   scalar_int_mode imode;
2602   rtx temp;
2603   rtx_insn *insns;
2604
2605   /* The format has to have a simple sign bit.  */
2606   fmt = REAL_MODE_FORMAT (mode);
2607   if (fmt == NULL)
2608     return NULL_RTX;
2609
2610   bitpos = fmt->signbit_rw;
2611   if (bitpos < 0)
2612     return NULL_RTX;
2613
2614   /* Don't create negative zeros if the format doesn't support them.  */
2615   if (code == NEG && !fmt->has_signed_zero)
2616     return NULL_RTX;
2617
2618   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2619     {
2620       if (!int_mode_for_mode (mode).exists (&imode))
2621         return NULL_RTX;
2622       word = 0;
2623       nwords = 1;
2624     }
2625   else
2626     {
2627       imode = word_mode;
2628
2629       if (FLOAT_WORDS_BIG_ENDIAN)
2630         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2631       else
2632         word = bitpos / BITS_PER_WORD;
2633       bitpos = bitpos % BITS_PER_WORD;
2634       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2635     }
2636
2637   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2638   if (code == ABS)
2639     mask = ~mask;
2640
2641   if (target == 0
2642       || target == op0
2643       || (nwords > 1 && !valid_multiword_target_p (target)))
2644     target = gen_reg_rtx (mode);
2645
2646   if (nwords > 1)
2647     {
2648       start_sequence ();
2649
2650       for (i = 0; i < nwords; ++i)
2651         {
2652           rtx targ_piece = operand_subword (target, i, 1, mode);
2653           rtx op0_piece = operand_subword_force (op0, i, mode);
2654
2655           if (i == word)
2656             {
2657               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2658                                    op0_piece,
2659                                    immed_wide_int_const (mask, imode),
2660                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2661               if (temp != targ_piece)
2662                 emit_move_insn (targ_piece, temp);
2663             }
2664           else
2665             emit_move_insn (targ_piece, op0_piece);
2666         }
2667
2668       insns = get_insns ();
2669       end_sequence ();
2670
2671       emit_insn (insns);
2672     }
2673   else
2674     {
2675       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2676                            gen_lowpart (imode, op0),
2677                            immed_wide_int_const (mask, imode),
2678                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2679       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2680
2681       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2682                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2683                         target);
2684     }
2685
2686   return target;
2687 }
2688
2689 /* As expand_unop, but will fail rather than attempt the operation in a
2690    different mode or with a libcall.  */
2691 static rtx
2692 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2693                     int unsignedp)
2694 {
2695   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2696     {
2697       struct expand_operand ops[2];
2698       enum insn_code icode = optab_handler (unoptab, mode);
2699       rtx_insn *last = get_last_insn ();
2700       rtx_insn *pat;
2701
2702       create_output_operand (&ops[0], target, mode);
2703       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2704       pat = maybe_gen_insn (icode, 2, ops);
2705       if (pat)
2706         {
2707           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2708               && ! add_equal_note (pat, ops[0].value,
2709                                    optab_to_code (unoptab),
2710                                    ops[1].value, NULL_RTX))
2711             {
2712               delete_insns_since (last);
2713               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2714             }
2715
2716           emit_insn (pat);
2717
2718           return ops[0].value;
2719         }
2720     }
2721   return 0;
2722 }
2723
2724 /* Generate code to perform an operation specified by UNOPTAB
2725    on operand OP0, with result having machine-mode MODE.
2726
2727    UNSIGNEDP is for the case where we have to widen the operands
2728    to perform the operation.  It says to use zero-extension.
2729
2730    If TARGET is nonzero, the value
2731    is generated there, if it is convenient to do so.
2732    In all cases an rtx is returned for the locus of the value;
2733    this may or may not be TARGET.  */
2734
2735 rtx
2736 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2737              int unsignedp)
2738 {
2739   enum mode_class mclass = GET_MODE_CLASS (mode);
2740   machine_mode wider_mode;
2741   scalar_int_mode int_mode;
2742   scalar_float_mode float_mode;
2743   rtx temp;
2744   rtx libfunc;
2745
2746   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2747   if (temp)
2748     return temp;
2749
2750   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
2751
2752   /* Widening (or narrowing) clz needs special treatment.  */
2753   if (unoptab == clz_optab)
2754     {
2755       if (is_a <scalar_int_mode> (mode, &int_mode))
2756         {
2757           temp = widen_leading (int_mode, op0, target, unoptab);
2758           if (temp)
2759             return temp;
2760
2761           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2762               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2763             {
2764               temp = expand_doubleword_clz (int_mode, op0, target);
2765               if (temp)
2766                 return temp;
2767             }
2768         }
2769
2770       goto try_libcall;
2771     }
2772
2773   if (unoptab == clrsb_optab)
2774     {
2775       if (is_a <scalar_int_mode> (mode, &int_mode))
2776         {
2777           temp = widen_leading (int_mode, op0, target, unoptab);
2778           if (temp)
2779             return temp;
2780         }
2781       goto try_libcall;
2782     }
2783
2784   if (unoptab == popcount_optab
2785       && is_a <scalar_int_mode> (mode, &int_mode)
2786       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2787       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2788       && optimize_insn_for_speed_p ())
2789     {
2790       temp = expand_doubleword_popcount (int_mode, op0, target);
2791       if (temp)
2792         return temp;
2793     }
2794
2795   if (unoptab == parity_optab
2796       && is_a <scalar_int_mode> (mode, &int_mode)
2797       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2798       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2799           || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2800       && optimize_insn_for_speed_p ())
2801     {
2802       temp = expand_doubleword_parity (int_mode, op0, target);
2803       if (temp)
2804         return temp;
2805     }
2806
2807   /* Widening (or narrowing) bswap needs special treatment.  */
2808   if (unoptab == bswap_optab)
2809     {
2810       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2811          or ROTATERT.  First try these directly; if this fails, then try the
2812          obvious pair of shifts with allowed widening, as this will probably
2813          be always more efficient than the other fallback methods.  */
2814       if (mode == HImode)
2815         {
2816           rtx_insn *last;
2817           rtx temp1, temp2;
2818
2819           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2820             {
2821               temp = expand_binop (mode, rotl_optab, op0,
2822                                    gen_int_shift_amount (mode, 8),
2823                                    target, unsignedp, OPTAB_DIRECT);
2824               if (temp)
2825                 return temp;
2826              }
2827
2828           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2829             {
2830               temp = expand_binop (mode, rotr_optab, op0,
2831                                    gen_int_shift_amount (mode, 8),
2832                                    target, unsignedp, OPTAB_DIRECT);
2833               if (temp)
2834                 return temp;
2835             }
2836
2837           last = get_last_insn ();
2838
2839           temp1 = expand_binop (mode, ashl_optab, op0,
2840                                 gen_int_shift_amount (mode, 8), NULL_RTX,
2841                                 unsignedp, OPTAB_WIDEN);
2842           temp2 = expand_binop (mode, lshr_optab, op0,
2843                                 gen_int_shift_amount (mode, 8), NULL_RTX,
2844                                 unsignedp, OPTAB_WIDEN);
2845           if (temp1 && temp2)
2846             {
2847               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2848                                    unsignedp, OPTAB_WIDEN);
2849               if (temp)
2850                 return temp;
2851             }
2852
2853           delete_insns_since (last);
2854         }
2855
2856       if (is_a <scalar_int_mode> (mode, &int_mode))
2857         {
2858           temp = widen_bswap (int_mode, op0, target);
2859           if (temp)
2860             return temp;
2861
2862           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2863               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2864             {
2865               temp = expand_doubleword_bswap (mode, op0, target);
2866               if (temp)
2867                 return temp;
2868             }
2869         }
2870
2871       goto try_libcall;
2872     }
2873
2874   if (CLASS_HAS_WIDER_MODES_P (mclass))
2875     FOR_EACH_WIDER_MODE (wider_mode, mode)
2876       {
2877         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2878           {
2879             rtx xop0 = op0;
2880             rtx_insn *last = get_last_insn ();
2881
2882             /* For certain operations, we need not actually extend
2883                the narrow operand, as long as we will truncate the
2884                results to the same narrowness.  */
2885
2886             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2887                                   (unoptab == neg_optab
2888                                    || unoptab == one_cmpl_optab)
2889                                   && mclass == MODE_INT);
2890
2891             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2892                                 unsignedp);
2893
2894             if (temp)
2895               {
2896                 if (mclass != MODE_INT
2897                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2898                   {
2899                     if (target == 0)
2900                       target = gen_reg_rtx (mode);
2901                     convert_move (target, temp, 0);
2902                     return target;
2903                   }
2904                 else
2905                   return gen_lowpart (mode, temp);
2906               }
2907             else
2908               delete_insns_since (last);
2909           }
2910       }
2911
2912   /* These can be done a word at a time.  */
2913   if (unoptab == one_cmpl_optab
2914       && is_int_mode (mode, &int_mode)
2915       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2916       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2917     {
2918       int i;
2919       rtx_insn *insns;
2920
2921       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2922         target = gen_reg_rtx (int_mode);
2923
2924       start_sequence ();
2925
2926       /* Do the actual arithmetic.  */
2927       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2928         {
2929           rtx target_piece = operand_subword (target, i, 1, int_mode);
2930           rtx x = expand_unop (word_mode, unoptab,
2931                                operand_subword_force (op0, i, int_mode),
2932                                target_piece, unsignedp);
2933
2934           if (target_piece != x)
2935             emit_move_insn (target_piece, x);
2936         }
2937
2938       insns = get_insns ();
2939       end_sequence ();
2940
2941       emit_insn (insns);
2942       return target;
2943     }
2944
2945   if (optab_to_code (unoptab) == NEG)
2946     {
2947       /* Try negating floating point values by flipping the sign bit.  */
2948       if (is_a <scalar_float_mode> (mode, &float_mode))
2949         {
2950           temp = expand_absneg_bit (NEG, float_mode, op0, target);
2951           if (temp)
2952             return temp;
2953         }
2954
2955       /* If there is no negation pattern, and we have no negative zero,
2956          try subtracting from zero.  */
2957       if (!HONOR_SIGNED_ZEROS (mode))
2958         {
2959           temp = expand_binop (mode, (unoptab == negv_optab
2960                                       ? subv_optab : sub_optab),
2961                                CONST0_RTX (mode), op0, target,
2962                                unsignedp, OPTAB_DIRECT);
2963           if (temp)
2964             return temp;
2965         }
2966     }
2967
2968   /* Try calculating parity (x) as popcount (x) % 2.  */
2969   if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2970     {
2971       temp = expand_parity (int_mode, op0, target);
2972       if (temp)
2973         return temp;
2974     }
2975
2976   /* Try implementing ffs (x) in terms of clz (x).  */
2977   if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2978     {
2979       temp = expand_ffs (int_mode, op0, target);
2980       if (temp)
2981         return temp;
2982     }
2983
2984   /* Try implementing ctz (x) in terms of clz (x).  */
2985   if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2986     {
2987       temp = expand_ctz (int_mode, op0, target);
2988       if (temp)
2989         return temp;
2990     }
2991
2992  try_libcall:
2993   /* Now try a library call in this mode.  */
2994   libfunc = optab_libfunc (unoptab, mode);
2995   if (libfunc)
2996     {
2997       rtx_insn *insns;
2998       rtx value;
2999       rtx eq_value;
3000       machine_mode outmode = mode;
3001
3002       /* All of these functions return small values.  Thus we choose to
3003          have them return something that isn't a double-word.  */
3004       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3005           || unoptab == clrsb_optab || unoptab == popcount_optab
3006           || unoptab == parity_optab)
3007         outmode
3008           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3009                                           optab_libfunc (unoptab, mode)));
3010
3011       start_sequence ();
3012
3013       /* Pass 1 for NO_QUEUE so we don't lose any increments
3014          if the libcall is cse'd or moved.  */
3015       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3016                                        op0, mode);
3017       insns = get_insns ();
3018       end_sequence ();
3019
3020       target = gen_reg_rtx (outmode);
3021       bool trapv = trapv_unoptab_p (unoptab);
3022       if (trapv)
3023         eq_value = NULL_RTX;
3024       else
3025         {
3026           eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3027           if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3028             eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3029           else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3030             eq_value = simplify_gen_unary (ZERO_EXTEND,
3031                                            outmode, eq_value, mode);
3032         }
3033       emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3034
3035       return target;
3036     }
3037
3038   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3039
3040   if (CLASS_HAS_WIDER_MODES_P (mclass))
3041     {
3042       FOR_EACH_WIDER_MODE (wider_mode, mode)
3043         {
3044           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3045               || optab_libfunc (unoptab, wider_mode))
3046             {
3047               rtx xop0 = op0;
3048               rtx_insn *last = get_last_insn ();
3049
3050               /* For certain operations, we need not actually extend
3051                  the narrow operand, as long as we will truncate the
3052                  results to the same narrowness.  */
3053               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3054                                     (unoptab == neg_optab
3055                                      || unoptab == one_cmpl_optab
3056                                      || unoptab == bswap_optab)
3057                                     && mclass == MODE_INT);
3058
3059               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3060                                   unsignedp);
3061
3062               /* If we are generating clz using wider mode, adjust the
3063                  result.  Similarly for clrsb.  */
3064               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3065                   && temp != 0)
3066                 {
3067                   scalar_int_mode wider_int_mode
3068                     = as_a <scalar_int_mode> (wider_mode);
3069                   int_mode = as_a <scalar_int_mode> (mode);
3070                   temp = expand_binop
3071                     (wider_mode, sub_optab, temp,
3072                      gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3073                                    - GET_MODE_PRECISION (int_mode),
3074                                    wider_int_mode),
3075                      target, true, OPTAB_DIRECT);
3076                 }
3077
3078               /* Likewise for bswap.  */
3079               if (unoptab == bswap_optab && temp != 0)
3080                 {
3081                   scalar_int_mode wider_int_mode
3082                     = as_a <scalar_int_mode> (wider_mode);
3083                   int_mode = as_a <scalar_int_mode> (mode);
3084                   gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3085                               == GET_MODE_BITSIZE (wider_int_mode)
3086                               && GET_MODE_PRECISION (int_mode)
3087                                  == GET_MODE_BITSIZE (int_mode));
3088
3089                   temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3090                                        GET_MODE_BITSIZE (wider_int_mode)
3091                                        - GET_MODE_BITSIZE (int_mode),
3092                                        NULL_RTX, true);
3093                 }
3094
3095               if (temp)
3096                 {
3097                   if (mclass != MODE_INT)
3098                     {
3099                       if (target == 0)
3100                         target = gen_reg_rtx (mode);
3101                       convert_move (target, temp, 0);
3102                       return target;
3103                     }
3104                   else
3105                     return gen_lowpart (mode, temp);
3106                 }
3107               else
3108                 delete_insns_since (last);
3109             }
3110         }
3111     }
3112
3113   /* One final attempt at implementing negation via subtraction,
3114      this time allowing widening of the operand.  */
3115   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3116     {
3117       rtx temp;
3118       temp = expand_binop (mode,
3119                            unoptab == negv_optab ? subv_optab : sub_optab,
3120                            CONST0_RTX (mode), op0,
3121                            target, unsignedp, OPTAB_LIB_WIDEN);
3122       if (temp)
3123         return temp;
3124     }
3125
3126   return 0;
3127 }
3128 \f
3129 /* Emit code to compute the absolute value of OP0, with result to
3130    TARGET if convenient.  (TARGET may be 0.)  The return value says
3131    where the result actually is to be found.
3132
3133    MODE is the mode of the operand; the mode of the result is
3134    different but can be deduced from MODE.
3135
3136  */
3137
3138 rtx
3139 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3140                    int result_unsignedp)
3141 {
3142   rtx temp;
3143
3144   if (GET_MODE_CLASS (mode) != MODE_INT
3145       || ! flag_trapv)
3146     result_unsignedp = 1;
3147
3148   /* First try to do it with a special abs instruction.  */
3149   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3150                       op0, target, 0);
3151   if (temp != 0)
3152     return temp;
3153
3154   /* For floating point modes, try clearing the sign bit.  */
3155   scalar_float_mode float_mode;
3156   if (is_a <scalar_float_mode> (mode, &float_mode))
3157     {
3158       temp = expand_absneg_bit (ABS, float_mode, op0, target);
3159       if (temp)
3160         return temp;
3161     }
3162
3163   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3164   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3165       && !HONOR_SIGNED_ZEROS (mode))
3166     {
3167       rtx_insn *last = get_last_insn ();
3168
3169       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3170                           op0, NULL_RTX, 0);
3171       if (temp != 0)
3172         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3173                              OPTAB_WIDEN);
3174
3175       if (temp != 0)
3176         return temp;
3177
3178       delete_insns_since (last);
3179     }
3180
3181   /* If this machine has expensive jumps, we can do integer absolute
3182      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3183      where W is the width of MODE.  */
3184
3185   scalar_int_mode int_mode;
3186   if (is_int_mode (mode, &int_mode)
3187       && BRANCH_COST (optimize_insn_for_speed_p (),
3188                       false) >= 2)
3189     {
3190       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3191                                    GET_MODE_PRECISION (int_mode) - 1,
3192                                    NULL_RTX, 0);
3193
3194       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3195                            OPTAB_LIB_WIDEN);
3196       if (temp != 0)
3197         temp = expand_binop (int_mode,
3198                              result_unsignedp ? sub_optab : subv_optab,
3199                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3200
3201       if (temp != 0)
3202         return temp;
3203     }
3204
3205   return NULL_RTX;
3206 }
3207
3208 rtx
3209 expand_abs (machine_mode mode, rtx op0, rtx target,
3210             int result_unsignedp, int safe)
3211 {
3212   rtx temp;
3213   rtx_code_label *op1;
3214
3215   if (GET_MODE_CLASS (mode) != MODE_INT
3216       || ! flag_trapv)
3217     result_unsignedp = 1;
3218
3219   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3220   if (temp != 0)
3221     return temp;
3222
3223   /* If that does not win, use conditional jump and negate.  */
3224
3225   /* It is safe to use the target if it is the same
3226      as the source if this is also a pseudo register */
3227   if (op0 == target && REG_P (op0)
3228       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3229     safe = 1;
3230
3231   op1 = gen_label_rtx ();
3232   if (target == 0 || ! safe
3233       || GET_MODE (target) != mode
3234       || (MEM_P (target) && MEM_VOLATILE_P (target))
3235       || (REG_P (target)
3236           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3237     target = gen_reg_rtx (mode);
3238
3239   emit_move_insn (target, op0);
3240   NO_DEFER_POP;
3241
3242   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3243                            NULL_RTX, NULL, op1,
3244                            profile_probability::uninitialized ());
3245
3246   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3247                      target, target, 0);
3248   if (op0 != target)
3249     emit_move_insn (target, op0);
3250   emit_label (op1);
3251   OK_DEFER_POP;
3252   return target;
3253 }
3254
3255 /* Emit code to compute the one's complement absolute value of OP0
3256    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3257    (TARGET may be NULL_RTX.)  The return value says where the result
3258    actually is to be found.
3259
3260    MODE is the mode of the operand; the mode of the result is
3261    different but can be deduced from MODE.  */
3262
3263 rtx
3264 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3265 {
3266   rtx temp;
3267
3268   /* Not applicable for floating point modes.  */
3269   if (FLOAT_MODE_P (mode))
3270     return NULL_RTX;
3271
3272   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3273   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3274     {
3275       rtx_insn *last = get_last_insn ();
3276
3277       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3278       if (temp != 0)
3279         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3280                              OPTAB_WIDEN);
3281
3282       if (temp != 0)
3283         return temp;
3284
3285       delete_insns_since (last);
3286     }
3287
3288   /* If this machine has expensive jumps, we can do one's complement
3289      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3290
3291   scalar_int_mode int_mode;
3292   if (is_int_mode (mode, &int_mode)
3293       && BRANCH_COST (optimize_insn_for_speed_p (),
3294                      false) >= 2)
3295     {
3296       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3297                                    GET_MODE_PRECISION (int_mode) - 1,
3298                                    NULL_RTX, 0);
3299
3300       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3301                            OPTAB_LIB_WIDEN);
3302
3303       if (temp != 0)
3304         return temp;
3305     }
3306
3307   return NULL_RTX;
3308 }
3309
3310 /* A subroutine of expand_copysign, perform the copysign operation using the
3311    abs and neg primitives advertised to exist on the target.  The assumption
3312    is that we have a split register file, and leaving op0 in fp registers,
3313    and not playing with subregs so much, will help the register allocator.  */
3314
3315 static rtx
3316 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3317                         int bitpos, bool op0_is_abs)
3318 {
3319   scalar_int_mode imode;
3320   enum insn_code icode;
3321   rtx sign;
3322   rtx_code_label *label;
3323
3324   if (target == op1)
3325     target = NULL_RTX;
3326
3327   /* Check if the back end provides an insn that handles signbit for the
3328      argument's mode. */
3329   icode = optab_handler (signbit_optab, mode);
3330   if (icode != CODE_FOR_nothing)
3331     {
3332       imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3333       sign = gen_reg_rtx (imode);
3334       emit_unop_insn (icode, sign, op1, UNKNOWN);
3335     }
3336   else
3337     {
3338       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3339         {
3340           if (!int_mode_for_mode (mode).exists (&imode))
3341             return NULL_RTX;
3342           op1 = gen_lowpart (imode, op1);
3343         }
3344       else
3345         {
3346           int word;
3347
3348           imode = word_mode;
3349           if (FLOAT_WORDS_BIG_ENDIAN)
3350             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3351           else
3352             word = bitpos / BITS_PER_WORD;
3353           bitpos = bitpos % BITS_PER_WORD;
3354           op1 = operand_subword_force (op1, word, mode);
3355         }
3356
3357       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3358       sign = expand_binop (imode, and_optab, op1,
3359                            immed_wide_int_const (mask, imode),
3360                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3361     }
3362
3363   if (!op0_is_abs)
3364     {
3365       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3366       if (op0 == NULL)
3367         return NULL_RTX;
3368       target = op0;
3369     }
3370   else
3371     {
3372       if (target == NULL_RTX)
3373         target = copy_to_reg (op0);
3374       else
3375         emit_move_insn (target, op0);
3376     }
3377
3378   label = gen_label_rtx ();
3379   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3380
3381   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3382     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3383   else
3384     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3385   if (op0 != target)
3386     emit_move_insn (target, op0);
3387
3388   emit_label (label);
3389
3390   return target;
3391 }
3392
3393
3394 /* A subroutine of expand_copysign, perform the entire copysign operation
3395    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3396    is true if op0 is known to have its sign bit clear.  */
3397
3398 static rtx
3399 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3400                      int bitpos, bool op0_is_abs)
3401 {
3402   scalar_int_mode imode;
3403   int word, nwords, i;
3404   rtx temp;
3405   rtx_insn *insns;
3406
3407   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3408     {
3409       if (!int_mode_for_mode (mode).exists (&imode))
3410         return NULL_RTX;
3411       word = 0;
3412       nwords = 1;
3413     }
3414   else
3415     {
3416       imode = word_mode;
3417
3418       if (FLOAT_WORDS_BIG_ENDIAN)
3419         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3420       else
3421         word = bitpos / BITS_PER_WORD;
3422       bitpos = bitpos % BITS_PER_WORD;
3423       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3424     }
3425
3426   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3427
3428   if (target == 0
3429       || target == op0
3430       || target == op1
3431       || (nwords > 1 && !valid_multiword_target_p (target)))
3432     target = gen_reg_rtx (mode);
3433
3434   if (nwords > 1)
3435     {
3436       start_sequence ();
3437
3438       for (i = 0; i < nwords; ++i)
3439         {
3440           rtx targ_piece = operand_subword (target, i, 1, mode);
3441           rtx op0_piece = operand_subword_force (op0, i, mode);
3442
3443           if (i == word)
3444             {
3445               if (!op0_is_abs)
3446                 op0_piece
3447                   = expand_binop (imode, and_optab, op0_piece,
3448                                   immed_wide_int_const (~mask, imode),
3449                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3450               op1 = expand_binop (imode, and_optab,
3451                                   operand_subword_force (op1, i, mode),
3452                                   immed_wide_int_const (mask, imode),
3453                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3454
3455               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3456                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3457               if (temp != targ_piece)
3458                 emit_move_insn (targ_piece, temp);
3459             }
3460           else
3461             emit_move_insn (targ_piece, op0_piece);
3462         }
3463
3464       insns = get_insns ();
3465       end_sequence ();
3466
3467       emit_insn (insns);
3468     }
3469   else
3470     {
3471       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3472                           immed_wide_int_const (mask, imode),
3473                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3474
3475       op0 = gen_lowpart (imode, op0);
3476       if (!op0_is_abs)
3477         op0 = expand_binop (imode, and_optab, op0,
3478                             immed_wide_int_const (~mask, imode),
3479                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3480
3481       temp = expand_binop (imode, ior_optab, op0, op1,
3482                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3483       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3484     }
3485
3486   return target;
3487 }
3488
3489 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3490    scalar floating point mode.  Return NULL if we do not know how to
3491    expand the operation inline.  */
3492
3493 rtx
3494 expand_copysign (rtx op0, rtx op1, rtx target)
3495 {
3496   scalar_float_mode mode;
3497   const struct real_format *fmt;
3498   bool op0_is_abs;
3499   rtx temp;
3500
3501   mode = as_a <scalar_float_mode> (GET_MODE (op0));
3502   gcc_assert (GET_MODE (op1) == mode);
3503
3504   /* First try to do it with a special instruction.  */
3505   temp = expand_binop (mode, copysign_optab, op0, op1,
3506                        target, 0, OPTAB_DIRECT);
3507   if (temp)
3508     return temp;
3509
3510   fmt = REAL_MODE_FORMAT (mode);
3511   if (fmt == NULL || !fmt->has_signed_zero)
3512     return NULL_RTX;
3513
3514   op0_is_abs = false;
3515   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3516     {
3517       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3518         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3519       op0_is_abs = true;
3520     }
3521
3522   if (fmt->signbit_ro >= 0
3523       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3524           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3525               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3526     {
3527       temp = expand_copysign_absneg (mode, op0, op1, target,
3528                                      fmt->signbit_ro, op0_is_abs);
3529       if (temp)
3530         return temp;
3531     }
3532
3533   if (fmt->signbit_rw < 0)
3534     return NULL_RTX;
3535   return expand_copysign_bit (mode, op0, op1, target,
3536                               fmt->signbit_rw, op0_is_abs);
3537 }
3538 \f
3539 /* Generate an instruction whose insn-code is INSN_CODE,
3540    with two operands: an output TARGET and an input OP0.
3541    TARGET *must* be nonzero, and the output is always stored there.
3542    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3543    the value that is stored into TARGET.
3544
3545    Return false if expansion failed.  */
3546
3547 bool
3548 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3549                       enum rtx_code code)
3550 {
3551   struct expand_operand ops[2];
3552   rtx_insn *pat;
3553
3554   create_output_operand (&ops[0], target, GET_MODE (target));
3555   create_input_operand (&ops[1], op0, GET_MODE (op0));
3556   pat = maybe_gen_insn (icode, 2, ops);
3557   if (!pat)
3558     return false;
3559
3560   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3561       && code != UNKNOWN)
3562     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3563
3564   emit_insn (pat);
3565
3566   if (ops[0].value != target)
3567     emit_move_insn (target, ops[0].value);
3568   return true;
3569 }
3570 /* Generate an instruction whose insn-code is INSN_CODE,
3571    with two operands: an output TARGET and an input OP0.
3572    TARGET *must* be nonzero, and the output is always stored there.
3573    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3574    the value that is stored into TARGET.  */
3575
3576 void
3577 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3578 {
3579   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3580   gcc_assert (ok);
3581 }
3582 \f
3583 struct no_conflict_data
3584 {
3585   rtx target;
3586   rtx_insn *first, *insn;
3587   bool must_stay;
3588 };
3589
3590 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3591    the currently examined clobber / store has to stay in the list of
3592    insns that constitute the actual libcall block.  */
3593 static void
3594 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3595 {
3596   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3597
3598   /* If this inns directly contributes to setting the target, it must stay.  */
3599   if (reg_overlap_mentioned_p (p->target, dest))
3600     p->must_stay = true;
3601   /* If we haven't committed to keeping any other insns in the list yet,
3602      there is nothing more to check.  */
3603   else if (p->insn == p->first)
3604     return;
3605   /* If this insn sets / clobbers a register that feeds one of the insns
3606      already in the list, this insn has to stay too.  */
3607   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3608            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3609            || reg_used_between_p (dest, p->first, p->insn)
3610            /* Likewise if this insn depends on a register set by a previous
3611               insn in the list, or if it sets a result (presumably a hard
3612               register) that is set or clobbered by a previous insn.
3613               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3614               SET_DEST perform the former check on the address, and the latter
3615               check on the MEM.  */
3616            || (GET_CODE (set) == SET
3617                && (modified_in_p (SET_SRC (set), p->first)
3618                    || modified_in_p (SET_DEST (set), p->first)
3619                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3620                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3621     p->must_stay = true;
3622 }
3623
3624 \f
3625 /* Emit code to make a call to a constant function or a library call.
3626
3627    INSNS is a list containing all insns emitted in the call.
3628    These insns leave the result in RESULT.  Our block is to copy RESULT
3629    to TARGET, which is logically equivalent to EQUIV.
3630
3631    We first emit any insns that set a pseudo on the assumption that these are
3632    loading constants into registers; doing so allows them to be safely cse'ed
3633    between blocks.  Then we emit all the other insns in the block, followed by
3634    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3635    note with an operand of EQUIV.  */
3636
3637 static void
3638 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3639                       bool equiv_may_trap)
3640 {
3641   rtx final_dest = target;
3642   rtx_insn *next, *last, *insn;
3643
3644   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3645      into a MEM later.  Protect the libcall block from this change.  */
3646   if (! REG_P (target) || REG_USERVAR_P (target))
3647     target = gen_reg_rtx (GET_MODE (target));
3648
3649   /* If we're using non-call exceptions, a libcall corresponding to an
3650      operation that may trap may also trap.  */
3651   /* ??? See the comment in front of make_reg_eh_region_note.  */
3652   if (cfun->can_throw_non_call_exceptions
3653       && (equiv_may_trap || may_trap_p (equiv)))
3654     {
3655       for (insn = insns; insn; insn = NEXT_INSN (insn))
3656         if (CALL_P (insn))
3657           {
3658             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3659             if (note)
3660               {
3661                 int lp_nr = INTVAL (XEXP (note, 0));
3662                 if (lp_nr == 0 || lp_nr == INT_MIN)
3663                   remove_note (insn, note);
3664               }
3665           }
3666     }
3667   else
3668     {
3669       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3670          reg note to indicate that this call cannot throw or execute a nonlocal
3671          goto (unless there is already a REG_EH_REGION note, in which case
3672          we update it).  */
3673       for (insn = insns; insn; insn = NEXT_INSN (insn))
3674         if (CALL_P (insn))
3675           make_reg_eh_region_note_nothrow_nononlocal (insn);
3676     }
3677
3678   /* First emit all insns that set pseudos.  Remove them from the list as
3679      we go.  Avoid insns that set pseudos which were referenced in previous
3680      insns.  These can be generated by move_by_pieces, for example,
3681      to update an address.  Similarly, avoid insns that reference things
3682      set in previous insns.  */
3683
3684   for (insn = insns; insn; insn = next)
3685     {
3686       rtx set = single_set (insn);
3687
3688       next = NEXT_INSN (insn);
3689
3690       if (set != 0 && REG_P (SET_DEST (set))
3691           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3692         {
3693           struct no_conflict_data data;
3694
3695           data.target = const0_rtx;
3696           data.first = insns;
3697           data.insn = insn;
3698           data.must_stay = 0;
3699           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3700           if (! data.must_stay)
3701             {
3702               if (PREV_INSN (insn))
3703                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3704               else
3705                 insns = next;
3706
3707               if (next)
3708                 SET_PREV_INSN (next) = PREV_INSN (insn);
3709
3710               add_insn (insn);
3711             }
3712         }
3713
3714       /* Some ports use a loop to copy large arguments onto the stack.
3715          Don't move anything outside such a loop.  */
3716       if (LABEL_P (insn))
3717         break;
3718     }
3719
3720   /* Write the remaining insns followed by the final copy.  */
3721   for (insn = insns; insn; insn = next)
3722     {
3723       next = NEXT_INSN (insn);
3724
3725       add_insn (insn);
3726     }
3727
3728   last = emit_move_insn (target, result);
3729   if (equiv)
3730     set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3731
3732   if (final_dest != target)
3733     emit_move_insn (final_dest, target);
3734 }
3735
3736 void
3737 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3738 {
3739   emit_libcall_block_1 (insns, target, result, equiv, false);
3740 }
3741 \f
3742 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3743    PURPOSE describes how this comparison will be used.  CODE is the rtx
3744    comparison code we will be using.
3745
3746    ??? Actually, CODE is slightly weaker than that.  A target is still
3747    required to implement all of the normal bcc operations, but not
3748    required to implement all (or any) of the unordered bcc operations.  */
3749
3750 int
3751 can_compare_p (enum rtx_code code, machine_mode mode,
3752                enum can_compare_purpose purpose)
3753 {
3754   rtx test;
3755   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3756   do
3757     {
3758       enum insn_code icode;
3759
3760       if (purpose == ccp_jump
3761           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3762           && insn_operand_matches (icode, 0, test))
3763         return 1;
3764       if (purpose == ccp_store_flag
3765           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3766           && insn_operand_matches (icode, 1, test))
3767         return 1;
3768       if (purpose == ccp_cmov
3769           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3770         return 1;
3771
3772       mode = GET_MODE_WIDER_MODE (mode).else_void ();
3773       PUT_MODE (test, mode);
3774     }
3775   while (mode != VOIDmode);
3776
3777   return 0;
3778 }
3779
3780 /* This function is called when we are going to emit a compare instruction that
3781    compares the values found in X and Y, using the rtl operator COMPARISON.
3782
3783    If they have mode BLKmode, then SIZE specifies the size of both operands.
3784
3785    UNSIGNEDP nonzero says that the operands are unsigned;
3786    this matters if they need to be widened (as given by METHODS).
3787
3788    *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3789    if we failed to produce one.
3790
3791    *PMODE is the mode of the inputs (in case they are const_int).
3792
3793    This function performs all the setup necessary so that the caller only has
3794    to emit a single comparison insn.  This setup can involve doing a BLKmode
3795    comparison or emitting a library call to perform the comparison if no insn
3796    is available to handle it.
3797    The values which are passed in through pointers can be modified; the caller
3798    should perform the comparison on the modified values.  Constant
3799    comparisons must have already been folded.  */
3800
3801 static void
3802 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3803                   int unsignedp, enum optab_methods methods,
3804                   rtx *ptest, machine_mode *pmode)
3805 {
3806   machine_mode mode = *pmode;
3807   rtx libfunc, test;
3808   machine_mode cmp_mode;
3809   enum mode_class mclass;
3810
3811   /* The other methods are not needed.  */
3812   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3813               || methods == OPTAB_LIB_WIDEN);
3814
3815   if (CONST_SCALAR_INT_P (y))
3816     canonicalize_comparison (mode, &comparison, &y);
3817
3818   /* If we are optimizing, force expensive constants into a register.  */
3819   if (CONSTANT_P (x) && optimize
3820       && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3821           > COSTS_N_INSNS (1)))
3822     x = force_reg (mode, x);
3823
3824   if (CONSTANT_P (y) && optimize
3825       && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3826           > COSTS_N_INSNS (1)))
3827     y = force_reg (mode, y);
3828
3829 #if HAVE_cc0
3830   /* Make sure if we have a canonical comparison.  The RTL
3831      documentation states that canonical comparisons are required only
3832      for targets which have cc0.  */
3833   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3834 #endif
3835
3836   /* Don't let both operands fail to indicate the mode.  */
3837   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3838     x = force_reg (mode, x);
3839   if (mode == VOIDmode)
3840     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3841
3842   /* Handle all BLKmode compares.  */
3843
3844   if (mode == BLKmode)
3845     {
3846       machine_mode result_mode;
3847       enum insn_code cmp_code;
3848       rtx result;
3849       rtx opalign
3850         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3851
3852       gcc_assert (size);
3853
3854       /* Try to use a memory block compare insn - either cmpstr
3855          or cmpmem will do.  */
3856       opt_scalar_int_mode cmp_mode_iter;
3857       FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3858         {
3859           scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3860           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3861           if (cmp_code == CODE_FOR_nothing)
3862             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3863           if (cmp_code == CODE_FOR_nothing)
3864             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3865           if (cmp_code == CODE_FOR_nothing)
3866             continue;
3867
3868           /* Must make sure the size fits the insn's mode.  */
3869           if (CONST_INT_P (size)
3870               ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3871               : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3872                  > GET_MODE_BITSIZE (cmp_mode)))
3873             continue;
3874
3875           result_mode = insn_data[cmp_code].operand[0].mode;
3876           result = gen_reg_rtx (result_mode);
3877           size = convert_to_mode (cmp_mode, size, 1);
3878           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3879
3880           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3881           *pmode = result_mode;
3882           return;
3883         }
3884
3885       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3886         goto fail;
3887
3888       /* Otherwise call a library function.  */
3889       result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3890
3891       x = result;
3892       y = const0_rtx;
3893       mode = TYPE_MODE (integer_type_node);
3894       methods = OPTAB_LIB_WIDEN;
3895       unsignedp = false;
3896     }
3897
3898   /* Don't allow operands to the compare to trap, as that can put the
3899      compare and branch in different basic blocks.  */
3900   if (cfun->can_throw_non_call_exceptions)
3901     {
3902       if (may_trap_p (x))
3903         x = copy_to_reg (x);
3904       if (may_trap_p (y))
3905         y = copy_to_reg (y);
3906     }
3907
3908   if (GET_MODE_CLASS (mode) == MODE_CC)
3909     {
3910       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3911       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3912       gcc_assert (icode != CODE_FOR_nothing
3913                   && insn_operand_matches (icode, 0, test));
3914       *ptest = test;
3915       return;
3916     }
3917
3918   mclass = GET_MODE_CLASS (mode);
3919   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3920   FOR_EACH_MODE_FROM (cmp_mode, mode)
3921     {
3922       enum insn_code icode;
3923       icode = optab_handler (cbranch_optab, cmp_mode);
3924       if (icode != CODE_FOR_nothing
3925           && insn_operand_matches (icode, 0, test))
3926         {
3927           rtx_insn *last = get_last_insn ();
3928           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3929           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3930           if (op0 && op1
3931               && insn_operand_matches (icode, 1, op0)
3932               && insn_operand_matches (icode, 2, op1))
3933             {
3934               XEXP (test, 0) = op0;
3935               XEXP (test, 1) = op1;
3936               *ptest = test;
3937               *pmode = cmp_mode;
3938               return;
3939             }
3940           delete_insns_since (last);
3941         }
3942
3943       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3944         break;
3945     }
3946
3947   if (methods != OPTAB_LIB_WIDEN)
3948     goto fail;
3949
3950   if (SCALAR_FLOAT_MODE_P (mode))
3951     {
3952       /* Small trick if UNORDERED isn't implemented by the hardware.  */
3953       if (comparison == UNORDERED && rtx_equal_p (x, y))
3954         {
3955           prepare_cmp_insn (x, y, UNLT, NULL_RTX, unsignedp, OPTAB_WIDEN,
3956                             ptest, pmode);
3957           if (*ptest)
3958             return;
3959         }
3960
3961       prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3962     }
3963   else
3964     {
3965       rtx result;
3966       machine_mode ret_mode;
3967
3968       /* Handle a libcall just for the mode we are using.  */
3969       libfunc = optab_libfunc (cmp_optab, mode);
3970       gcc_assert (libfunc);
3971
3972       /* If we want unsigned, and this mode has a distinct unsigned
3973          comparison routine, use that.  */
3974       if (unsignedp)
3975         {
3976           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3977           if (ulibfunc)
3978             libfunc = ulibfunc;
3979         }
3980
3981       ret_mode = targetm.libgcc_cmp_return_mode ();
3982       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3983                                         ret_mode, x, mode, y, mode);
3984
3985       /* There are two kinds of comparison routines. Biased routines
3986          return 0/1/2, and unbiased routines return -1/0/1. Other parts
3987          of gcc expect that the comparison operation is equivalent
3988          to the modified comparison. For signed comparisons compare the
3989          result against 1 in the biased case, and zero in the unbiased
3990          case. For unsigned comparisons always compare against 1 after
3991          biasing the unbiased result by adding 1. This gives us a way to
3992          represent LTU.
3993          The comparisons in the fixed-point helper library are always
3994          biased.  */
3995       x = result;
3996       y = const1_rtx;
3997
3998       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3999         {
4000           if (unsignedp)
4001             x = plus_constant (ret_mode, result, 1);
4002           else
4003             y = const0_rtx;
4004         }
4005
4006       *pmode = ret_mode;
4007       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4008                         ptest, pmode);
4009     }
4010
4011   return;
4012
4013  fail:
4014   *ptest = NULL_RTX;
4015 }
4016
4017 /* Before emitting an insn with code ICODE, make sure that X, which is going
4018    to be used for operand OPNUM of the insn, is converted from mode MODE to
4019    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4020    that it is accepted by the operand predicate.  Return the new value.  */
4021
4022 rtx
4023 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4024                  machine_mode wider_mode, int unsignedp)
4025 {
4026   if (mode != wider_mode)
4027     x = convert_modes (wider_mode, mode, x, unsignedp);
4028
4029   if (!insn_operand_matches (icode, opnum, x))
4030     {
4031       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4032       if (reload_completed)
4033         return NULL_RTX;
4034       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4035         return NULL_RTX;
4036       x = copy_to_mode_reg (op_mode, x);
4037     }
4038
4039   return x;
4040 }
4041
4042 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4043    we can do the branch.  */
4044
4045 static void
4046 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4047                           profile_probability prob)
4048 {
4049   machine_mode optab_mode;
4050   enum mode_class mclass;
4051   enum insn_code icode;
4052   rtx_insn *insn;
4053
4054   mclass = GET_MODE_CLASS (mode);
4055   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4056   icode = optab_handler (cbranch_optab, optab_mode);
4057
4058   gcc_assert (icode != CODE_FOR_nothing);
4059   gcc_assert (insn_operand_matches (icode, 0, test));
4060   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4061                                           XEXP (test, 1), label));
4062   if (prob.initialized_p ()
4063       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4064       && insn
4065       && JUMP_P (insn)
4066       && any_condjump_p (insn)
4067       && !find_reg_note (insn, REG_BR_PROB, 0))
4068     add_reg_br_prob_note (insn, prob);
4069 }
4070
4071 /* Generate code to compare X with Y so that the condition codes are
4072    set and to jump to LABEL if the condition is true.  If X is a
4073    constant and Y is not a constant, then the comparison is swapped to
4074    ensure that the comparison RTL has the canonical form.
4075
4076    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4077    need to be widened.  UNSIGNEDP is also used to select the proper
4078    branch condition code.
4079
4080    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4081
4082    MODE is the mode of the inputs (in case they are const_int).
4083
4084    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4085    It will be potentially converted into an unsigned variant based on
4086    UNSIGNEDP to select a proper jump instruction.
4087
4088    PROB is the probability of jumping to LABEL.  */
4089
4090 void
4091 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4092                          machine_mode mode, int unsignedp, rtx label,
4093                          profile_probability prob)
4094 {
4095   rtx op0 = x, op1 = y;
4096   rtx test;
4097
4098   /* Swap operands and condition to ensure canonical RTL.  */
4099   if (swap_commutative_operands_p (x, y)
4100       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4101     {
4102       op0 = y, op1 = x;
4103       comparison = swap_condition (comparison);
4104     }
4105
4106   /* If OP0 is still a constant, then both X and Y must be constants
4107      or the opposite comparison is not supported.  Force X into a register
4108      to create canonical RTL.  */
4109   if (CONSTANT_P (op0))
4110     op0 = force_reg (mode, op0);
4111
4112   if (unsignedp)
4113     comparison = unsigned_condition (comparison);
4114
4115   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4116                     &test, &mode);
4117   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4118 }
4119
4120 \f
4121 /* Emit a library call comparison between floating point X and Y.
4122    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4123
4124 static void
4125 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4126                        rtx *ptest, machine_mode *pmode)
4127 {
4128   enum rtx_code swapped = swap_condition (comparison);
4129   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4130   machine_mode orig_mode = GET_MODE (x);
4131   machine_mode mode;
4132   rtx true_rtx, false_rtx;
4133   rtx value, target, equiv;
4134   rtx_insn *insns;
4135   rtx libfunc = 0;
4136   bool reversed_p = false;
4137   scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4138
4139   FOR_EACH_MODE_FROM (mode, orig_mode)
4140     {
4141       if (code_to_optab (comparison)
4142           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4143         break;
4144
4145       if (code_to_optab (swapped)
4146           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4147         {
4148           std::swap (x, y);
4149           comparison = swapped;
4150           break;
4151         }
4152
4153       if (code_to_optab (reversed)
4154           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4155         {
4156           comparison = reversed;
4157           reversed_p = true;
4158           break;
4159         }
4160     }
4161
4162   gcc_assert (mode != VOIDmode);
4163
4164   if (mode != orig_mode)
4165     {
4166       x = convert_to_mode (mode, x, 0);
4167       y = convert_to_mode (mode, y, 0);
4168     }
4169
4170   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4171      the RTL.  The allows the RTL optimizers to delete the libcall if the
4172      condition can be determined at compile-time.  */
4173   if (comparison == UNORDERED
4174       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4175     {
4176       true_rtx = const_true_rtx;
4177       false_rtx = const0_rtx;
4178     }
4179   else
4180     {
4181       switch (comparison)
4182         {
4183         case EQ:
4184           true_rtx = const0_rtx;
4185           false_rtx = const_true_rtx;
4186           break;
4187
4188         case NE:
4189           true_rtx = const_true_rtx;
4190           false_rtx = const0_rtx;
4191           break;
4192
4193         case GT:
4194           true_rtx = const1_rtx;
4195           false_rtx = const0_rtx;
4196           break;
4197
4198         case GE:
4199           true_rtx = const0_rtx;
4200           false_rtx = constm1_rtx;
4201           break;
4202
4203         case LT:
4204           true_rtx = constm1_rtx;
4205           false_rtx = const0_rtx;
4206           break;
4207
4208         case LE:
4209           true_rtx = const0_rtx;
4210           false_rtx = const1_rtx;
4211           break;
4212
4213         default:
4214           gcc_unreachable ();
4215         }
4216     }
4217
4218   if (comparison == UNORDERED)
4219     {
4220       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4221       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4222       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4223                                     temp, const_true_rtx, equiv);
4224     }
4225   else
4226     {
4227       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4228       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4229         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4230                                       equiv, true_rtx, false_rtx);
4231     }
4232
4233   start_sequence ();
4234   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4235                                    cmp_mode, x, mode, y, mode);
4236   insns = get_insns ();
4237   end_sequence ();
4238
4239   target = gen_reg_rtx (cmp_mode);
4240   emit_libcall_block (insns, target, value, equiv);
4241
4242   if (comparison == UNORDERED
4243       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4244       || reversed_p)
4245     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4246   else
4247     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4248
4249   *pmode = cmp_mode;
4250 }
4251 \f
4252 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4253
4254 void
4255 emit_indirect_jump (rtx loc)
4256 {
4257   if (!targetm.have_indirect_jump ())
4258     sorry ("indirect jumps are not available on this target");
4259   else
4260     {
4261       struct expand_operand ops[1];
4262       create_address_operand (&ops[0], loc);
4263       expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4264       emit_barrier ();
4265     }
4266 }
4267 \f
4268
4269 /* Emit a conditional move instruction if the machine supports one for that
4270    condition and machine mode.
4271
4272    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4273    the mode to use should they be constants.  If it is VOIDmode, they cannot
4274    both be constants.
4275
4276    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4277    should be stored there.  MODE is the mode to use should they be constants.
4278    If it is VOIDmode, they cannot both be constants.
4279
4280    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4281    is not supported.  */
4282
4283 rtx
4284 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4285                        machine_mode cmode, rtx op2, rtx op3,
4286                        machine_mode mode, int unsignedp)
4287 {
4288   rtx comparison;
4289   rtx_insn *last;
4290   enum insn_code icode;
4291   enum rtx_code reversed;
4292
4293   /* If the two source operands are identical, that's just a move.  */
4294
4295   if (rtx_equal_p (op2, op3))
4296     {
4297       if (!target)
4298         target = gen_reg_rtx (mode);
4299
4300       emit_move_insn (target, op3);
4301       return target;
4302     }
4303
4304   /* If one operand is constant, make it the second one.  Only do this
4305      if the other operand is not constant as well.  */
4306
4307   if (swap_commutative_operands_p (op0, op1))
4308     {
4309       std::swap (op0, op1);
4310       code = swap_condition (code);
4311     }
4312
4313   /* get_condition will prefer to generate LT and GT even if the old
4314      comparison was against zero, so undo that canonicalization here since
4315      comparisons against zero are cheaper.  */
4316   if (code == LT && op1 == const1_rtx)
4317     code = LE, op1 = const0_rtx;
4318   else if (code == GT && op1 == constm1_rtx)
4319     code = GE, op1 = const0_rtx;
4320
4321   if (cmode == VOIDmode)
4322     cmode = GET_MODE (op0);
4323
4324   enum rtx_code orig_code = code;
4325   bool swapped = false;
4326   if (swap_commutative_operands_p (op2, op3)
4327       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4328           != UNKNOWN))
4329     {
4330       std::swap (op2, op3);
4331       code = reversed;
4332       swapped = true;
4333     }
4334
4335   if (mode == VOIDmode)
4336     mode = GET_MODE (op2);
4337
4338   icode = direct_optab_handler (movcc_optab, mode);
4339
4340   if (icode == CODE_FOR_nothing)
4341     return NULL_RTX;
4342
4343   if (!target)
4344     target = gen_reg_rtx (mode);
4345
4346   for (int pass = 0; ; pass++)
4347     {
4348       code = unsignedp ? unsigned_condition (code) : code;
4349       comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4350
4351       /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4352          punt and let the caller figure out how best to deal with this
4353          situation.  */
4354       if (COMPARISON_P (comparison))
4355         {
4356           saved_pending_stack_adjust save;
4357           save_pending_stack_adjust (&save);
4358           last = get_last_insn ();
4359           do_pending_stack_adjust ();
4360           machine_mode cmpmode = cmode;
4361           prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4362                             GET_CODE (comparison), NULL_RTX, unsignedp,
4363                             OPTAB_WIDEN, &comparison, &cmpmode);
4364           if (comparison)
4365             {
4366               struct expand_operand ops[4];
4367
4368               create_output_operand (&ops[0], target, mode);
4369               create_fixed_operand (&ops[1], comparison);
4370               create_input_operand (&ops[2], op2, mode);
4371               create_input_operand (&ops[3], op3, mode);
4372               if (maybe_expand_insn (icode, 4, ops))
4373                 {
4374                   if (ops[0].value != target)
4375                     convert_move (target, ops[0].value, false);
4376                   return target;
4377                 }
4378             }
4379           delete_insns_since (last);
4380           restore_pending_stack_adjust (&save);
4381         }
4382
4383       if (pass == 1)
4384         return NULL_RTX;
4385
4386       /* If the preferred op2/op3 order is not usable, retry with other
4387          operand order, perhaps it will expand successfully.  */
4388       if (swapped)
4389         code = orig_code;
4390       else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4391                                                            NULL))
4392                != UNKNOWN)
4393         code = reversed;
4394       else
4395         return NULL_RTX;
4396       std::swap (op2, op3);
4397     }
4398 }
4399
4400
4401 /* Emit a conditional negate or bitwise complement using the
4402    negcc or notcc optabs if available.  Return NULL_RTX if such operations
4403    are not available.  Otherwise return the RTX holding the result.
4404    TARGET is the desired destination of the result.  COMP is the comparison
4405    on which to negate.  If COND is true move into TARGET the negation
4406    or bitwise complement of OP1.  Otherwise move OP2 into TARGET.
4407    CODE is either NEG or NOT.  MODE is the machine mode in which the
4408    operation is performed.  */
4409
4410 rtx
4411 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4412                                      machine_mode mode, rtx cond, rtx op1,
4413                                      rtx op2)
4414 {
4415   optab op = unknown_optab;
4416   if (code == NEG)
4417     op = negcc_optab;
4418   else if (code == NOT)
4419     op = notcc_optab;
4420   else
4421     gcc_unreachable ();
4422
4423   insn_code icode = direct_optab_handler (op, mode);
4424
4425   if (icode == CODE_FOR_nothing)
4426     return NULL_RTX;
4427
4428   if (!target)
4429     target = gen_reg_rtx (mode);
4430
4431   rtx_insn *last = get_last_insn ();
4432   struct expand_operand ops[4];
4433
4434   create_output_operand (&ops[0], target, mode);
4435   create_fixed_operand (&ops[1], cond);
4436   create_input_operand (&ops[2], op1, mode);
4437   create_input_operand (&ops[3], op2, mode);
4438
4439   if (maybe_expand_insn (icode, 4, ops))
4440     {
4441       if (ops[0].value != target)
4442         convert_move (target, ops[0].value, false);
4443
4444       return target;
4445     }
4446   delete_insns_since (last);
4447   return NULL_RTX;
4448 }
4449
4450 /* Emit a conditional addition instruction if the machine supports one for that
4451    condition and machine mode.
4452
4453    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4454    the mode to use should they be constants.  If it is VOIDmode, they cannot
4455    both be constants.
4456
4457    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4458    should be stored there.  MODE is the mode to use should they be constants.
4459    If it is VOIDmode, they cannot both be constants.
4460
4461    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4462    is not supported.  */
4463
4464 rtx
4465 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4466                       machine_mode cmode, rtx op2, rtx op3,
4467                       machine_mode mode, int unsignedp)
4468 {
4469   rtx comparison;
4470   rtx_insn *last;
4471   enum insn_code icode;
4472
4473   /* If one operand is constant, make it the second one.  Only do this
4474      if the other operand is not constant as well.  */
4475
4476   if (swap_commutative_operands_p (op0, op1))
4477     {
4478       std::swap (op0, op1);
4479       code = swap_condition (code);
4480     }
4481
4482   /* get_condition will prefer to generate LT and GT even if the old
4483      comparison was against zero, so undo that canonicalization here since
4484      comparisons against zero are cheaper.  */
4485   if (code == LT && op1 == const1_rtx)
4486     code = LE, op1 = const0_rtx;
4487   else if (code == GT && op1 == constm1_rtx)
4488     code = GE, op1 = const0_rtx;
4489
4490   if (cmode == VOIDmode)
4491     cmode = GET_MODE (op0);
4492
4493   if (mode == VOIDmode)
4494     mode = GET_MODE (op2);
4495
4496   icode = optab_handler (addcc_optab, mode);
4497
4498   if (icode == CODE_FOR_nothing)
4499     return 0;
4500
4501   if (!target)
4502     target = gen_reg_rtx (mode);
4503
4504   code = unsignedp ? unsigned_condition (code) : code;
4505   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4506
4507   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4508      return NULL and let the caller figure out how best to deal with this
4509      situation.  */
4510   if (!COMPARISON_P (comparison))
4511     return NULL_RTX;
4512
4513   do_pending_stack_adjust ();
4514   last = get_last_insn ();
4515   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4516                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4517                     &comparison, &cmode);
4518   if (comparison)
4519     {
4520       struct expand_operand ops[4];
4521
4522       create_output_operand (&ops[0], target, mode);
4523       create_fixed_operand (&ops[1], comparison);
4524       create_input_operand (&ops[2], op2, mode);
4525       create_input_operand (&ops[3], op3, mode);
4526       if (maybe_expand_insn (icode, 4, ops))
4527         {
4528           if (ops[0].value != target)
4529             convert_move (target, ops[0].value, false);
4530           return target;
4531         }
4532     }
4533   delete_insns_since (last);
4534   return NULL_RTX;
4535 }
4536 \f
4537 /* These functions attempt to generate an insn body, rather than
4538    emitting the insn, but if the gen function already emits them, we
4539    make no attempt to turn them back into naked patterns.  */
4540
4541 /* Generate and return an insn body to add Y to X.  */
4542
4543 rtx_insn *
4544 gen_add2_insn (rtx x, rtx y)
4545 {
4546   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4547
4548   gcc_assert (insn_operand_matches (icode, 0, x));
4549   gcc_assert (insn_operand_matches (icode, 1, x));
4550   gcc_assert (insn_operand_matches (icode, 2, y));
4551
4552   return GEN_FCN (icode) (x, x, y);
4553 }
4554
4555 /* Generate and return an insn body to add r1 and c,
4556    storing the result in r0.  */
4557
4558 rtx_insn *
4559 gen_add3_insn (rtx r0, rtx r1, rtx c)
4560 {
4561   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4562
4563   if (icode == CODE_FOR_nothing
4564       || !insn_operand_matches (icode, 0, r0)
4565       || !insn_operand_matches (icode, 1, r1)
4566       || !insn_operand_matches (icode, 2, c))
4567     return NULL;
4568
4569   return GEN_FCN (icode) (r0, r1, c);
4570 }
4571
4572 int
4573 have_add2_insn (rtx x, rtx y)
4574 {
4575   enum insn_code icode;
4576
4577   gcc_assert (GET_MODE (x) != VOIDmode);
4578
4579   icode = optab_handler (add_optab, GET_MODE (x));
4580
4581   if (icode == CODE_FOR_nothing)
4582     return 0;
4583
4584   if (!insn_operand_matches (icode, 0, x)
4585       || !insn_operand_matches (icode, 1, x)
4586       || !insn_operand_matches (icode, 2, y))
4587     return 0;
4588
4589   return 1;
4590 }
4591
4592 /* Generate and return an insn body to add Y to X.  */
4593
4594 rtx_insn *
4595 gen_addptr3_insn (rtx x, rtx y, rtx z)
4596 {
4597   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4598
4599   gcc_assert (insn_operand_matches (icode, 0, x));
4600   gcc_assert (insn_operand_matches (icode, 1, y));
4601   gcc_assert (insn_operand_matches (icode, 2, z));
4602
4603   return GEN_FCN (icode) (x, y, z);
4604 }
4605
4606 /* Return true if the target implements an addptr pattern and X, Y,
4607    and Z are valid for the pattern predicates.  */
4608
4609 int
4610 have_addptr3_insn (rtx x, rtx y, rtx z)
4611 {
4612   enum insn_code icode;
4613
4614   gcc_assert (GET_MODE (x) != VOIDmode);
4615
4616   icode = optab_handler (addptr3_optab, GET_MODE (x));
4617
4618   if (icode == CODE_FOR_nothing)
4619     return 0;
4620
4621   if (!insn_operand_matches (icode, 0, x)
4622       || !insn_operand_matches (icode, 1, y)
4623       || !insn_operand_matches (icode, 2, z))
4624     return 0;
4625
4626   return 1;
4627 }
4628
4629 /* Generate and return an insn body to subtract Y from X.  */
4630
4631 rtx_insn *
4632 gen_sub2_insn (rtx x, rtx y)
4633 {
4634   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4635
4636   gcc_assert (insn_operand_matches (icode, 0, x));
4637   gcc_assert (insn_operand_matches (icode, 1, x));
4638   gcc_assert (insn_operand_matches (icode, 2, y));
4639
4640   return GEN_FCN (icode) (x, x, y);
4641 }
4642
4643 /* Generate and return an insn body to subtract r1 and c,
4644    storing the result in r0.  */
4645
4646 rtx_insn *
4647 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4648 {
4649   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4650
4651   if (icode == CODE_FOR_nothing
4652       || !insn_operand_matches (icode, 0, r0)
4653       || !insn_operand_matches (icode, 1, r1)
4654       || !insn_operand_matches (icode, 2, c))
4655     return NULL;
4656
4657   return GEN_FCN (icode) (r0, r1, c);
4658 }
4659
4660 int
4661 have_sub2_insn (rtx x, rtx y)
4662 {
4663   enum insn_code icode;
4664
4665   gcc_assert (GET_MODE (x) != VOIDmode);
4666
4667   icode = optab_handler (sub_optab, GET_MODE (x));
4668
4669   if (icode == CODE_FOR_nothing)
4670     return 0;
4671
4672   if (!insn_operand_matches (icode, 0, x)
4673       || !insn_operand_matches (icode, 1, x)
4674       || !insn_operand_matches (icode, 2, y))
4675     return 0;
4676
4677   return 1;
4678 }
4679 \f
4680 /* Generate the body of an insn to extend Y (with mode MFROM)
4681    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4682
4683 rtx_insn *
4684 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4685                  machine_mode mfrom, int unsignedp)
4686 {
4687   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4688   return GEN_FCN (icode) (x, y);
4689 }
4690 \f
4691 /* Generate code to convert FROM to floating point
4692    and store in TO.  FROM must be fixed point and not VOIDmode.
4693    UNSIGNEDP nonzero means regard FROM as unsigned.
4694    Normally this is done by correcting the final value
4695    if it is negative.  */
4696
4697 void
4698 expand_float (rtx to, rtx from, int unsignedp)
4699 {
4700   enum insn_code icode;
4701   rtx target = to;
4702   scalar_mode from_mode, to_mode;
4703   machine_mode fmode, imode;
4704   bool can_do_signed = false;
4705
4706   /* Crash now, because we won't be able to decide which mode to use.  */
4707   gcc_assert (GET_MODE (from) != VOIDmode);
4708
4709   /* Look for an insn to do the conversion.  Do it in the specified
4710      modes if possible; otherwise convert either input, output or both to
4711      wider mode.  If the integer mode is wider than the mode of FROM,
4712      we can do the conversion signed even if the input is unsigned.  */
4713
4714   FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4715     FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4716       {
4717         int doing_unsigned = unsignedp;
4718
4719         if (fmode != GET_MODE (to)
4720             && (significand_size (fmode)
4721                 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
4722           continue;
4723
4724         icode = can_float_p (fmode, imode, unsignedp);
4725         if (icode == CODE_FOR_nothing && unsignedp)
4726           {
4727             enum insn_code scode = can_float_p (fmode, imode, 0);
4728             if (scode != CODE_FOR_nothing)
4729               can_do_signed = true;
4730             if (imode != GET_MODE (from))
4731               icode = scode, doing_unsigned = 0;
4732           }
4733
4734         if (icode != CODE_FOR_nothing)
4735           {
4736             if (imode != GET_MODE (from))
4737               from = convert_to_mode (imode, from, unsignedp);
4738
4739             if (fmode != GET_MODE (to))
4740               target = gen_reg_rtx (fmode);
4741
4742             emit_unop_insn (icode, target, from,
4743                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4744
4745             if (target != to)
4746               convert_move (to, target, 0);
4747             return;
4748           }
4749       }
4750
4751   /* Unsigned integer, and no way to convert directly.  Convert as signed,
4752      then unconditionally adjust the result.  */
4753   if (unsignedp
4754       && can_do_signed
4755       && is_a <scalar_mode> (GET_MODE (to), &to_mode)
4756       && is_a <scalar_mode> (GET_MODE (from), &from_mode))
4757     {
4758       opt_scalar_mode fmode_iter;
4759       rtx_code_label *label = gen_label_rtx ();
4760       rtx temp;
4761       REAL_VALUE_TYPE offset;
4762
4763       /* Look for a usable floating mode FMODE wider than the source and at
4764          least as wide as the target.  Using FMODE will avoid rounding woes
4765          with unsigned values greater than the signed maximum value.  */
4766
4767       FOR_EACH_MODE_FROM (fmode_iter, to_mode)
4768         {
4769           scalar_mode fmode = fmode_iter.require ();
4770           if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
4771               && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
4772             break;
4773         }
4774
4775       if (!fmode_iter.exists (&fmode))
4776         {
4777           /* There is no such mode.  Pretend the target is wide enough.  */
4778           fmode = to_mode;
4779
4780           /* Avoid double-rounding when TO is narrower than FROM.  */
4781           if ((significand_size (fmode) + 1)
4782               < GET_MODE_PRECISION (from_mode))
4783             {
4784               rtx temp1;
4785               rtx_code_label *neglabel = gen_label_rtx ();
4786
4787               /* Don't use TARGET if it isn't a register, is a hard register,
4788                  or is the wrong mode.  */
4789               if (!REG_P (target)
4790                   || REGNO (target) < FIRST_PSEUDO_REGISTER
4791                   || GET_MODE (target) != fmode)
4792                 target = gen_reg_rtx (fmode);
4793
4794               imode = from_mode;
4795               do_pending_stack_adjust ();
4796
4797               /* Test whether the sign bit is set.  */
4798               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4799                                        0, neglabel);
4800
4801               /* The sign bit is not set.  Convert as signed.  */
4802               expand_float (target, from, 0);
4803               emit_jump_insn (targetm.gen_jump (label));
4804               emit_barrier ();
4805
4806               /* The sign bit is set.
4807                  Convert to a usable (positive signed) value by shifting right
4808                  one bit, while remembering if a nonzero bit was shifted
4809                  out; i.e., compute  (from & 1) | (from >> 1).  */
4810
4811               emit_label (neglabel);
4812               temp = expand_binop (imode, and_optab, from, const1_rtx,
4813                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
4814               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4815               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4816                                    OPTAB_LIB_WIDEN);
4817               expand_float (target, temp, 0);
4818
4819               /* Multiply by 2 to undo the shift above.  */
4820               temp = expand_binop (fmode, add_optab, target, target,
4821                                    target, 0, OPTAB_LIB_WIDEN);
4822               if (temp != target)
4823                 emit_move_insn (target, temp);
4824
4825               do_pending_stack_adjust ();
4826               emit_label (label);
4827               goto done;
4828             }
4829         }
4830
4831       /* If we are about to do some arithmetic to correct for an
4832          unsigned operand, do it in a pseudo-register.  */
4833
4834       if (to_mode != fmode
4835           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4836         target = gen_reg_rtx (fmode);
4837
4838       /* Convert as signed integer to floating.  */
4839       expand_float (target, from, 0);
4840
4841       /* If FROM is negative (and therefore TO is negative),
4842          correct its value by 2**bitwidth.  */
4843
4844       do_pending_stack_adjust ();
4845       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
4846                                0, label);
4847
4848
4849       real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
4850       temp = expand_binop (fmode, add_optab, target,
4851                            const_double_from_real_value (offset, fmode),
4852                            target, 0, OPTAB_LIB_WIDEN);
4853       if (temp != target)
4854         emit_move_insn (target, temp);
4855
4856       do_pending_stack_adjust ();
4857       emit_label (label);
4858       goto done;
4859     }
4860
4861   /* No hardware instruction available; call a library routine.  */
4862     {
4863       rtx libfunc;
4864       rtx_insn *insns;
4865       rtx value;
4866       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4867
4868       if (is_narrower_int_mode (GET_MODE (from), SImode))
4869         from = convert_to_mode (SImode, from, unsignedp);
4870
4871       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4872       gcc_assert (libfunc);
4873
4874       start_sequence ();
4875
4876       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4877                                        GET_MODE (to), from, GET_MODE (from));
4878       insns = get_insns ();
4879       end_sequence ();
4880
4881       emit_libcall_block (insns, target, value,
4882                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4883                                          GET_MODE (to), from));
4884     }
4885
4886  done:
4887
4888   /* Copy result to requested destination
4889      if we have been computing in a temp location.  */
4890
4891   if (target != to)
4892     {
4893       if (GET_MODE (target) == GET_MODE (to))
4894         emit_move_insn (to, target);
4895       else
4896         convert_move (to, target, 0);
4897     }
4898 }
4899 \f
4900 /* Generate code to convert FROM to fixed point and store in TO.  FROM
4901    must be floating point.  */
4902
4903 void
4904 expand_fix (rtx to, rtx from, int unsignedp)
4905 {
4906   enum insn_code icode;
4907   rtx target = to;
4908   machine_mode fmode, imode;
4909   opt_scalar_mode fmode_iter;
4910   bool must_trunc = false;
4911
4912   /* We first try to find a pair of modes, one real and one integer, at
4913      least as wide as FROM and TO, respectively, in which we can open-code
4914      this conversion.  If the integer mode is wider than the mode of TO,
4915      we can do the conversion either signed or unsigned.  */
4916
4917   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4918     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4919       {
4920         int doing_unsigned = unsignedp;
4921
4922         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4923         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4924           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4925
4926         if (icode != CODE_FOR_nothing)
4927           {
4928             rtx_insn *last = get_last_insn ();
4929             if (fmode != GET_MODE (from))
4930               from = convert_to_mode (fmode, from, 0);
4931
4932             if (must_trunc)
4933               {
4934                 rtx temp = gen_reg_rtx (GET_MODE (from));
4935                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4936                                     temp, 0);
4937               }
4938
4939             if (imode != GET_MODE (to))
4940               target = gen_reg_rtx (imode);
4941
4942             if (maybe_emit_unop_insn (icode, target, from,
4943                                       doing_unsigned ? UNSIGNED_FIX : FIX))
4944               {
4945                 if (target != to)
4946                   convert_move (to, target, unsignedp);
4947                 return;
4948               }
4949             delete_insns_since (last);
4950           }
4951       }
4952
4953   /* For an unsigned conversion, there is one more way to do it.
4954      If we have a signed conversion, we generate code that compares
4955      the real value to the largest representable positive number.  If if
4956      is smaller, the conversion is done normally.  Otherwise, subtract
4957      one plus the highest signed number, convert, and add it back.
4958
4959      We only need to check all real modes, since we know we didn't find
4960      anything with a wider integer mode.
4961
4962      This code used to extend FP value into mode wider than the destination.
4963      This is needed for decimal float modes which cannot accurately
4964      represent one plus the highest signed number of the same size, but
4965      not for binary modes.  Consider, for instance conversion from SFmode
4966      into DImode.
4967
4968      The hot path through the code is dealing with inputs smaller than 2^63
4969      and doing just the conversion, so there is no bits to lose.
4970
4971      In the other path we know the value is positive in the range 2^63..2^64-1
4972      inclusive.  (as for other input overflow happens and result is undefined)
4973      So we know that the most important bit set in mantissa corresponds to
4974      2^63.  The subtraction of 2^63 should not generate any rounding as it
4975      simply clears out that bit.  The rest is trivial.  */
4976
4977   scalar_int_mode to_mode;
4978   if (unsignedp
4979       && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
4980       && HWI_COMPUTABLE_MODE_P (to_mode))
4981     FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
4982       {
4983         scalar_mode fmode = fmode_iter.require ();
4984         if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
4985                                            0, &must_trunc)
4986             && (!DECIMAL_FLOAT_MODE_P (fmode)
4987                 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
4988           {
4989             int bitsize;
4990             REAL_VALUE_TYPE offset;
4991             rtx limit;
4992             rtx_code_label *lab1, *lab2;
4993             rtx_insn *insn;
4994
4995             bitsize = GET_MODE_PRECISION (to_mode);
4996             real_2expN (&offset, bitsize - 1, fmode);
4997             limit = const_double_from_real_value (offset, fmode);
4998             lab1 = gen_label_rtx ();
4999             lab2 = gen_label_rtx ();
5000
5001             if (fmode != GET_MODE (from))
5002               from = convert_to_mode (fmode, from, 0);
5003
5004             /* See if we need to do the subtraction.  */
5005             do_pending_stack_adjust ();
5006             emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
5007                                      GET_MODE (from), 0, lab1);
5008
5009             /* If not, do the signed "fix" and branch around fixup code.  */
5010             expand_fix (to, from, 0);
5011             emit_jump_insn (targetm.gen_jump (lab2));
5012             emit_barrier ();
5013
5014             /* Otherwise, subtract 2**(N-1), convert to signed number,
5015                then add 2**(N-1).  Do the addition using XOR since this
5016                will often generate better code.  */
5017             emit_label (lab1);
5018             target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5019                                    NULL_RTX, 0, OPTAB_LIB_WIDEN);
5020             expand_fix (to, target, 0);
5021             target = expand_binop (to_mode, xor_optab, to,
5022                                    gen_int_mode
5023                                    (HOST_WIDE_INT_1 << (bitsize - 1),
5024                                     to_mode),
5025                                    to, 1, OPTAB_LIB_WIDEN);
5026
5027             if (target != to)
5028               emit_move_insn (to, target);
5029
5030             emit_label (lab2);
5031
5032             if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5033               {
5034                 /* Make a place for a REG_NOTE and add it.  */
5035                 insn = emit_move_insn (to, to);
5036                 set_dst_reg_note (insn, REG_EQUAL,
5037                                   gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5038                                                  copy_rtx (from)),
5039                                   to);
5040               }
5041
5042             return;
5043           }
5044       }
5045
5046   /* We can't do it with an insn, so use a library call.  But first ensure
5047      that the mode of TO is at least as wide as SImode, since those are the
5048      only library calls we know about.  */
5049
5050   if (is_narrower_int_mode (GET_MODE (to), SImode))
5051     {
5052       target = gen_reg_rtx (SImode);
5053
5054       expand_fix (target, from, unsignedp);
5055     }
5056   else
5057     {
5058       rtx_insn *insns;
5059       rtx value;
5060       rtx libfunc;
5061
5062       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5063       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5064       gcc_assert (libfunc);
5065
5066       start_sequence ();
5067
5068       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5069                                        GET_MODE (to), from, GET_MODE (from));
5070       insns = get_insns ();
5071       end_sequence ();
5072
5073       emit_libcall_block (insns, target, value,
5074                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5075                                          GET_MODE (to), from));
5076     }
5077
5078   if (target != to)
5079     {
5080       if (GET_MODE (to) == GET_MODE (target))
5081         emit_move_insn (to, target);
5082       else
5083         convert_move (to, target, 0);
5084     }
5085 }
5086
5087
5088 /* Promote integer arguments for a libcall if necessary.
5089    emit_library_call_value cannot do the promotion because it does not
5090    know if it should do a signed or unsigned promotion.  This is because
5091    there are no tree types defined for libcalls.  */
5092
5093 static rtx
5094 prepare_libcall_arg (rtx arg, int uintp)
5095 {
5096   scalar_int_mode mode;
5097   machine_mode arg_mode;
5098   if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5099     {
5100       /*  If we need to promote the integer function argument we need to do
5101           it here instead of inside emit_library_call_value because in
5102           emit_library_call_value we don't know if we should do a signed or
5103           unsigned promotion.  */
5104
5105       int unsigned_p = 0;
5106       arg_mode = promote_function_mode (NULL_TREE, mode,
5107                                         &unsigned_p, NULL_TREE, 0);
5108       if (arg_mode != mode)
5109         return convert_to_mode (arg_mode, arg, uintp);
5110     }
5111     return arg;
5112 }
5113
5114 /* Generate code to convert FROM or TO a fixed-point.
5115    If UINTP is true, either TO or FROM is an unsigned integer.
5116    If SATP is true, we need to saturate the result.  */
5117
5118 void
5119 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5120 {
5121   machine_mode to_mode = GET_MODE (to);
5122   machine_mode from_mode = GET_MODE (from);
5123   convert_optab tab;
5124   enum rtx_code this_code;
5125   enum insn_code code;
5126   rtx_insn *insns;
5127   rtx value;
5128   rtx libfunc;
5129
5130   if (to_mode == from_mode)
5131     {
5132       emit_move_insn (to, from);
5133       return;
5134     }
5135
5136   if (uintp)
5137     {
5138       tab = satp ? satfractuns_optab : fractuns_optab;
5139       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5140     }
5141   else
5142     {
5143       tab = satp ? satfract_optab : fract_optab;
5144       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5145     }
5146   code = convert_optab_handler (tab, to_mode, from_mode);
5147   if (code != CODE_FOR_nothing)
5148     {
5149       emit_unop_insn (code, to, from, this_code);
5150       return;
5151     }
5152
5153   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5154   gcc_assert (libfunc);
5155
5156   from = prepare_libcall_arg (from, uintp);
5157   from_mode = GET_MODE (from);
5158
5159   start_sequence ();
5160   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5161                                    from, from_mode);
5162   insns = get_insns ();
5163   end_sequence ();
5164
5165   emit_libcall_block (insns, to, value,
5166                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5167 }
5168
5169 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5170    must be floating point, TO must be signed.  Use the conversion optab
5171    TAB to do the conversion.  */
5172
5173 bool
5174 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5175 {
5176   enum insn_code icode;
5177   rtx target = to;
5178   machine_mode fmode, imode;
5179
5180   /* We first try to find a pair of modes, one real and one integer, at
5181      least as wide as FROM and TO, respectively, in which we can open-code
5182      this conversion.  If the integer mode is wider than the mode of TO,
5183      we can do the conversion either signed or unsigned.  */
5184
5185   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5186     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5187       {
5188         icode = convert_optab_handler (tab, imode, fmode);
5189         if (icode != CODE_FOR_nothing)
5190           {
5191             rtx_insn *last = get_last_insn ();
5192             if (fmode != GET_MODE (from))
5193               from = convert_to_mode (fmode, from, 0);
5194
5195             if (imode != GET_MODE (to))
5196               target = gen_reg_rtx (imode);
5197
5198             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5199               {
5200                 delete_insns_since (last);
5201                 continue;
5202               }
5203             if (target != to)
5204               convert_move (to, target, 0);
5205             return true;
5206           }
5207       }
5208
5209   return false;
5210 }
5211 \f
5212 /* Report whether we have an instruction to perform the operation
5213    specified by CODE on operands of mode MODE.  */
5214 int
5215 have_insn_for (enum rtx_code code, machine_mode mode)
5216 {
5217   return (code_to_optab (code)
5218           && (optab_handler (code_to_optab (code), mode)
5219               != CODE_FOR_nothing));
5220 }
5221
5222 /* Print information about the current contents of the optabs on
5223    STDERR.  */
5224
5225 DEBUG_FUNCTION void
5226 debug_optab_libfuncs (void)
5227 {
5228   int i, j, k;
5229
5230   /* Dump the arithmetic optabs.  */
5231   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5232     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5233       {
5234         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5235         if (l)
5236           {
5237             gcc_assert (GET_CODE (l) == SYMBOL_REF);
5238             fprintf (stderr, "%s\t%s:\t%s\n",
5239                      GET_RTX_NAME (optab_to_code ((optab) i)),
5240                      GET_MODE_NAME (j),
5241                      XSTR (l, 0));
5242           }
5243       }
5244
5245   /* Dump the conversion optabs.  */
5246   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5247     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5248       for (k = 0; k < NUM_MACHINE_MODES; ++k)
5249         {
5250           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5251                                          (machine_mode) k);
5252           if (l)
5253             {
5254               gcc_assert (GET_CODE (l) == SYMBOL_REF);
5255               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5256                        GET_RTX_NAME (optab_to_code ((optab) i)),
5257                        GET_MODE_NAME (j),
5258                        GET_MODE_NAME (k),
5259                        XSTR (l, 0));
5260             }
5261         }
5262 }
5263
5264 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5265    CODE.  Return 0 on failure.  */
5266
5267 rtx_insn *
5268 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5269 {
5270   machine_mode mode = GET_MODE (op1);
5271   enum insn_code icode;
5272   rtx_insn *insn;
5273   rtx trap_rtx;
5274
5275   if (mode == VOIDmode)
5276     return 0;
5277
5278   icode = optab_handler (ctrap_optab, mode);
5279   if (icode == CODE_FOR_nothing)
5280     return 0;
5281
5282   /* Some targets only accept a zero trap code.  */
5283   if (!insn_operand_matches (icode, 3, tcode))
5284     return 0;
5285
5286   do_pending_stack_adjust ();
5287   start_sequence ();
5288   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5289                     &trap_rtx, &mode);
5290   if (!trap_rtx)
5291     insn = NULL;
5292   else
5293     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5294                             tcode);
5295
5296   /* If that failed, then give up.  */
5297   if (insn == 0)
5298     {
5299       end_sequence ();
5300       return 0;
5301     }
5302
5303   emit_insn (insn);
5304   insn = get_insns ();
5305   end_sequence ();
5306   return insn;
5307 }
5308
5309 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5310    or unsigned operation code.  */
5311
5312 enum rtx_code
5313 get_rtx_code (enum tree_code tcode, bool unsignedp)
5314 {
5315   enum rtx_code code;
5316   switch (tcode)
5317     {
5318     case EQ_EXPR:
5319       code = EQ;
5320       break;
5321     case NE_EXPR:
5322       code = NE;
5323       break;
5324     case LT_EXPR:
5325       code = unsignedp ? LTU : LT;
5326       break;
5327     case LE_EXPR:
5328       code = unsignedp ? LEU : LE;
5329       break;
5330     case GT_EXPR:
5331       code = unsignedp ? GTU : GT;
5332       break;
5333     case GE_EXPR:
5334       code = unsignedp ? GEU : GE;
5335       break;
5336
5337     case UNORDERED_EXPR:
5338       code = UNORDERED;
5339       break;
5340     case ORDERED_EXPR:
5341       code = ORDERED;
5342       break;
5343     case UNLT_EXPR:
5344       code = UNLT;
5345       break;
5346     case UNLE_EXPR:
5347       code = UNLE;
5348       break;
5349     case UNGT_EXPR:
5350       code = UNGT;
5351       break;
5352     case UNGE_EXPR:
5353       code = UNGE;
5354       break;
5355     case UNEQ_EXPR:
5356       code = UNEQ;
5357       break;
5358     case LTGT_EXPR:
5359       code = LTGT;
5360       break;
5361
5362     case BIT_AND_EXPR:
5363       code = AND;
5364       break;
5365
5366     case BIT_IOR_EXPR:
5367       code = IOR;
5368       break;
5369
5370     default:
5371       gcc_unreachable ();
5372     }
5373   return code;
5374 }
5375
5376 /* Return a comparison rtx of mode CMP_MODE for COND.  Use UNSIGNEDP to
5377    select signed or unsigned operators.  OPNO holds the index of the
5378    first comparison operand for insn ICODE.  Do not generate the
5379    compare instruction itself.  */
5380
5381 static rtx
5382 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5383                     tree t_op0, tree t_op1, bool unsignedp,
5384                     enum insn_code icode, unsigned int opno)
5385 {
5386   struct expand_operand ops[2];
5387   rtx rtx_op0, rtx_op1;
5388   machine_mode m0, m1;
5389   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5390
5391   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5392
5393   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
5394      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5395      cases, use the original mode.  */
5396   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5397                          EXPAND_STACK_PARM);
5398   m0 = GET_MODE (rtx_op0);
5399   if (m0 == VOIDmode)
5400     m0 = TYPE_MODE (TREE_TYPE (t_op0));
5401
5402   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5403                          EXPAND_STACK_PARM);
5404   m1 = GET_MODE (rtx_op1);
5405   if (m1 == VOIDmode)
5406     m1 = TYPE_MODE (TREE_TYPE (t_op1));
5407
5408   create_input_operand (&ops[0], rtx_op0, m0);
5409   create_input_operand (&ops[1], rtx_op1, m1);
5410   if (!maybe_legitimize_operands (icode, opno, 2, ops))
5411     gcc_unreachable ();
5412   return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5413 }
5414
5415 /* Check if vec_perm mask SEL is a constant equivalent to a shift of
5416    the first vec_perm operand, assuming the second operand is a constant
5417    vector of zeros.  Return the shift distance in bits if so, or NULL_RTX
5418    if the vec_perm is not a shift.  MODE is the mode of the value being
5419    shifted.  */
5420 static rtx
5421 shift_amt_for_vec_perm_mask (machine_mode mode, const vec_perm_indices &sel)
5422 {
5423   unsigned int bitsize = GET_MODE_UNIT_BITSIZE (mode);
5424   poly_int64 first = sel[0];
5425   if (maybe_ge (sel[0], GET_MODE_NUNITS (mode)))
5426     return NULL_RTX;
5427
5428   if (!sel.series_p (0, 1, first, 1))
5429     {
5430       unsigned int nelt;
5431       if (!GET_MODE_NUNITS (mode).is_constant (&nelt))
5432         return NULL_RTX;
5433       for (unsigned int i = 1; i < nelt; i++)
5434         {
5435           poly_int64 expected = i + first;
5436           /* Indices into the second vector are all equivalent.  */
5437           if (maybe_lt (sel[i], nelt)
5438               ? maybe_ne (sel[i], expected)
5439               : maybe_lt (expected, nelt))
5440             return NULL_RTX;
5441         }
5442     }
5443
5444   return gen_int_shift_amount (mode, first * bitsize);
5445 }
5446
5447 /* A subroutine of expand_vec_perm_var for expanding one vec_perm insn.  */
5448
5449 static rtx
5450 expand_vec_perm_1 (enum insn_code icode, rtx target,
5451                    rtx v0, rtx v1, rtx sel)
5452 {
5453   machine_mode tmode = GET_MODE (target);
5454   machine_mode smode = GET_MODE (sel);
5455   struct expand_operand ops[4];
5456
5457   gcc_assert (GET_MODE_CLASS (smode) == MODE_VECTOR_INT
5458               || mode_for_int_vector (tmode).require () == smode);
5459   create_output_operand (&ops[0], target, tmode);
5460   create_input_operand (&ops[3], sel, smode);
5461
5462   /* Make an effort to preserve v0 == v1.  The target expander is able to
5463      rely on this to determine if we're permuting a single input operand.  */
5464   if (rtx_equal_p (v0, v1))
5465     {
5466       if (!insn_operand_matches (icode, 1, v0))
5467         v0 = force_reg (tmode, v0);
5468       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5469       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5470
5471       create_fixed_operand (&ops[1], v0);
5472       create_fixed_operand (&ops[2], v0);
5473     }
5474   else
5475     {
5476       create_input_operand (&ops[1], v0, tmode);
5477       create_input_operand (&ops[2], v1, tmode);
5478     }
5479
5480   if (maybe_expand_insn (icode, 4, ops))
5481     return ops[0].value;
5482   return NULL_RTX;
5483 }
5484
5485 /* Implement a permutation of vectors v0 and v1 using the permutation
5486    vector in SEL and return the result.  Use TARGET to hold the result
5487    if nonnull and convenient.
5488
5489    MODE is the mode of the vectors being permuted (V0 and V1).  SEL_MODE
5490    is the TYPE_MODE associated with SEL, or BLKmode if SEL isn't known
5491    to have a particular mode.  */
5492
5493 rtx
5494 expand_vec_perm_const (machine_mode mode, rtx v0, rtx v1,
5495                        const vec_perm_builder &sel, machine_mode sel_mode,
5496                        rtx target)
5497 {
5498   if (!target || !register_operand (target, mode))
5499     target = gen_reg_rtx (mode);
5500
5501   /* Set QIMODE to a different vector mode with byte elements.
5502      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
5503   machine_mode qimode;
5504   if (!qimode_for_vec_perm (mode).exists (&qimode))
5505     qimode = VOIDmode;
5506
5507   rtx_insn *last = get_last_insn ();
5508
5509   bool single_arg_p = rtx_equal_p (v0, v1);
5510   /* Always specify two input vectors here and leave the target to handle
5511      cases in which the inputs are equal.  Not all backends can cope with
5512      the single-input representation when testing for a double-input
5513      target instruction.  */
5514   vec_perm_indices indices (sel, 2, GET_MODE_NUNITS (mode));
5515
5516   /* See if this can be handled with a vec_shr.  We only do this if the
5517      second vector is all zeroes.  */
5518   insn_code shift_code = optab_handler (vec_shr_optab, mode);
5519   insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5520                              ? optab_handler (vec_shr_optab, qimode)
5521                              : CODE_FOR_nothing);
5522
5523   if (v1 == CONST0_RTX (GET_MODE (v1))
5524       && (shift_code != CODE_FOR_nothing
5525           || shift_code_qi != CODE_FOR_nothing))
5526     {
5527       rtx shift_amt = shift_amt_for_vec_perm_mask (mode, indices);
5528       if (shift_amt)
5529         {
5530           struct expand_operand ops[3];
5531           if (shift_code != CODE_FOR_nothing)
5532             {
5533               create_output_operand (&ops[0], target, mode);
5534               create_input_operand (&ops[1], v0, mode);
5535               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5536               if (maybe_expand_insn (shift_code, 3, ops))
5537                 return ops[0].value;
5538             }
5539           if (shift_code_qi != CODE_FOR_nothing)
5540             {
5541               rtx tmp = gen_reg_rtx (qimode);
5542               create_output_operand (&ops[0], tmp, qimode);
5543               create_input_operand (&ops[1], gen_lowpart (qimode, v0), qimode);
5544               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5545               if (maybe_expand_insn (shift_code_qi, 3, ops))
5546                 return gen_lowpart (mode, ops[0].value);
5547             }
5548         }
5549     }
5550
5551   if (targetm.vectorize.vec_perm_const != NULL)
5552     {
5553       v0 = force_reg (mode, v0);
5554       if (single_arg_p)
5555         v1 = v0;
5556       else
5557         v1 = force_reg (mode, v1);
5558
5559       if (targetm.vectorize.vec_perm_const (mode, target, v0, v1, indices))
5560         return target;
5561     }
5562
5563   /* Fall back to a constant byte-based permutation.  */
5564   vec_perm_indices qimode_indices;
5565   rtx target_qi = NULL_RTX, v0_qi = NULL_RTX, v1_qi = NULL_RTX;
5566   if (qimode != VOIDmode)
5567     {
5568       qimode_indices.new_expanded_vector (indices, GET_MODE_UNIT_SIZE (mode));
5569       target_qi = gen_reg_rtx (qimode);
5570       v0_qi = gen_lowpart (qimode, v0);
5571       v1_qi = gen_lowpart (qimode, v1);
5572       if (targetm.vectorize.vec_perm_const != NULL
5573           && targetm.vectorize.vec_perm_const (qimode, target_qi, v0_qi,
5574                                                v1_qi, qimode_indices))
5575         return gen_lowpart (mode, target_qi);
5576     }
5577
5578   /* Otherwise expand as a fully variable permuation.  */
5579
5580   /* The optabs are only defined for selectors with the same width
5581      as the values being permuted.  */
5582   machine_mode required_sel_mode;
5583   if (!mode_for_int_vector (mode).exists (&required_sel_mode)
5584       || !VECTOR_MODE_P (required_sel_mode))
5585     {
5586       delete_insns_since (last);
5587       return NULL_RTX;
5588     }
5589
5590   /* We know that it is semantically valid to treat SEL as having SEL_MODE.
5591      If that isn't the mode we want then we need to prove that using
5592      REQUIRED_SEL_MODE is OK.  */
5593   if (sel_mode != required_sel_mode)
5594     {
5595       if (!selector_fits_mode_p (required_sel_mode, indices))
5596         {
5597           delete_insns_since (last);
5598           return NULL_RTX;
5599         }
5600       sel_mode = required_sel_mode;
5601     }
5602
5603   insn_code icode = direct_optab_handler (vec_perm_optab, mode);
5604   if (icode != CODE_FOR_nothing)
5605     {
5606       rtx sel_rtx = vec_perm_indices_to_rtx (sel_mode, indices);
5607       rtx tmp = expand_vec_perm_1 (icode, target, v0, v1, sel_rtx);
5608       if (tmp)
5609         return tmp;
5610     }
5611
5612   if (qimode != VOIDmode
5613       && selector_fits_mode_p (qimode, qimode_indices))
5614     {
5615       icode = direct_optab_handler (vec_perm_optab, qimode);
5616       if (icode != CODE_FOR_nothing)
5617         {
5618           rtx sel_qi = vec_perm_indices_to_rtx (qimode, qimode_indices);
5619           rtx tmp = expand_vec_perm_1 (icode, target_qi, v0_qi, v1_qi, sel_qi);
5620           if (tmp)
5621             return gen_lowpart (mode, tmp);
5622         }
5623     }
5624
5625   delete_insns_since (last);
5626   return NULL_RTX;
5627 }
5628
5629 /* Implement a permutation of vectors v0 and v1 using the permutation
5630    vector in SEL and return the result.  Use TARGET to hold the result
5631    if nonnull and convenient.
5632
5633    MODE is the mode of the vectors being permuted (V0 and V1).
5634    SEL must have the integer equivalent of MODE and is known to be
5635    unsuitable for permutes with a constant permutation vector.  */
5636
5637 rtx
5638 expand_vec_perm_var (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5639 {
5640   enum insn_code icode;
5641   unsigned int i, u;
5642   rtx tmp, sel_qi;
5643
5644   u = GET_MODE_UNIT_SIZE (mode);
5645
5646   if (!target || GET_MODE (target) != mode)
5647     target = gen_reg_rtx (mode);
5648
5649   icode = direct_optab_handler (vec_perm_optab, mode);
5650   if (icode != CODE_FOR_nothing)
5651     {
5652       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5653       if (tmp)
5654         return tmp;
5655     }
5656
5657   /* As a special case to aid several targets, lower the element-based
5658      permutation to a byte-based permutation and try again.  */
5659   machine_mode qimode;
5660   if (!qimode_for_vec_perm (mode).exists (&qimode)
5661       || maybe_gt (GET_MODE_NUNITS (qimode), GET_MODE_MASK (QImode) + 1))
5662     return NULL_RTX;
5663   icode = direct_optab_handler (vec_perm_optab, qimode);
5664   if (icode == CODE_FOR_nothing)
5665     return NULL_RTX;
5666
5667   /* Multiply each element by its byte size.  */
5668   machine_mode selmode = GET_MODE (sel);
5669   if (u == 2)
5670     sel = expand_simple_binop (selmode, PLUS, sel, sel,
5671                                NULL, 0, OPTAB_DIRECT);
5672   else
5673     sel = expand_simple_binop (selmode, ASHIFT, sel,
5674                                gen_int_shift_amount (selmode, exact_log2 (u)),
5675                                NULL, 0, OPTAB_DIRECT);
5676   gcc_assert (sel != NULL);
5677
5678   /* Broadcast the low byte each element into each of its bytes.
5679      The encoding has U interleaved stepped patterns, one for each
5680      byte of an element.  */
5681   vec_perm_builder const_sel (GET_MODE_SIZE (mode), u, 3);
5682   unsigned int low_byte_in_u = BYTES_BIG_ENDIAN ? u - 1 : 0;
5683   for (i = 0; i < 3; ++i)
5684     for (unsigned int j = 0; j < u; ++j)
5685       const_sel.quick_push (i * u + low_byte_in_u);
5686   sel = gen_lowpart (qimode, sel);
5687   sel = expand_vec_perm_const (qimode, sel, sel, const_sel, qimode, NULL);
5688   gcc_assert (sel != NULL);
5689
5690   /* Add the byte offset to each byte element.  */
5691   /* Note that the definition of the indicies here is memory ordering,
5692      so there should be no difference between big and little endian.  */
5693   rtx_vector_builder byte_indices (qimode, u, 1);
5694   for (i = 0; i < u; ++i)
5695     byte_indices.quick_push (GEN_INT (i));
5696   tmp = byte_indices.build ();
5697   sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5698                                 sel, 0, OPTAB_DIRECT);
5699   gcc_assert (sel_qi != NULL);
5700
5701   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5702   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5703                            gen_lowpart (qimode, v1), sel_qi);
5704   if (tmp)
5705     tmp = gen_lowpart (mode, tmp);
5706   return tmp;
5707 }
5708
5709 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5710    three operands.  */
5711
5712 rtx
5713 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5714                            rtx target)
5715 {
5716   struct expand_operand ops[4];
5717   machine_mode mode = TYPE_MODE (vec_cond_type);
5718   machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5719   enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5720   rtx mask, rtx_op1, rtx_op2;
5721
5722   if (icode == CODE_FOR_nothing)
5723     return 0;
5724
5725   mask = expand_normal (op0);
5726   rtx_op1 = expand_normal (op1);
5727   rtx_op2 = expand_normal (op2);
5728
5729   mask = force_reg (mask_mode, mask);
5730   rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5731
5732   create_output_operand (&ops[0], target, mode);
5733   create_input_operand (&ops[1], rtx_op1, mode);
5734   create_input_operand (&ops[2], rtx_op2, mode);
5735   create_input_operand (&ops[3], mask, mask_mode);
5736   expand_insn (icode, 4, ops);
5737
5738   return ops[0].value;
5739 }
5740
5741 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5742    three operands.  */
5743
5744 rtx
5745 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5746                       rtx target)
5747 {
5748   struct expand_operand ops[6];
5749   enum insn_code icode;
5750   rtx comparison, rtx_op1, rtx_op2;
5751   machine_mode mode = TYPE_MODE (vec_cond_type);
5752   machine_mode cmp_op_mode;
5753   bool unsignedp;
5754   tree op0a, op0b;
5755   enum tree_code tcode;
5756
5757   if (COMPARISON_CLASS_P (op0))
5758     {
5759       op0a = TREE_OPERAND (op0, 0);
5760       op0b = TREE_OPERAND (op0, 1);
5761       tcode = TREE_CODE (op0);
5762     }
5763   else
5764     {
5765       gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5766       if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5767           != CODE_FOR_nothing)
5768         return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5769                                           op2, target);
5770       /* Fake op0 < 0.  */
5771       else
5772         {
5773           gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5774                       == MODE_VECTOR_INT);
5775           op0a = op0;
5776           op0b = build_zero_cst (TREE_TYPE (op0));
5777           tcode = LT_EXPR;
5778         }
5779     }
5780   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5781   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5782
5783
5784   gcc_assert (known_eq (GET_MODE_SIZE (mode), GET_MODE_SIZE (cmp_op_mode))
5785               && known_eq (GET_MODE_NUNITS (mode),
5786                            GET_MODE_NUNITS (cmp_op_mode)));
5787
5788   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5789   if (icode == CODE_FOR_nothing)
5790     {
5791       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5792         icode = get_vcond_eq_icode (mode, cmp_op_mode);
5793       if (icode == CODE_FOR_nothing)
5794         return 0;
5795     }
5796
5797   comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5798                                    icode, 4);
5799   rtx_op1 = expand_normal (op1);
5800   rtx_op2 = expand_normal (op2);
5801
5802   create_output_operand (&ops[0], target, mode);
5803   create_input_operand (&ops[1], rtx_op1, mode);
5804   create_input_operand (&ops[2], rtx_op2, mode);
5805   create_fixed_operand (&ops[3], comparison);
5806   create_fixed_operand (&ops[4], XEXP (comparison, 0));
5807   create_fixed_operand (&ops[5], XEXP (comparison, 1));
5808   expand_insn (icode, 6, ops);
5809   return ops[0].value;
5810 }
5811
5812 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
5813    Use TARGET for the result if nonnull and convenient.  */
5814
5815 rtx
5816 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
5817 {
5818   struct expand_operand ops[3];
5819   enum insn_code icode;
5820   machine_mode emode = GET_MODE_INNER (vmode);
5821
5822   icode = direct_optab_handler (vec_series_optab, vmode);
5823   gcc_assert (icode != CODE_FOR_nothing);
5824
5825   create_output_operand (&ops[0], target, vmode);
5826   create_input_operand (&ops[1], op0, emode);
5827   create_input_operand (&ops[2], op1, emode);
5828
5829   expand_insn (icode, 3, ops);
5830   return ops[0].value;
5831 }
5832
5833 /* Generate insns for a vector comparison into a mask.  */
5834
5835 rtx
5836 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5837 {
5838   struct expand_operand ops[4];
5839   enum insn_code icode;
5840   rtx comparison;
5841   machine_mode mask_mode = TYPE_MODE (type);
5842   machine_mode vmode;
5843   bool unsignedp;
5844   tree op0a, op0b;
5845   enum tree_code tcode;
5846
5847   op0a = TREE_OPERAND (exp, 0);
5848   op0b = TREE_OPERAND (exp, 1);
5849   tcode = TREE_CODE (exp);
5850
5851   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5852   vmode = TYPE_MODE (TREE_TYPE (op0a));
5853
5854   icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5855   if (icode == CODE_FOR_nothing)
5856     {
5857       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5858         icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5859       if (icode == CODE_FOR_nothing)
5860         return 0;
5861     }
5862
5863   comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5864                                    unsignedp, icode, 2);
5865   create_output_operand (&ops[0], target, mask_mode);
5866   create_fixed_operand (&ops[1], comparison);
5867   create_fixed_operand (&ops[2], XEXP (comparison, 0));
5868   create_fixed_operand (&ops[3], XEXP (comparison, 1));
5869   expand_insn (icode, 4, ops);
5870   return ops[0].value;
5871 }
5872
5873 /* Expand a highpart multiply.  */
5874
5875 rtx
5876 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5877                       rtx target, bool uns_p)
5878 {
5879   struct expand_operand eops[3];
5880   enum insn_code icode;
5881   int method, i;
5882   machine_mode wmode;
5883   rtx m1, m2;
5884   optab tab1, tab2;
5885
5886   method = can_mult_highpart_p (mode, uns_p);
5887   switch (method)
5888     {
5889     case 0:
5890       return NULL_RTX;
5891     case 1:
5892       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5893       return expand_binop (mode, tab1, op0, op1, target, uns_p,
5894                            OPTAB_LIB_WIDEN);
5895     case 2:
5896       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5897       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5898       break;
5899     case 3:
5900       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5901       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5902       if (BYTES_BIG_ENDIAN)
5903         std::swap (tab1, tab2);
5904       break;
5905     default:
5906       gcc_unreachable ();
5907     }
5908
5909   icode = optab_handler (tab1, mode);
5910   wmode = insn_data[icode].operand[0].mode;
5911   gcc_checking_assert (known_eq (2 * GET_MODE_NUNITS (wmode),
5912                                  GET_MODE_NUNITS (mode)));
5913   gcc_checking_assert (known_eq (GET_MODE_SIZE (wmode), GET_MODE_SIZE (mode)));
5914
5915   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5916   create_input_operand (&eops[1], op0, mode);
5917   create_input_operand (&eops[2], op1, mode);
5918   expand_insn (icode, 3, eops);
5919   m1 = gen_lowpart (mode, eops[0].value);
5920
5921   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5922   create_input_operand (&eops[1], op0, mode);
5923   create_input_operand (&eops[2], op1, mode);
5924   expand_insn (optab_handler (tab2, mode), 3, eops);
5925   m2 = gen_lowpart (mode, eops[0].value);
5926
5927   vec_perm_builder sel;
5928   if (method == 2)
5929     {
5930       /* The encoding has 2 interleaved stepped patterns.  */
5931       sel.new_vector (GET_MODE_NUNITS (mode), 2, 3);
5932       for (i = 0; i < 6; ++i)
5933         sel.quick_push (!BYTES_BIG_ENDIAN + (i & ~1)
5934                         + ((i & 1) ? GET_MODE_NUNITS (mode) : 0));
5935     }
5936   else
5937     {
5938       /* The encoding has a single interleaved stepped pattern.  */
5939       sel.new_vector (GET_MODE_NUNITS (mode), 1, 3);
5940       for (i = 0; i < 3; ++i)
5941         sel.quick_push (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
5942     }
5943
5944   return expand_vec_perm_const (mode, m1, m2, sel, BLKmode, target);
5945 }
5946 \f
5947 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5948    pattern.  */
5949
5950 static void
5951 find_cc_set (rtx x, const_rtx pat, void *data)
5952 {
5953   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5954       && GET_CODE (pat) == SET)
5955     {
5956       rtx *p_cc_reg = (rtx *) data;
5957       gcc_assert (!*p_cc_reg);
5958       *p_cc_reg = x;
5959     }
5960 }
5961
5962 /* This is a helper function for the other atomic operations.  This function
5963    emits a loop that contains SEQ that iterates until a compare-and-swap
5964    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
5965    a set of instructions that takes a value from OLD_REG as an input and
5966    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
5967    set to the current contents of MEM.  After SEQ, a compare-and-swap will
5968    attempt to update MEM with NEW_REG.  The function returns true when the
5969    loop was generated successfully.  */
5970
5971 static bool
5972 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5973 {
5974   machine_mode mode = GET_MODE (mem);
5975   rtx_code_label *label;
5976   rtx cmp_reg, success, oldval;
5977
5978   /* The loop we want to generate looks like
5979
5980         cmp_reg = mem;
5981       label:
5982         old_reg = cmp_reg;
5983         seq;
5984         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5985         if (success)
5986           goto label;
5987
5988      Note that we only do the plain load from memory once.  Subsequent
5989      iterations use the value loaded by the compare-and-swap pattern.  */
5990
5991   label = gen_label_rtx ();
5992   cmp_reg = gen_reg_rtx (mode);
5993
5994   emit_move_insn (cmp_reg, mem);
5995   emit_label (label);
5996   emit_move_insn (old_reg, cmp_reg);
5997   if (seq)
5998     emit_insn (seq);
5999
6000   success = NULL_RTX;
6001   oldval = cmp_reg;
6002   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
6003                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
6004                                        MEMMODEL_RELAXED))
6005     return false;
6006
6007   if (oldval != cmp_reg)
6008     emit_move_insn (cmp_reg, oldval);
6009
6010   /* Mark this jump predicted not taken.  */
6011   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
6012                            GET_MODE (success), 1, label,
6013                            profile_probability::guessed_never ());
6014   return true;
6015 }
6016
6017
6018 /* This function tries to emit an atomic_exchange intruction.  VAL is written
6019    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
6020    using TARGET if possible.  */
6021
6022 static rtx
6023 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6024 {
6025   machine_mode mode = GET_MODE (mem);
6026   enum insn_code icode;
6027
6028   /* If the target supports the exchange directly, great.  */
6029   icode = direct_optab_handler (atomic_exchange_optab, mode);
6030   if (icode != CODE_FOR_nothing)
6031     {
6032       struct expand_operand ops[4];
6033
6034       create_output_operand (&ops[0], target, mode);
6035       create_fixed_operand (&ops[1], mem);
6036       create_input_operand (&ops[2], val, mode);
6037       create_integer_operand (&ops[3], model);
6038       if (maybe_expand_insn (icode, 4, ops))
6039         return ops[0].value;
6040     }
6041
6042   return NULL_RTX;
6043 }
6044
6045 /* This function tries to implement an atomic exchange operation using
6046    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
6047    The previous contents of *MEM are returned, using TARGET if possible.
6048    Since this instructionn is an acquire barrier only, stronger memory
6049    models may require additional barriers to be emitted.  */
6050
6051 static rtx
6052 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
6053                                    enum memmodel model)
6054 {
6055   machine_mode mode = GET_MODE (mem);
6056   enum insn_code icode;
6057   rtx_insn *last_insn = get_last_insn ();
6058
6059   icode = optab_handler (sync_lock_test_and_set_optab, mode);
6060
6061   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
6062      exists, and the memory model is stronger than acquire, add a release
6063      barrier before the instruction.  */
6064
6065   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
6066     expand_mem_thread_fence (model);
6067
6068   if (icode != CODE_FOR_nothing)
6069     {
6070       struct expand_operand ops[3];
6071       create_output_operand (&ops[0], target, mode);
6072       create_fixed_operand (&ops[1], mem);
6073       create_input_operand (&ops[2], val, mode);
6074       if (maybe_expand_insn (icode, 3, ops))
6075         return ops[0].value;
6076     }
6077
6078   /* If an external test-and-set libcall is provided, use that instead of
6079      any external compare-and-swap that we might get from the compare-and-
6080      swap-loop expansion later.  */
6081   if (!can_compare_and_swap_p (mode, false))
6082     {
6083       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
6084       if (libfunc != NULL)
6085         {
6086           rtx addr;
6087
6088           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6089           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6090                                           mode, addr, ptr_mode,
6091                                           val, mode);
6092         }
6093     }
6094
6095   /* If the test_and_set can't be emitted, eliminate any barrier that might
6096      have been emitted.  */
6097   delete_insns_since (last_insn);
6098   return NULL_RTX;
6099 }
6100
6101 /* This function tries to implement an atomic exchange operation using a
6102    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
6103    *MEM are returned, using TARGET if possible.  No memory model is required
6104    since a compare_and_swap loop is seq-cst.  */
6105
6106 static rtx
6107 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6108 {
6109   machine_mode mode = GET_MODE (mem);
6110
6111   if (can_compare_and_swap_p (mode, true))
6112     {
6113       if (!target || !register_operand (target, mode))
6114         target = gen_reg_rtx (mode);
6115       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6116         return target;
6117     }
6118
6119   return NULL_RTX;
6120 }
6121
6122 /* This function tries to implement an atomic test-and-set operation
6123    using the atomic_test_and_set instruction pattern.  A boolean value
6124    is returned from the operation, using TARGET if possible.  */
6125
6126 static rtx
6127 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6128 {
6129   machine_mode pat_bool_mode;
6130   struct expand_operand ops[3];
6131
6132   if (!targetm.have_atomic_test_and_set ())
6133     return NULL_RTX;
6134
6135   /* While we always get QImode from __atomic_test_and_set, we get
6136      other memory modes from __sync_lock_test_and_set.  Note that we
6137      use no endian adjustment here.  This matches the 4.6 behavior
6138      in the Sparc backend.  */
6139   enum insn_code icode = targetm.code_for_atomic_test_and_set;
6140   gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6141   if (GET_MODE (mem) != QImode)
6142     mem = adjust_address_nv (mem, QImode, 0);
6143
6144   pat_bool_mode = insn_data[icode].operand[0].mode;
6145   create_output_operand (&ops[0], target, pat_bool_mode);
6146   create_fixed_operand (&ops[1], mem);
6147   create_integer_operand (&ops[2], model);
6148
6149   if (maybe_expand_insn (icode, 3, ops))
6150     return ops[0].value;
6151   return NULL_RTX;
6152 }
6153
6154 /* This function expands the legacy _sync_lock test_and_set operation which is
6155    generally an atomic exchange.  Some limited targets only allow the
6156    constant 1 to be stored.  This is an ACQUIRE operation.
6157
6158    TARGET is an optional place to stick the return value.
6159    MEM is where VAL is stored.  */
6160
6161 rtx
6162 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6163 {
6164   rtx ret;
6165
6166   /* Try an atomic_exchange first.  */
6167   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6168   if (ret)
6169     return ret;
6170
6171   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6172                                            MEMMODEL_SYNC_ACQUIRE);
6173   if (ret)
6174     return ret;
6175
6176   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6177   if (ret)
6178     return ret;
6179
6180   /* If there are no other options, try atomic_test_and_set if the value
6181      being stored is 1.  */
6182   if (val == const1_rtx)
6183     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6184
6185   return ret;
6186 }
6187
6188 /* This function expands the atomic test_and_set operation:
6189    atomically store a boolean TRUE into MEM and return the previous value.
6190
6191    MEMMODEL is the memory model variant to use.
6192    TARGET is an optional place to stick the return value.  */
6193
6194 rtx
6195 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6196 {
6197   machine_mode mode = GET_MODE (mem);
6198   rtx ret, trueval, subtarget;
6199
6200   ret = maybe_emit_atomic_test_and_set (target, mem, model);
6201   if (ret)
6202     return ret;
6203
6204   /* Be binary compatible with non-default settings of trueval, and different
6205      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
6206      another only has atomic-exchange.  */
6207   if (targetm.atomic_test_and_set_trueval == 1)
6208     {
6209       trueval = const1_rtx;
6210       subtarget = target ? target : gen_reg_rtx (mode);
6211     }
6212   else
6213     {
6214       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6215       subtarget = gen_reg_rtx (mode);
6216     }
6217
6218   /* Try the atomic-exchange optab...  */
6219   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6220
6221   /* ... then an atomic-compare-and-swap loop ... */
6222   if (!ret)
6223     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6224
6225   /* ... before trying the vaguely defined legacy lock_test_and_set. */
6226   if (!ret)
6227     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6228
6229   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6230      things with the value 1.  Thus we try again without trueval.  */
6231   if (!ret && targetm.atomic_test_and_set_trueval != 1)
6232     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6233
6234   /* Failing all else, assume a single threaded environment and simply
6235      perform the operation.  */
6236   if (!ret)
6237     {
6238       /* If the result is ignored skip the move to target.  */
6239       if (subtarget != const0_rtx)
6240         emit_move_insn (subtarget, mem);
6241
6242       emit_move_insn (mem, trueval);
6243       ret = subtarget;
6244     }
6245
6246   /* Recall that have to return a boolean value; rectify if trueval
6247      is not exactly one.  */
6248   if (targetm.atomic_test_and_set_trueval != 1)
6249     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6250
6251   return ret;
6252 }
6253
6254 /* This function expands the atomic exchange operation:
6255    atomically store VAL in MEM and return the previous value in MEM.
6256
6257    MEMMODEL is the memory model variant to use.
6258    TARGET is an optional place to stick the return value.  */
6259
6260 rtx
6261 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6262 {
6263   machine_mode mode = GET_MODE (mem);
6264   rtx ret;
6265
6266   /* If loads are not atomic for the required size and we are not called to
6267      provide a __sync builtin, do not do anything so that we stay consistent
6268      with atomic loads of the same size.  */
6269   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6270     return NULL_RTX;
6271
6272   ret = maybe_emit_atomic_exchange (target, mem, val, model);
6273
6274   /* Next try a compare-and-swap loop for the exchange.  */
6275   if (!ret)
6276     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6277
6278   return ret;
6279 }
6280
6281 /* This function expands the atomic compare exchange operation:
6282
6283    *PTARGET_BOOL is an optional place to store the boolean success/failure.
6284    *PTARGET_OVAL is an optional place to store the old value from memory.
6285    Both target parameters may be NULL or const0_rtx to indicate that we do
6286    not care about that return value.  Both target parameters are updated on
6287    success to the actual location of the corresponding result.
6288
6289    MEMMODEL is the memory model variant to use.
6290
6291    The return value of the function is true for success.  */
6292
6293 bool
6294 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6295                                 rtx mem, rtx expected, rtx desired,
6296                                 bool is_weak, enum memmodel succ_model,
6297                                 enum memmodel fail_model)
6298 {
6299   machine_mode mode = GET_MODE (mem);
6300   struct expand_operand ops[8];
6301   enum insn_code icode;
6302   rtx target_oval, target_bool = NULL_RTX;
6303   rtx libfunc;
6304
6305   /* If loads are not atomic for the required size and we are not called to
6306      provide a __sync builtin, do not do anything so that we stay consistent
6307      with atomic loads of the same size.  */
6308   if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6309     return false;
6310
6311   /* Load expected into a register for the compare and swap.  */
6312   if (MEM_P (expected))
6313     expected = copy_to_reg (expected);
6314
6315   /* Make sure we always have some place to put the return oldval.
6316      Further, make sure that place is distinct from the input expected,
6317      just in case we need that path down below.  */
6318   if (ptarget_oval && *ptarget_oval == const0_rtx)
6319     ptarget_oval = NULL;
6320
6321   if (ptarget_oval == NULL
6322       || (target_oval = *ptarget_oval) == NULL
6323       || reg_overlap_mentioned_p (expected, target_oval))
6324     target_oval = gen_reg_rtx (mode);
6325
6326   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6327   if (icode != CODE_FOR_nothing)
6328     {
6329       machine_mode bool_mode = insn_data[icode].operand[0].mode;
6330
6331       if (ptarget_bool && *ptarget_bool == const0_rtx)
6332         ptarget_bool = NULL;
6333
6334       /* Make sure we always have a place for the bool operand.  */
6335       if (ptarget_bool == NULL
6336           || (target_bool = *ptarget_bool) == NULL
6337           || GET_MODE (target_bool) != bool_mode)
6338         target_bool = gen_reg_rtx (bool_mode);
6339
6340       /* Emit the compare_and_swap.  */
6341       create_output_operand (&ops[0], target_bool, bool_mode);
6342       create_output_operand (&ops[1], target_oval, mode);
6343       create_fixed_operand (&ops[2], mem);
6344       create_input_operand (&ops[3], expected, mode);
6345       create_input_operand (&ops[4], desired, mode);
6346       create_integer_operand (&ops[5], is_weak);
6347       create_integer_operand (&ops[6], succ_model);
6348       create_integer_operand (&ops[7], fail_model);
6349       if (maybe_expand_insn (icode, 8, ops))
6350         {
6351           /* Return success/failure.  */
6352           target_bool = ops[0].value;
6353           target_oval = ops[1].value;
6354           goto success;
6355         }
6356     }
6357
6358   /* Otherwise fall back to the original __sync_val_compare_and_swap
6359      which is always seq-cst.  */
6360   icode = optab_handler (sync_compare_and_swap_optab, mode);
6361   if (icode != CODE_FOR_nothing)
6362     {
6363       rtx cc_reg;
6364
6365       create_output_operand (&ops[0], target_oval, mode);
6366       create_fixed_operand (&ops[1], mem);
6367       create_input_operand (&ops[2], expected, mode);
6368       create_input_operand (&ops[3], desired, mode);
6369       if (!maybe_expand_insn (icode, 4, ops))
6370         return false;
6371
6372       target_oval = ops[0].value;
6373
6374       /* If the caller isn't interested in the boolean return value,
6375          skip the computation of it.  */
6376       if (ptarget_bool == NULL)
6377         goto success;
6378
6379       /* Otherwise, work out if the compare-and-swap succeeded.  */
6380       cc_reg = NULL_RTX;
6381       if (have_insn_for (COMPARE, CCmode))
6382         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6383       if (cc_reg)
6384         {
6385           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6386                                                const0_rtx, VOIDmode, 0, 1);
6387           goto success;
6388         }
6389       goto success_bool_from_val;
6390     }
6391
6392   /* Also check for library support for __sync_val_compare_and_swap.  */
6393   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6394   if (libfunc != NULL)
6395     {
6396       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6397       rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6398                                             mode, addr, ptr_mode,
6399                                             expected, mode, desired, mode);
6400       emit_move_insn (target_oval, target);
6401
6402       /* Compute the boolean return value only if requested.  */
6403       if (ptarget_bool)
6404         goto success_bool_from_val;
6405       else
6406         goto success;
6407     }
6408
6409   /* Failure.  */
6410   return false;
6411
6412  success_bool_from_val:
6413    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6414                                         expected, VOIDmode, 1, 1);
6415  success:
6416   /* Make sure that the oval output winds up where the caller asked.  */
6417   if (ptarget_oval)
6418     *ptarget_oval = target_oval;
6419   if (ptarget_bool)
6420     *ptarget_bool = target_bool;
6421   return true;
6422 }
6423
6424 /* Generate asm volatile("" : : : "memory") as the memory blockage.  */
6425
6426 static void
6427 expand_asm_memory_blockage (void)
6428 {
6429   rtx asm_op, clob;
6430
6431   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6432                                  rtvec_alloc (0), rtvec_alloc (0),
6433                                  rtvec_alloc (0), UNKNOWN_LOCATION);
6434   MEM_VOLATILE_P (asm_op) = 1;
6435
6436   clob = gen_rtx_SCRATCH (VOIDmode);
6437   clob = gen_rtx_MEM (BLKmode, clob);
6438   clob = gen_rtx_CLOBBER (VOIDmode, clob);
6439
6440   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6441 }
6442
6443 /* Do not propagate memory accesses across this point.  */
6444
6445 static void
6446 expand_memory_blockage (void)
6447 {
6448   if (targetm.have_memory_blockage ())
6449     emit_insn (targetm.gen_memory_blockage ());
6450   else
6451     expand_asm_memory_blockage ();
6452 }
6453
6454 /* This routine will either emit the mem_thread_fence pattern or issue a
6455    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6456
6457 void
6458 expand_mem_thread_fence (enum memmodel model)
6459 {
6460   if (is_mm_relaxed (model))
6461     return;
6462   if (targetm.have_mem_thread_fence ())
6463     {
6464       emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6465       expand_memory_blockage ();
6466     }
6467   else if (targetm.have_memory_barrier ())
6468     emit_insn (targetm.gen_memory_barrier ());
6469   else if (synchronize_libfunc != NULL_RTX)
6470     emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
6471   else
6472     expand_memory_blockage ();
6473 }
6474
6475 /* Emit a signal fence with given memory model.  */
6476
6477 void
6478 expand_mem_signal_fence (enum memmodel model)
6479 {
6480   /* No machine barrier is required to implement a signal fence, but
6481      a compiler memory barrier must be issued, except for relaxed MM.  */
6482   if (!is_mm_relaxed (model))
6483     expand_memory_blockage ();
6484 }
6485
6486 /* This function expands the atomic load operation:
6487    return the atomically loaded value in MEM.
6488
6489    MEMMODEL is the memory model variant to use.
6490    TARGET is an option place to stick the return value.  */
6491
6492 rtx
6493 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6494 {
6495   machine_mode mode = GET_MODE (mem);
6496   enum insn_code icode;
6497
6498   /* If the target supports the load directly, great.  */
6499   icode = direct_optab_handler (atomic_load_optab, mode);
6500   if (icode != CODE_FOR_nothing)
6501     {
6502       struct expand_operand ops[3];
6503       rtx_insn *last = get_last_insn ();
6504       if (is_mm_seq_cst (model))
6505         expand_memory_blockage ();
6506
6507       create_output_operand (&ops[0], target, mode);
6508       create_fixed_operand (&ops[1], mem);
6509       create_integer_operand (&ops[2], model);
6510       if (maybe_expand_insn (icode, 3, ops))
6511         {
6512           if (!is_mm_relaxed (model))
6513             expand_memory_blockage ();
6514           return ops[0].value;
6515         }
6516       delete_insns_since (last);
6517     }
6518
6519   /* If the size of the object is greater than word size on this target,
6520      then we assume that a load will not be atomic.  We could try to
6521      emulate a load with a compare-and-swap operation, but the store that
6522      doing this could result in would be incorrect if this is a volatile
6523      atomic load or targetting read-only-mapped memory.  */
6524   if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
6525     /* If there is no atomic load, leave the library call.  */
6526     return NULL_RTX;
6527
6528   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
6529   if (!target || target == const0_rtx)
6530     target = gen_reg_rtx (mode);
6531
6532   /* For SEQ_CST, emit a barrier before the load.  */
6533   if (is_mm_seq_cst (model))
6534     expand_mem_thread_fence (model);
6535
6536   emit_move_insn (target, mem);
6537
6538   /* Emit the appropriate barrier after the load.  */
6539   expand_mem_thread_fence (model);
6540
6541   return target;
6542 }
6543
6544 /* This function expands the atomic store operation:
6545    Atomically store VAL in MEM.
6546    MEMMODEL is the memory model variant to use.
6547    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
6548    function returns const0_rtx if a pattern was emitted.  */
6549
6550 rtx
6551 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6552 {
6553   machine_mode mode = GET_MODE (mem);
6554   enum insn_code icode;
6555   struct expand_operand ops[3];
6556
6557   /* If the target supports the store directly, great.  */
6558   icode = direct_optab_handler (atomic_store_optab, mode);
6559   if (icode != CODE_FOR_nothing)
6560     {
6561       rtx_insn *last = get_last_insn ();
6562       if (!is_mm_relaxed (model))
6563         expand_memory_blockage ();
6564       create_fixed_operand (&ops[0], mem);
6565       create_input_operand (&ops[1], val, mode);
6566       create_integer_operand (&ops[2], model);
6567       if (maybe_expand_insn (icode, 3, ops))
6568         {
6569           if (is_mm_seq_cst (model))
6570             expand_memory_blockage ();
6571           return const0_rtx;
6572         }
6573       delete_insns_since (last);
6574     }
6575
6576   /* If using __sync_lock_release is a viable alternative, try it.
6577      Note that this will not be set to true if we are expanding a generic
6578      __atomic_store_n.  */
6579   if (use_release)
6580     {
6581       icode = direct_optab_handler (sync_lock_release_optab, mode);
6582       if (icode != CODE_FOR_nothing)
6583         {
6584           create_fixed_operand (&ops[0], mem);
6585           create_input_operand (&ops[1], const0_rtx, mode);
6586           if (maybe_expand_insn (icode, 2, ops))
6587             {
6588               /* lock_release is only a release barrier.  */
6589               if (is_mm_seq_cst (model))
6590                 expand_mem_thread_fence (model);
6591               return const0_rtx;
6592             }
6593         }
6594     }
6595
6596   /* If the size of the object is greater than word size on this target,
6597      a default store will not be atomic.  */
6598   if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
6599     {
6600       /* If loads are atomic or we are called to provide a __sync builtin,
6601          we can try a atomic_exchange and throw away the result.  Otherwise,
6602          don't do anything so that we do not create an inconsistency between
6603          loads and stores.  */
6604       if (can_atomic_load_p (mode) || is_mm_sync (model))
6605         {
6606           rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6607           if (!target)
6608             target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6609                                                                 val);
6610           if (target)
6611             return const0_rtx;
6612         }
6613         return NULL_RTX;
6614     }
6615
6616   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
6617   expand_mem_thread_fence (model);
6618
6619   emit_move_insn (mem, val);
6620
6621   /* For SEQ_CST, also emit a barrier after the store.  */
6622   if (is_mm_seq_cst (model))
6623     expand_mem_thread_fence (model);
6624
6625   return const0_rtx;
6626 }
6627
6628
6629 /* Structure containing the pointers and values required to process the
6630    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
6631
6632 struct atomic_op_functions
6633 {
6634   direct_optab mem_fetch_before;
6635   direct_optab mem_fetch_after;
6636   direct_optab mem_no_result;
6637   optab fetch_before;
6638   optab fetch_after;
6639   direct_optab no_result;
6640   enum rtx_code reverse_code;
6641 };
6642
6643
6644 /* Fill in structure pointed to by OP with the various optab entries for an
6645    operation of type CODE.  */
6646
6647 static void
6648 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6649 {
6650   gcc_assert (op!= NULL);
6651
6652   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6653      in the source code during compilation, and the optab entries are not
6654      computable until runtime.  Fill in the values at runtime.  */
6655   switch (code)
6656     {
6657     case PLUS:
6658       op->mem_fetch_before = atomic_fetch_add_optab;
6659       op->mem_fetch_after = atomic_add_fetch_optab;
6660       op->mem_no_result = atomic_add_optab;
6661       op->fetch_before = sync_old_add_optab;
6662       op->fetch_after = sync_new_add_optab;
6663       op->no_result = sync_add_optab;
6664       op->reverse_code = MINUS;
6665       break;
6666     case MINUS:
6667       op->mem_fetch_before = atomic_fetch_sub_optab;
6668       op->mem_fetch_after = atomic_sub_fetch_optab;
6669       op->mem_no_result = atomic_sub_optab;
6670       op->fetch_before = sync_old_sub_optab;
6671       op->fetch_after = sync_new_sub_optab;
6672       op->no_result = sync_sub_optab;
6673       op->reverse_code = PLUS;
6674       break;
6675     case XOR:
6676       op->mem_fetch_before = atomic_fetch_xor_optab;
6677       op->mem_fetch_after = atomic_xor_fetch_optab;
6678       op->mem_no_result = atomic_xor_optab;
6679       op->fetch_before = sync_old_xor_optab;
6680       op->fetch_after = sync_new_xor_optab;
6681       op->no_result = sync_xor_optab;
6682       op->reverse_code = XOR;
6683       break;
6684     case AND:
6685       op->mem_fetch_before = atomic_fetch_and_optab;
6686       op->mem_fetch_after = atomic_and_fetch_optab;
6687       op->mem_no_result = atomic_and_optab;
6688       op->fetch_before = sync_old_and_optab;
6689       op->fetch_after = sync_new_and_optab;
6690       op->no_result = sync_and_optab;
6691       op->reverse_code = UNKNOWN;
6692       break;
6693     case IOR:
6694       op->mem_fetch_before = atomic_fetch_or_optab;
6695       op->mem_fetch_after = atomic_or_fetch_optab;
6696       op->mem_no_result = atomic_or_optab;
6697       op->fetch_before = sync_old_ior_optab;
6698       op->fetch_after = sync_new_ior_optab;
6699       op->no_result = sync_ior_optab;
6700       op->reverse_code = UNKNOWN;
6701       break;
6702     case NOT:
6703       op->mem_fetch_before = atomic_fetch_nand_optab;
6704       op->mem_fetch_after = atomic_nand_fetch_optab;
6705       op->mem_no_result = atomic_nand_optab;
6706       op->fetch_before = sync_old_nand_optab;
6707       op->fetch_after = sync_new_nand_optab;
6708       op->no_result = sync_nand_optab;
6709       op->reverse_code = UNKNOWN;
6710       break;
6711     default:
6712       gcc_unreachable ();
6713     }
6714 }
6715
6716 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
6717    using memory order MODEL.  If AFTER is true the operation needs to return
6718    the value of *MEM after the operation, otherwise the previous value.
6719    TARGET is an optional place to place the result.  The result is unused if
6720    it is const0_rtx.
6721    Return the result if there is a better sequence, otherwise NULL_RTX.  */
6722
6723 static rtx
6724 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6725                          enum memmodel model, bool after)
6726 {
6727   /* If the value is prefetched, or not used, it may be possible to replace
6728      the sequence with a native exchange operation.  */
6729   if (!after || target == const0_rtx)
6730     {
6731       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
6732       if (code == AND && val == const0_rtx)
6733         {
6734           if (target == const0_rtx)
6735             target = gen_reg_rtx (GET_MODE (mem));
6736           return maybe_emit_atomic_exchange (target, mem, val, model);
6737         }
6738
6739       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
6740       if (code == IOR && val == constm1_rtx)
6741         {
6742           if (target == const0_rtx)
6743             target = gen_reg_rtx (GET_MODE (mem));
6744           return maybe_emit_atomic_exchange (target, mem, val, model);
6745         }
6746     }
6747
6748   return NULL_RTX;
6749 }
6750
6751 /* Try to emit an instruction for a specific operation varaition.
6752    OPTAB contains the OP functions.
6753    TARGET is an optional place to return the result. const0_rtx means unused.
6754    MEM is the memory location to operate on.
6755    VAL is the value to use in the operation.
6756    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6757    MODEL is the memory model, if used.
6758    AFTER is true if the returned result is the value after the operation.  */
6759
6760 static rtx
6761 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6762                rtx val, bool use_memmodel, enum memmodel model, bool after)
6763 {
6764   machine_mode mode = GET_MODE (mem);
6765   struct expand_operand ops[4];
6766   enum insn_code icode;
6767   int op_counter = 0;
6768   int num_ops;
6769
6770   /* Check to see if there is a result returned.  */
6771   if (target == const0_rtx)
6772     {
6773       if (use_memmodel)
6774         {
6775           icode = direct_optab_handler (optab->mem_no_result, mode);
6776           create_integer_operand (&ops[2], model);
6777           num_ops = 3;
6778         }
6779       else
6780         {
6781           icode = direct_optab_handler (optab->no_result, mode);
6782           num_ops = 2;
6783         }
6784     }
6785   /* Otherwise, we need to generate a result.  */
6786   else
6787     {
6788       if (use_memmodel)
6789         {
6790           icode = direct_optab_handler (after ? optab->mem_fetch_after
6791                                         : optab->mem_fetch_before, mode);
6792           create_integer_operand (&ops[3], model);
6793           num_ops = 4;
6794         }
6795       else
6796         {
6797           icode = optab_handler (after ? optab->fetch_after
6798                                  : optab->fetch_before, mode);
6799           num_ops = 3;
6800         }
6801       create_output_operand (&ops[op_counter++], target, mode);
6802     }
6803   if (icode == CODE_FOR_nothing)
6804     return NULL_RTX;
6805
6806   create_fixed_operand (&ops[op_counter++], mem);
6807   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
6808   create_convert_operand_to (&ops[op_counter++], val, mode, true);
6809
6810   if (maybe_expand_insn (icode, num_ops, ops))
6811     return (target == const0_rtx ? const0_rtx : ops[0].value);
6812
6813   return NULL_RTX;
6814 }
6815
6816
6817 /* This function expands an atomic fetch_OP or OP_fetch operation:
6818    TARGET is an option place to stick the return value.  const0_rtx indicates
6819    the result is unused.
6820    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6821    CODE is the operation being performed (OP)
6822    MEMMODEL is the memory model variant to use.
6823    AFTER is true to return the result of the operation (OP_fetch).
6824    AFTER is false to return the value before the operation (fetch_OP).
6825
6826    This function will *only* generate instructions if there is a direct
6827    optab. No compare and swap loops or libcalls will be generated. */
6828
6829 static rtx
6830 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6831                                     enum rtx_code code, enum memmodel model,
6832                                     bool after)
6833 {
6834   machine_mode mode = GET_MODE (mem);
6835   struct atomic_op_functions optab;
6836   rtx result;
6837   bool unused_result = (target == const0_rtx);
6838
6839   get_atomic_op_for_code (&optab, code);
6840
6841   /* Check to see if there are any better instructions.  */
6842   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6843   if (result)
6844     return result;
6845
6846   /* Check for the case where the result isn't used and try those patterns.  */
6847   if (unused_result)
6848     {
6849       /* Try the memory model variant first.  */
6850       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6851       if (result)
6852         return result;
6853
6854       /* Next try the old style withuot a memory model.  */
6855       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6856       if (result)
6857         return result;
6858
6859       /* There is no no-result pattern, so try patterns with a result.  */
6860       target = NULL_RTX;
6861     }
6862
6863   /* Try the __atomic version.  */
6864   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6865   if (result)
6866     return result;
6867
6868   /* Try the older __sync version.  */
6869   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6870   if (result)
6871     return result;
6872
6873   /* If the fetch value can be calculated from the other variation of fetch,
6874      try that operation.  */
6875   if (after || unused_result || optab.reverse_code != UNKNOWN)
6876     {
6877       /* Try the __atomic version, then the older __sync version.  */
6878       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6879       if (!result)
6880         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6881
6882       if (result)
6883         {
6884           /* If the result isn't used, no need to do compensation code.  */
6885           if (unused_result)
6886             return result;
6887
6888           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
6889              Fetch_before == after REVERSE_OP val.  */
6890           if (!after)
6891             code = optab.reverse_code;
6892           if (code == NOT)
6893             {
6894               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6895                                             true, OPTAB_LIB_WIDEN);
6896               result = expand_simple_unop (mode, NOT, result, target, true);
6897             }
6898           else
6899             result = expand_simple_binop (mode, code, result, val, target,
6900                                           true, OPTAB_LIB_WIDEN);
6901           return result;
6902         }
6903     }
6904
6905   /* No direct opcode can be generated.  */
6906   return NULL_RTX;
6907 }
6908
6909
6910
6911 /* This function expands an atomic fetch_OP or OP_fetch operation:
6912    TARGET is an option place to stick the return value.  const0_rtx indicates
6913    the result is unused.
6914    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6915    CODE is the operation being performed (OP)
6916    MEMMODEL is the memory model variant to use.
6917    AFTER is true to return the result of the operation (OP_fetch).
6918    AFTER is false to return the value before the operation (fetch_OP).  */
6919 rtx
6920 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6921                         enum memmodel model, bool after)
6922 {
6923   machine_mode mode = GET_MODE (mem);
6924   rtx result;
6925   bool unused_result = (target == const0_rtx);
6926
6927   /* If loads are not atomic for the required size and we are not called to
6928      provide a __sync builtin, do not do anything so that we stay consistent
6929      with atomic loads of the same size.  */
6930   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6931     return NULL_RTX;
6932
6933   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6934                                                after);
6935
6936   if (result)
6937     return result;
6938
6939   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
6940   if (code == PLUS || code == MINUS)
6941     {
6942       rtx tmp;
6943       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6944
6945       start_sequence ();
6946       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6947       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6948                                                    model, after);
6949       if (result)
6950         {
6951           /* PLUS worked so emit the insns and return.  */
6952           tmp = get_insns ();
6953           end_sequence ();
6954           emit_insn (tmp);
6955           return result;
6956         }
6957
6958       /* PLUS did not work, so throw away the negation code and continue.  */
6959       end_sequence ();
6960     }
6961
6962   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
6963   if (!can_compare_and_swap_p (mode, false))
6964     {
6965       rtx libfunc;
6966       bool fixup = false;
6967       enum rtx_code orig_code = code;
6968       struct atomic_op_functions optab;
6969
6970       get_atomic_op_for_code (&optab, code);
6971       libfunc = optab_libfunc (after ? optab.fetch_after
6972                                : optab.fetch_before, mode);
6973       if (libfunc == NULL
6974           && (after || unused_result || optab.reverse_code != UNKNOWN))
6975         {
6976           fixup = true;
6977           if (!after)
6978             code = optab.reverse_code;
6979           libfunc = optab_libfunc (after ? optab.fetch_before
6980                                    : optab.fetch_after, mode);
6981         }
6982       if (libfunc != NULL)
6983         {
6984           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6985           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6986                                             addr, ptr_mode, val, mode);
6987
6988           if (!unused_result && fixup)
6989             result = expand_simple_binop (mode, code, result, val, target,
6990                                           true, OPTAB_LIB_WIDEN);
6991           return result;
6992         }
6993
6994       /* We need the original code for any further attempts.  */
6995       code = orig_code;
6996     }
6997
6998   /* If nothing else has succeeded, default to a compare and swap loop.  */
6999   if (can_compare_and_swap_p (mode, true))
7000     {
7001       rtx_insn *insn;
7002       rtx t0 = gen_reg_rtx (mode), t1;
7003
7004       start_sequence ();
7005
7006       /* If the result is used, get a register for it.  */
7007       if (!unused_result)
7008         {
7009           if (!target || !register_operand (target, mode))
7010             target = gen_reg_rtx (mode);
7011           /* If fetch_before, copy the value now.  */
7012           if (!after)
7013             emit_move_insn (target, t0);
7014         }
7015       else
7016         target = const0_rtx;
7017
7018       t1 = t0;
7019       if (code == NOT)
7020         {
7021           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
7022                                     true, OPTAB_LIB_WIDEN);
7023           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
7024         }
7025       else
7026         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
7027                                   OPTAB_LIB_WIDEN);
7028
7029       /* For after, copy the value now.  */
7030       if (!unused_result && after)
7031         emit_move_insn (target, t1);
7032       insn = get_insns ();
7033       end_sequence ();
7034
7035       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
7036         return target;
7037     }
7038
7039   return NULL_RTX;
7040 }
7041 \f
7042 /* Return true if OPERAND is suitable for operand number OPNO of
7043    instruction ICODE.  */
7044
7045 bool
7046 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
7047 {
7048   return (!insn_data[(int) icode].operand[opno].predicate
7049           || (insn_data[(int) icode].operand[opno].predicate
7050               (operand, insn_data[(int) icode].operand[opno].mode)));
7051 }
7052 \f
7053 /* TARGET is a target of a multiword operation that we are going to
7054    implement as a series of word-mode operations.  Return true if
7055    TARGET is suitable for this purpose.  */
7056
7057 bool
7058 valid_multiword_target_p (rtx target)
7059 {
7060   machine_mode mode;
7061   int i, size;
7062
7063   mode = GET_MODE (target);
7064   if (!GET_MODE_SIZE (mode).is_constant (&size))
7065     return false;
7066   for (i = 0; i < size; i += UNITS_PER_WORD)
7067     if (!validate_subreg (word_mode, mode, target, i))
7068       return false;
7069   return true;
7070 }
7071
7072 /* Make OP describe an input operand that has value INTVAL and that has
7073    no inherent mode.  This function should only be used for operands that
7074    are always expand-time constants.  The backend may request that INTVAL
7075    be copied into a different kind of rtx, but it must specify the mode
7076    of that rtx if so.  */
7077
7078 void
7079 create_integer_operand (struct expand_operand *op, poly_int64 intval)
7080 {
7081   create_expand_operand (op, EXPAND_INTEGER,
7082                          gen_int_mode (intval, MAX_MODE_INT),
7083                          VOIDmode, false, intval);
7084 }
7085
7086 /* Like maybe_legitimize_operand, but do not change the code of the
7087    current rtx value.  */
7088
7089 static bool
7090 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7091                                     struct expand_operand *op)
7092 {
7093   /* See if the operand matches in its current form.  */
7094   if (insn_operand_matches (icode, opno, op->value))
7095     return true;
7096
7097   /* If the operand is a memory whose address has no side effects,
7098      try forcing the address into a non-virtual pseudo register.
7099      The check for side effects is important because copy_to_mode_reg
7100      cannot handle things like auto-modified addresses.  */
7101   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7102     {
7103       rtx addr, mem;
7104
7105       mem = op->value;
7106       addr = XEXP (mem, 0);
7107       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7108           && !side_effects_p (addr))
7109         {
7110           rtx_insn *last;
7111           machine_mode mode;
7112
7113           last = get_last_insn ();
7114           mode = get_address_mode (mem);
7115           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
7116           if (insn_operand_matches (icode, opno, mem))
7117             {
7118               op->value = mem;
7119               return true;
7120             }
7121           delete_insns_since (last);
7122         }
7123     }
7124
7125   return false;
7126 }
7127
7128 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
7129    on success, storing the new operand value back in OP.  */
7130
7131 static bool
7132 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
7133                           struct expand_operand *op)
7134 {
7135   machine_mode mode, imode;
7136   bool old_volatile_ok, result;
7137
7138   mode = op->mode;
7139   switch (op->type)
7140     {
7141     case EXPAND_FIXED:
7142       old_volatile_ok = volatile_ok;
7143       volatile_ok = true;
7144       result = maybe_legitimize_operand_same_code (icode, opno, op);
7145       volatile_ok = old_volatile_ok;
7146       return result;
7147
7148     case EXPAND_OUTPUT:
7149       gcc_assert (mode != VOIDmode);
7150       if (op->value
7151           && op->value != const0_rtx
7152           && GET_MODE (op->value) == mode
7153           && maybe_legitimize_operand_same_code (icode, opno, op))
7154         return true;
7155
7156       op->value = gen_reg_rtx (mode);
7157       op->target = 0;
7158       break;
7159
7160     case EXPAND_INPUT:
7161     input:
7162       gcc_assert (mode != VOIDmode);
7163       gcc_assert (GET_MODE (op->value) == VOIDmode
7164                   || GET_MODE (op->value) == mode);
7165       if (maybe_legitimize_operand_same_code (icode, opno, op))
7166         return true;
7167
7168       op->value = copy_to_mode_reg (mode, op->value);
7169       break;
7170
7171     case EXPAND_CONVERT_TO:
7172       gcc_assert (mode != VOIDmode);
7173       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
7174       goto input;
7175
7176     case EXPAND_CONVERT_FROM:
7177       if (GET_MODE (op->value) != VOIDmode)
7178         mode = GET_MODE (op->value);
7179       else
7180         /* The caller must tell us what mode this value has.  */
7181         gcc_assert (mode != VOIDmode);
7182
7183       imode = insn_data[(int) icode].operand[opno].mode;
7184       if (imode != VOIDmode && imode != mode)
7185         {
7186           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
7187           mode = imode;
7188         }
7189       goto input;
7190
7191     case EXPAND_ADDRESS:
7192       op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
7193                                           op->value);
7194       goto input;
7195
7196     case EXPAND_INTEGER:
7197       mode = insn_data[(int) icode].operand[opno].mode;
7198       if (mode != VOIDmode
7199           && known_eq (trunc_int_for_mode (op->int_value, mode),
7200                        op->int_value))
7201         {
7202           op->value = gen_int_mode (op->int_value, mode);
7203           goto input;
7204         }
7205       break;
7206     }
7207   return insn_operand_matches (icode, opno, op->value);
7208 }
7209
7210 /* Make OP describe an input operand that should have the same value
7211    as VALUE, after any mode conversion that the target might request.
7212    TYPE is the type of VALUE.  */
7213
7214 void
7215 create_convert_operand_from_type (struct expand_operand *op,
7216                                   rtx value, tree type)
7217 {
7218   create_convert_operand_from (op, value, TYPE_MODE (type),
7219                                TYPE_UNSIGNED (type));
7220 }
7221
7222 /* Return true if the requirements on operands OP1 and OP2 of instruction
7223    ICODE are similar enough for the result of legitimizing OP1 to be
7224    reusable for OP2.  OPNO1 and OPNO2 are the operand numbers associated
7225    with OP1 and OP2 respectively.  */
7226
7227 static inline bool
7228 can_reuse_operands_p (enum insn_code icode,
7229                       unsigned int opno1, unsigned int opno2,
7230                       const struct expand_operand *op1,
7231                       const struct expand_operand *op2)
7232 {
7233   /* Check requirements that are common to all types.  */
7234   if (op1->type != op2->type
7235       || op1->mode != op2->mode
7236       || (insn_data[(int) icode].operand[opno1].mode
7237           != insn_data[(int) icode].operand[opno2].mode))
7238     return false;
7239
7240   /* Check the requirements for specific types.  */
7241   switch (op1->type)
7242     {
7243     case EXPAND_OUTPUT:
7244       /* Outputs must remain distinct.  */
7245       return false;
7246
7247     case EXPAND_FIXED:
7248     case EXPAND_INPUT:
7249     case EXPAND_ADDRESS:
7250     case EXPAND_INTEGER:
7251       return true;
7252
7253     case EXPAND_CONVERT_TO:
7254     case EXPAND_CONVERT_FROM:
7255       return op1->unsigned_p == op2->unsigned_p;
7256     }
7257   gcc_unreachable ();
7258 }
7259
7260 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
7261    of instruction ICODE.  Return true on success, leaving the new operand
7262    values in the OPS themselves.  Emit no code on failure.  */
7263
7264 bool
7265 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7266                            unsigned int nops, struct expand_operand *ops)
7267 {
7268   rtx_insn *last = get_last_insn ();
7269   rtx *orig_values = XALLOCAVEC (rtx, nops);
7270   for (unsigned int i = 0; i < nops; i++)
7271     {
7272       orig_values[i] = ops[i].value;
7273
7274       /* First try reusing the result of an earlier legitimization.
7275          This avoids duplicate rtl and ensures that tied operands
7276          remain tied.
7277
7278          This search is linear, but NOPS is bounded at compile time
7279          to a small number (current a single digit).  */
7280       unsigned int j = 0;
7281       for (; j < i; ++j)
7282         if (can_reuse_operands_p (icode, opno + j, opno + i, &ops[j], &ops[i])
7283             && rtx_equal_p (orig_values[j], orig_values[i])
7284             && ops[j].value
7285             && insn_operand_matches (icode, opno + i, ops[j].value))
7286           {
7287             ops[i].value = copy_rtx (ops[j].value);
7288             break;
7289           }
7290
7291       /* Otherwise try legitimizing the operand on its own.  */
7292       if (j == i && !maybe_legitimize_operand (icode, opno + i, &ops[i]))
7293         {
7294           delete_insns_since (last);
7295           return false;
7296         }
7297     }
7298   return true;
7299 }
7300
7301 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7302    as its operands.  Return the instruction pattern on success,
7303    and emit any necessary set-up code.  Return null and emit no
7304    code on failure.  */
7305
7306 rtx_insn *
7307 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7308                 struct expand_operand *ops)
7309 {
7310   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7311   if (!maybe_legitimize_operands (icode, 0, nops, ops))
7312     return NULL;
7313
7314   switch (nops)
7315     {
7316     case 1:
7317       return GEN_FCN (icode) (ops[0].value);
7318     case 2:
7319       return GEN_FCN (icode) (ops[0].value, ops[1].value);
7320     case 3:
7321       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7322     case 4:
7323       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7324                               ops[3].value);
7325     case 5:
7326       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7327                               ops[3].value, ops[4].value);
7328     case 6:
7329       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7330                               ops[3].value, ops[4].value, ops[5].value);
7331     case 7:
7332       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7333                               ops[3].value, ops[4].value, ops[5].value,
7334                               ops[6].value);
7335     case 8:
7336       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7337                               ops[3].value, ops[4].value, ops[5].value,
7338                               ops[6].value, ops[7].value);
7339     case 9:
7340       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7341                               ops[3].value, ops[4].value, ops[5].value,
7342                               ops[6].value, ops[7].value, ops[8].value);
7343     }
7344   gcc_unreachable ();
7345 }
7346
7347 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7348    as its operands.  Return true on success and emit no code on failure.  */
7349
7350 bool
7351 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7352                    struct expand_operand *ops)
7353 {
7354   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7355   if (pat)
7356     {
7357       emit_insn (pat);
7358       return true;
7359     }
7360   return false;
7361 }
7362
7363 /* Like maybe_expand_insn, but for jumps.  */
7364
7365 bool
7366 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7367                         struct expand_operand *ops)
7368 {
7369   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7370   if (pat)
7371     {
7372       emit_jump_insn (pat);
7373       return true;
7374     }
7375   return false;
7376 }
7377
7378 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7379    as its operands.  */
7380
7381 void
7382 expand_insn (enum insn_code icode, unsigned int nops,
7383              struct expand_operand *ops)
7384 {
7385   if (!maybe_expand_insn (icode, nops, ops))
7386     gcc_unreachable ();
7387 }
7388
7389 /* Like expand_insn, but for jumps.  */
7390
7391 void
7392 expand_jump_insn (enum insn_code icode, unsigned int nops,
7393                   struct expand_operand *ops)
7394 {
7395   if (!maybe_expand_jump_insn (icode, nops, ops))
7396     gcc_unreachable ();
7397 }