/* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   Copyright (C) 1987-2018 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "target.h"
#include "rtl.h"
#include "tree.h"
#include "memmodel.h"
#include "predict.h"
#include "tm_p.h"
#include "expmed.h"
#include "optabs.h"
#include "emit-rtl.h"
#include "recog.h"
#include "diagnostic-core.h"
#include "rtx-vector-builder.h"

/* Include insn-config.h before expr.h so that HAVE_conditional_move
   is properly defined.  */
#include "stor-layout.h"
#include "except.h"
#include "dojump.h"
#include "explow.h"
#include "expr.h"
#include "optabs-tree.h"
#include "libfuncs.h"

static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
                                   machine_mode *);
static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);

/* Debug facility for use in GDB.  */
void debug_optab_libfuncs (void);

/* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
   the result of operation CODE applied to OP0 (and OP1 if it is a binary
   operation).

   If the last insn does not set TARGET, don't do anything, but return 1.

   If the last insn or a previous insn sets TARGET and TARGET is one of OP0
   or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
   try again, ensuring that TARGET is not one of the operands.  */

static int
add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0,
                rtx op1)
{
  rtx_insn *last_insn;
  rtx set;
  rtx note;

  gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));

  if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
      && GET_RTX_CLASS (code) != RTX_BIN_ARITH
      && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
      && GET_RTX_CLASS (code) != RTX_COMPARE
      && GET_RTX_CLASS (code) != RTX_UNARY)
    return 1;

  if (GET_CODE (target) == ZERO_EXTRACT)
    return 1;

  for (last_insn = insns;
       NEXT_INSN (last_insn) != NULL_RTX;
       last_insn = NEXT_INSN (last_insn))
    ;

  /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
     a value changing in the insn, so the note would be invalid for CSE.  */
  if (reg_overlap_mentioned_p (target, op0)
      || (op1 && reg_overlap_mentioned_p (target, op1)))
    {
      if (MEM_P (target)
          && (rtx_equal_p (target, op0)
              || (op1 && rtx_equal_p (target, op1))))
        {
          /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
             over expanding it as temp = MEM op X, MEM = temp.  If the target
             supports MEM = MEM op X instructions, it is sometimes too hard
             to reconstruct that form later, especially if X is also a memory,
             and due to multiple occurrences of addresses the address might
             be forced into register unnecessarily.
             Note that not emitting the REG_EQUIV note might inhibit
             CSE in some cases.  */
          set = single_set (last_insn);
          if (set
              && GET_CODE (SET_SRC (set)) == code
              && MEM_P (SET_DEST (set))
              && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
                  || (op1 && rtx_equal_p (SET_DEST (set),
                                          XEXP (SET_SRC (set), 1)))))
            return 1;
        }
      return 0;
    }

  set = set_for_reg_notes (last_insn);
  if (set == NULL_RTX)
    return 1;

  if (! rtx_equal_p (SET_DEST (set), target)
      /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
      && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
          || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
    return 1;

  if (GET_RTX_CLASS (code) == RTX_UNARY)
    switch (code)
      {
      case FFS:
      case CLZ:
      case CTZ:
      case CLRSB:
      case POPCOUNT:
      case PARITY:
      case BSWAP:
        if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
          {
            note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
            if (GET_MODE_UNIT_SIZE (GET_MODE (op0))
                > GET_MODE_UNIT_SIZE (GET_MODE (target)))
              note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
                                         note, GET_MODE (op0));
            else
              note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
                                         note, GET_MODE (op0));
            break;
          }
        /* FALLTHRU */
      default:
        note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
        break;
      }
  else
    note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0),
                           copy_rtx (op1));

  set_unique_reg_note (last_insn, REG_EQUAL, note);

  return 1;
}

/* Given two input operands, OP0 and OP1, determine what the correct from_mode
   for a widening operation would be.  In most cases this would be OP0, but if
   that's a constant it'll be VOIDmode, which isn't useful.  */

static machine_mode
widened_mode (machine_mode to_mode, rtx op0, rtx op1)
{
  machine_mode m0 = GET_MODE (op0);
  machine_mode m1 = GET_MODE (op1);
  machine_mode result;

  if (m0 == VOIDmode && m1 == VOIDmode)
    return to_mode;
  else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
    result = m1;
  else
    result = m0;

  if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
    return to_mode;

  return result;
}

/* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
   says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
   not actually do a sign-extend or zero-extend, but can leave the
   higher-order bits of the result rtx undefined, for example, in the case
   of logical operations, but not right shifts.  */

static rtx
widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
               int unsignedp, int no_extend)
{
  rtx result;
  scalar_int_mode int_mode;

  /* If we don't have to extend and this is a constant, return it.  */
  if (no_extend && GET_MODE (op) == VOIDmode)
    return op;

  /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
     extend since it will be more efficient to do so unless the signedness of
     a promoted object differs from our extension.  */
  if (! no_extend
      || !is_a <scalar_int_mode> (mode, &int_mode)
      || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
          && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
    return convert_modes (mode, oldmode, op, unsignedp);

  /* If MODE is no wider than a single word, we return a lowpart or
     paradoxical SUBREG.  */
  if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
    return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));

  /* Otherwise, get an object of MODE, clobber it, and set the low-order
     part to OP.  */

  result = gen_reg_rtx (int_mode);
  emit_clobber (result);
  emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
  return result;
}

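/* A standalone sketch, not GCC code: why NO_EXTEND is safe for logical
   operations.  If the result is later truncated back to the narrow mode,
   the high-order bits of the widened inputs cannot influence the bits
   that are kept, so they may hold garbage.  The constants below are
   arbitrary stand-ins for that garbage.  */
#if 0
#include <stdint.h>

static uint8_t
and_via_wide (uint8_t a, uint8_t b)
{
  uint32_t wa = a | 0xdeadbe00u;        /* "Undefined" high-order bits.  */
  uint32_t wb = b | 0xcafef000u;
  return (uint8_t) (wa & wb);           /* Truncation discards the garbage.  */
}
#endif
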
/* Expand vector widening operations.

   There are two different classes of operations handled here:
   1) Operations whose result is wider than all the arguments to the
      operation.
      Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
      In this case OP0 and optionally OP1 would be initialized,
      but WIDE_OP wouldn't (not relevant for this case).
   2) Operations whose result is of the same size as the last argument to the
      operation, but wider than all the other arguments to the operation.
      Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
      In the case WIDE_OP, OP0 and optionally OP1 would be initialized.

   E.g, when called to expand the following operations, this is how
   the arguments will be initialized:
                                nops    OP0     OP1     WIDE_OP
   widening-sum                 2       oprnd0  -       oprnd1
   widening-dot-product         3       oprnd0  oprnd1  oprnd2
   widening-mult                2       oprnd0  oprnd1  -
   type-promotion (vec-unpack)  1       oprnd0  -       -  */

rtx
expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
                           rtx target, int unsignedp)
{
  struct expand_operand eops[4];
  tree oprnd0, oprnd1, oprnd2;
  machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
  optab widen_pattern_optab;
  enum insn_code icode;
  int nops = TREE_CODE_LENGTH (ops->code);
  int op;

  oprnd0 = ops->op0;
  tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
  if (ops->code == VEC_UNPACK_FIX_TRUNC_HI_EXPR
      || ops->code == VEC_UNPACK_FIX_TRUNC_LO_EXPR)
    /* The sign is from the result type rather than operand's type
       for these ops.  */
    widen_pattern_optab
      = optab_for_tree_code (ops->code, ops->type, optab_default);
  else
    widen_pattern_optab
      = optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
  if (ops->code == WIDEN_MULT_PLUS_EXPR
      || ops->code == WIDEN_MULT_MINUS_EXPR)
    icode = find_widening_optab_handler (widen_pattern_optab,
                                         TYPE_MODE (TREE_TYPE (ops->op2)),
                                         tmode0);
  else
    icode = optab_handler (widen_pattern_optab, tmode0);
  gcc_assert (icode != CODE_FOR_nothing);

  if (nops >= 2)
    {
      oprnd1 = ops->op1;
      tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
    }

  /* The last operand is of a wider mode than the rest of the operands.  */
  if (nops == 2)
    wmode = tmode1;
  else if (nops == 3)
    {
      gcc_assert (tmode1 == tmode0);
      gcc_assert (op1);
      oprnd2 = ops->op2;
      wmode = TYPE_MODE (TREE_TYPE (oprnd2));
    }

  op = 0;
  create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
  create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
  if (op1)
    create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
  if (wide_op)
    create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
  expand_insn (icode, op, eops);
  return eops[0].value;
}

/* Generate code to perform an operation specified by TERNARY_OPTAB
   on operands OP0, OP1 and OP2, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
                   rtx op1, rtx op2, rtx target, int unsignedp)
{
  struct expand_operand ops[4];
  enum insn_code icode = optab_handler (ternary_optab, mode);

  gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);

  create_output_operand (&ops[0], target, mode);
  create_convert_operand_from (&ops[1], op0, mode, unsignedp);
  create_convert_operand_from (&ops[2], op1, mode, unsignedp);
  create_convert_operand_from (&ops[3], op2, mode, unsignedp);
  expand_insn (icode, 4, ops);
  return ops[0].value;
}

/* Like expand_binop, but return a constant rtx if the result can be
   calculated at compile time.  The arguments and return value are
   otherwise the same as for expand_binop.  */

rtx
simplify_expand_binop (machine_mode mode, optab binoptab,
                       rtx op0, rtx op1, rtx target, int unsignedp,
                       enum optab_methods methods)
{
  if (CONSTANT_P (op0) && CONSTANT_P (op1))
    {
      rtx x = simplify_binary_operation (optab_to_code (binoptab),
                                         mode, op0, op1);
      if (x)
        return x;
    }

  return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
}

/* Like simplify_expand_binop, but always put the result in TARGET.
   Return true if the expansion succeeded.  */

bool
force_expand_binop (machine_mode mode, optab binoptab,
                    rtx op0, rtx op1, rtx target, int unsignedp,
                    enum optab_methods methods)
{
  rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
                                 target, unsignedp, methods);
  if (x == 0)
    return false;
  if (x != target)
    emit_move_insn (target, x);
  return true;
}

/* Create a new vector value in VMODE with all elements set to OP.  The
   mode of OP must be the element mode of VMODE.  If OP is a constant,
   then the return value will be a constant.  */

rtx
expand_vector_broadcast (machine_mode vmode, rtx op)
{
  int n;
  rtvec vec;

  gcc_checking_assert (VECTOR_MODE_P (vmode));

  if (valid_for_const_vector_p (vmode, op))
    return gen_const_vec_duplicate (vmode, op);

  insn_code icode = optab_handler (vec_duplicate_optab, vmode);
  if (icode != CODE_FOR_nothing)
    {
      struct expand_operand ops[2];
      create_output_operand (&ops[0], NULL_RTX, vmode);
      create_input_operand (&ops[1], op, GET_MODE (op));
      expand_insn (icode, 2, ops);
      return ops[0].value;
    }

  if (!GET_MODE_NUNITS (vmode).is_constant (&n))
    return NULL;

  /* ??? If the target doesn't have a vec_init, then we have no easy way
     of performing this operation.  Most of this sort of generic support
     is hidden away in the vector lowering support in gimple.  */
  icode = convert_optab_handler (vec_init_optab, vmode,
                                 GET_MODE_INNER (vmode));
  if (icode == CODE_FOR_nothing)
    return NULL;

  vec = rtvec_alloc (n);
  for (int i = 0; i < n; ++i)
    RTVEC_ELT (vec, i) = op;
  rtx ret = gen_reg_rtx (vmode);
  emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));

  return ret;
}

/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is >= BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine, except that SUPERWORD_OP1
   is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
   INTO_TARGET may be null if the caller has decided to calculate it.  */

static bool
expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
                        rtx outof_target, rtx into_target,
                        int unsignedp, enum optab_methods methods)
{
  if (into_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
                             into_target, unsignedp, methods))
      return false;

  if (outof_target != 0)
    {
      /* For a signed right shift, we must fill OUTOF_TARGET with copies
         of the sign bit, otherwise we must fill it with zeros.  */
      if (binoptab != ashr_optab)
        emit_move_insn (outof_target, CONST0_RTX (word_mode));
      else
        if (!force_expand_binop (word_mode, binoptab, outof_input,
                                 gen_int_shift_amount (word_mode,
                                                       BITS_PER_WORD - 1),
                                 outof_target, unsignedp, methods))
          return false;
    }
  return true;
}

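/* A standalone sketch, not GCC code, of the superword case: a 64-bit
   arithmetic right shift built from 32-bit words when the count N is
   known to be in [32, 64).  It assumes arithmetic >> on signed values,
   as GCC-generated code does.  */
#if 0
#include <stdint.h>

static void
sar64_superword (int32_t hi, uint32_t lo, unsigned n,
                 int32_t *out_hi, uint32_t *out_lo)
{
  (void) lo;                            /* The low input word is shifted out.  */
  *out_lo = (uint32_t) (hi >> (n - 32));        /* SUPERWORD_OP1 is N - 32.  */
  *out_hi = hi >> 31;                   /* Sign fill; zero for a logical shift.  */
}
#endif
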
/* This subroutine of expand_doubleword_shift handles the cases in which
   the effective shift value is < BITS_PER_WORD.  The arguments and return
   value are the same as for the parent routine.  */

static bool
expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
                      rtx outof_input, rtx into_input, rtx op1,
                      rtx outof_target, rtx into_target,
                      int unsignedp, enum optab_methods methods,
                      unsigned HOST_WIDE_INT shift_mask)
{
  optab reverse_unsigned_shift, unsigned_shift;
  rtx tmp, carries;

  reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
  unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);

  /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
     We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
     the opposite direction to BINOPTAB.  */
  if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
    {
      carries = outof_input;
      tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
                                            op1_mode), op1_mode);
      tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                   0, true, methods);
    }
  else
    {
      /* We must avoid shifting by BITS_PER_WORD bits since that is either
         the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
         has unknown behavior.  Do a single shift first, then shift by the
         remainder.  It's OK to use ~OP1 as the remainder if shift counts
         are truncated to the mode size.  */
      carries = expand_binop (word_mode, reverse_unsigned_shift,
                              outof_input, const1_rtx, 0, unsignedp, methods);
      if (shift_mask == BITS_PER_WORD - 1)
        {
          tmp = immed_wide_int_const
            (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
          tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
                                       0, true, methods);
        }
      else
        {
          tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
                                                op1_mode), op1_mode);
          tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
                                       0, true, methods);
        }
    }
  if (tmp == 0 || carries == 0)
    return false;
  carries = expand_binop (word_mode, reverse_unsigned_shift,
                          carries, tmp, 0, unsignedp, methods);
  if (carries == 0)
    return false;

  /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
     so the result can go directly into INTO_TARGET if convenient.  */
  tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
                      into_target, unsignedp, methods);
  if (tmp == 0)
    return false;

  /* Now OR in the bits carried over from OUTOF_INPUT.  */
  if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
                           into_target, unsignedp, methods))
    return false;

  /* Use a standard word_mode shift for the out-of half.  */
  if (outof_target != 0)
    if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                             outof_target, unsignedp, methods))
      return false;

  return true;
}

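/* A standalone sketch, not GCC code, of the subword case: a 64-bit logical
   right shift from 32-bit words with 0 <= n < 32, using the shift-by-one-
   then-remainder trick above so that no single shift count can reach 32.  */
#if 0
#include <stdint.h>

static void
shr64_subword (uint32_t hi, uint32_t lo, unsigned n,
               uint32_t *out_hi, uint32_t *out_lo)
{
  /* CARRIES = hi << (32 - n), computed as (hi << 1) << (31 - n) so that
     n == 0 yields 0 instead of an undefined shift by 32.  */
  uint32_t carries = (hi << 1) << (31 - n);
  *out_lo = (lo >> n) | carries;        /* Combine the two input words.  */
  *out_hi = hi >> n;                    /* Plain word-mode shift.  */
}
#endif
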
/* Try implementing expand_doubleword_shift using conditional moves.
   The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
   otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
   are the shift counts to use in the former and latter case.  All other
   arguments are the same as the parent routine.  */

static bool
expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
                                  enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
                                  rtx outof_input, rtx into_input,
                                  rtx subword_op1, rtx superword_op1,
                                  rtx outof_target, rtx into_target,
                                  int unsignedp, enum optab_methods methods,
                                  unsigned HOST_WIDE_INT shift_mask)
{
  rtx outof_superword, into_superword;

  /* Put the superword version of the output into OUTOF_SUPERWORD and
     INTO_SUPERWORD.  */
  outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
  if (outof_target != 0 && subword_op1 == superword_op1)
    {
      /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
         OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
      into_superword = outof_target;
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, 0, unsignedp, methods))
        return false;
    }
  else
    {
      into_superword = gen_reg_rtx (word_mode);
      if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                   outof_superword, into_superword,
                                   unsignedp, methods))
        return false;
    }

  /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, subword_op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  /* Select between them.  Do the INTO half first because INTO_SUPERWORD
     might be the current value of OUTOF_TARGET.  */
  if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
                              into_target, into_superword, word_mode, false))
    return false;

  if (outof_target != 0)
    if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
                                outof_target, outof_superword,
                                word_mode, false))
      return false;

  return true;
}

/* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
   OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
   input operand; the shift moves bits in the direction OUTOF_INPUT->
   INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
   of the target.  OP1 is the shift count and OP1_MODE is its mode.
   If OP1 is constant, it will have been truncated as appropriate
   and is known to be nonzero.

   If SHIFT_MASK is zero, the result of word shifts is undefined when the
   shift count is outside the range [0, BITS_PER_WORD).  This routine must
   avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).

   If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
   masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
   fill with zeros or sign bits as appropriate.

   If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
   a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
   Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
   In all other cases, shifts by values outside [0, BITS_PER_WORD * 2)
   are undefined.

   BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
   may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
   OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
   function wants to calculate it itself.

   Return true if the shift could be successfully synthesized.  */

static bool
expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
                         rtx outof_input, rtx into_input, rtx op1,
                         rtx outof_target, rtx into_target,
                         int unsignedp, enum optab_methods methods,
                         unsigned HOST_WIDE_INT shift_mask)
{
  rtx superword_op1, tmp, cmp1, cmp2;
  enum rtx_code cmp_code;

  /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
     fill the result with sign or zero bits as appropriate.  If so, the value
     of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).  Recursively call
     this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
     and INTO_INPUT), then emit code to set up OUTOF_TARGET.

     This isn't worthwhile for constant shifts since the optimizers will
     cope better with in-range shift counts.  */
  if (shift_mask >= BITS_PER_WORD
      && outof_target != 0
      && !CONSTANT_P (op1))
    {
      if (!expand_doubleword_shift (op1_mode, binoptab,
                                    outof_input, into_input, op1,
                                    0, into_target,
                                    unsignedp, methods, shift_mask))
        return false;
      if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
                               outof_target, unsignedp, methods))
        return false;
      return true;
    }

  /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
     is true when the effective shift value is less than BITS_PER_WORD.
     Set SUPERWORD_OP1 to the shift count that should be used to shift
     OUTOF_INPUT into INTO_TARGET when the condition is false.  */
  tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
  if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
    {
      /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
         is a subword shift count.  */
      cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = EQ;
      superword_op1 = op1;
    }
  else
    {
      /* Set CMP1 to OP1 - BITS_PER_WORD.  */
      cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
                                    0, true, methods);
      cmp2 = CONST0_RTX (op1_mode);
      cmp_code = LT;
      superword_op1 = cmp1;
    }
  if (cmp1 == 0)
    return false;

  /* If we can compute the condition at compile time, pick the
     appropriate subroutine.  */
  tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
  if (tmp != 0 && CONST_INT_P (tmp))
    {
      if (tmp == const0_rtx)
        return expand_superword_shift (binoptab, outof_input, superword_op1,
                                       outof_target, into_target,
                                       unsignedp, methods);
      else
        return expand_subword_shift (op1_mode, binoptab,
                                     outof_input, into_input, op1,
                                     outof_target, into_target,
                                     unsignedp, methods, shift_mask);
    }

  /* Try using conditional moves to generate straight-line code.  */
  if (HAVE_conditional_move)
    {
      rtx_insn *start = get_last_insn ();
      if (expand_doubleword_shift_condmove (op1_mode, binoptab,
                                            cmp_code, cmp1, cmp2,
                                            outof_input, into_input,
                                            op1, superword_op1,
                                            outof_target, into_target,
                                            unsignedp, methods, shift_mask))
        return true;
      delete_insns_since (start);
    }

  /* As a last resort, use branches to select the correct alternative.  */
  rtx_code_label *subword_label = gen_label_rtx ();
  rtx_code_label *done_label = gen_label_rtx ();

  NO_DEFER_POP;
  do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
                           0, 0, subword_label,
                           profile_probability::uninitialized ());
  OK_DEFER_POP;

  if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                               outof_target, into_target,
                               unsignedp, methods))
    return false;

  emit_jump_insn (targetm.gen_jump (done_label));
  emit_barrier ();
  emit_label (subword_label);

  if (!expand_subword_shift (op1_mode, binoptab,
                             outof_input, into_input, op1,
                             outof_target, into_target,
                             unsignedp, methods, shift_mask))
    return false;

  emit_label (done_label);
  return true;
}

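/* A standalone sketch, not GCC code, of the overall doubleword strategy:
   a 64-bit logical right shift with a variable count 0 <= n < 64, choosing
   between the subword and superword results without branches, much as the
   conditional-move path above does on a target whose word shifts truncate
   their counts (shift_mask == BITS_PER_WORD - 1).  */
#if 0
#include <stdint.h>

static uint64_t
shr64 (uint32_t hi, uint32_t lo, unsigned n)
{
  unsigned m = n & 31;                  /* What a count-truncating ISA sees.  */
  uint32_t sub_lo = (lo >> m) | ((hi << 1) << (31 - m));
  uint32_t sub_hi = hi >> m;
  uint32_t super_lo = hi >> m;          /* For n >= 32, hi >> (n - 32).  */
  uint32_t super_hi = 0;                /* Zero fill for a logical shift.  */
  int subword_p = (n & 32) == 0;        /* CMP1 = OP1 & BITS_PER_WORD.  */
  uint32_t out_lo = subword_p ? sub_lo : super_lo;
  uint32_t out_hi = subword_p ? sub_hi : super_hi;
  return ((uint64_t) out_hi << 32) | out_lo;
}
#endif
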
/* Subroutine of expand_binop.  Perform a double word multiplication of
   operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
   as the target's word_mode.  This function returns NULL_RTX if anything
   goes wrong, in which case it may have already emitted instructions
   which need to be deleted.

   If we want to multiply two two-word values and have normal and widening
   multiplies of single-word values, we can do this with three smaller
   multiplications.

   The multiplication proceeds as follows:
                                   _______________________
                                  [__op0_high_|__op0_low__]
                                   _______________________
        *                         [__op1_high_|__op1_low__]
        _______________________________________________

                                   _______________________
    (1)                           [__op0_low__*__op1_low__]
                     _______________________
    (2a)            [__op0_low__*__op1_high_]
                     _______________________
    (2b)            [__op0_high_*__op1_low__]
          _______________________
    (3)  [__op0_high_*__op1_high_]

   This gives a 4-word result.  Since we are only interested in the
   lower 2 words, partial result (3) and the upper words of (2a) and
   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
   calculated using non-widening multiplication.

   (1), however, needs to be calculated with an unsigned widening
   multiplication.  If this operation is not directly supported we
   try using a signed widening multiplication and adjust the result.
   This adjustment works as follows:

   If both operands are positive then no adjustment is needed.

   If the operands have different signs, for example op0_low < 0 and
   op1_low >= 0, the instruction treats the most significant bit of
   op0_low as a sign bit instead of a bit with significance
   2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
   with 2**BITS_PER_WORD - op0_low, and two's complements the
   result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
   the result.

   Similarly, if both operands are negative, we need to add
   (op0_low + op1_low) * 2**BITS_PER_WORD.

   We use a trick to adjust quickly.  We logically shift op0_low right
   (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
   op0_high (op1_high) before it is used to calculate 2b (2a).  If no
   logical shift exists, we do an arithmetic right shift and subtract
   the 0 or -1.  */

static rtx
expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
                        bool umulp, enum optab_methods methods)
{
  int low = (WORDS_BIG_ENDIAN ? 1 : 0);
  int high = (WORDS_BIG_ENDIAN ? 0 : 1);
  rtx wordm1 = (umulp ? NULL_RTX
                : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
  rtx product, adjust, product_high, temp;

  rtx op0_high = operand_subword_force (op0, high, mode);
  rtx op0_low = operand_subword_force (op0, low, mode);
  rtx op1_high = operand_subword_force (op1, high, mode);
  rtx op1_low = operand_subword_force (op1, low, mode);

  /* If we're using an unsigned multiply to directly compute the product
     of the low-order words of the operands and perform any required
     adjustments of the operands, we begin by trying two more multiplications
     and then computing the appropriate sum.

     We have checked above that the required addition is provided.
     Full-word addition will normally always succeed, especially if
     it is provided at all, so we don't worry about its failure.  The
     multiplication may well fail, however, so we do handle that.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op0_high)
        return NULL_RTX;
    }

  adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
                         NULL_RTX, 0, OPTAB_DIRECT);
  if (!adjust)
    return NULL_RTX;

  /* OP0_HIGH should now be dead.  */

  if (!umulp)
    {
      /* ??? This could be done with emit_store_flag where available.  */
      temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
                           NULL_RTX, 1, methods);
      if (temp)
        op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
                                 NULL_RTX, 0, OPTAB_DIRECT);
      else
        {
          temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
                               NULL_RTX, 0, methods);
          if (!temp)
            return NULL_RTX;
          op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
                                   NULL_RTX, 0, OPTAB_DIRECT);
        }

      if (!op1_high)
        return NULL_RTX;
    }

  temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
                       NULL_RTX, 0, OPTAB_DIRECT);
  if (!temp)
    return NULL_RTX;

  /* OP1_HIGH should now be dead.  */

  adjust = expand_binop (word_mode, add_optab, adjust, temp,
                         NULL_RTX, 0, OPTAB_DIRECT);

  if (target && !REG_P (target))
    target = NULL_RTX;

  /* *_widen_optab needs to determine operand mode, make sure at least
     one operand has non-VOID mode.  */
  if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
    op0_low = force_reg (word_mode, op0_low);

  if (umulp)
    product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);
  else
    product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
                            target, 1, OPTAB_DIRECT);

  if (!product)
    return NULL_RTX;

  product_high = operand_subword (product, high, 1, mode);
  adjust = expand_binop (word_mode, add_optab, product_high, adjust,
                         NULL_RTX, 0, OPTAB_DIRECT);
  emit_move_insn (product_high, adjust);
  return product;
}

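/* A standalone sketch, not GCC code, of the three-multiply scheme above:
   the low 64 bits of a 64x64 product from 32-bit halves when only a
   *signed* 32x32->64 widening multiply is available (the !umulp path).
   The casts assume the usual two's complement conversions.  */
#if 0
#include <stdint.h>

static uint64_t
mul64_from_32 (uint32_t a_hi, uint32_t a_lo, uint32_t b_hi, uint32_t b_lo)
{
  /* Adjust each high word by its operand's low-word sign bit, as described
     above: op0_high += op0_low >> (BITS_PER_WORD - 1).  */
  uint32_t adj_a_hi = a_hi + (a_lo >> 31);
  uint32_t adj_b_hi = b_hi + (b_lo >> 31);

  /* (2a) and (2b): non-widening multiplies; only their low words matter.  */
  uint32_t adjust = adj_a_hi * b_lo + adj_b_hi * a_lo;

  /* (1): signed widening multiply of the two low words...  */
  uint64_t product = (uint64_t) ((int64_t) (int32_t) a_lo * (int32_t) b_lo);

  /* ...then fold the adjustment into the high word of the product.  */
  return product + ((uint64_t) adjust << 32);
}
#endif
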
/* Wrapper around expand_binop which takes an rtx code to specify
   the operation to perform, not an optab pointer.  All other
   arguments are the same.  */
rtx
expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
                     rtx op1, rtx target, int unsignedp,
                     enum optab_methods methods)
{
  optab binop = code_to_optab (code);
  gcc_assert (binop);

  return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
}

/* Return whether OP0 and OP1 should be swapped when expanding a commutative
   binop.  Order them according to commutative_operand_precedence and, if
   possible, try to put TARGET or a pseudo first.  */
static bool
swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
{
  int op0_prec = commutative_operand_precedence (op0);
  int op1_prec = commutative_operand_precedence (op1);

  if (op0_prec < op1_prec)
    return true;

  if (op0_prec > op1_prec)
    return false;

  /* With equal precedence, both orders are ok, but it is better if the
     first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
  if (target == 0 || REG_P (target))
    return (REG_P (op1) && !REG_P (op0)) || target == op1;
  else
    return rtx_equal_p (op1, target);
}

/* Return true if BINOPTAB implements a shift operation.  */

static bool
shift_optab_p (optab binoptab)
{
  switch (optab_to_code (binoptab))
    {
    case ASHIFT:
    case SS_ASHIFT:
    case US_ASHIFT:
    case ASHIFTRT:
    case LSHIFTRT:
    case ROTATE:
    case ROTATERT:
      return true;

    default:
      return false;
    }
}

/* Return true if BINOPTAB implements a commutative binary operation.  */

static bool
commutative_optab_p (optab binoptab)
{
  return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
          || binoptab == smul_widen_optab
          || binoptab == umul_widen_optab
          || binoptab == smul_highpart_optab
          || binoptab == umul_highpart_optab);
}

/* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
   optimizing, and if the operand is a constant that costs more than
   1 instruction, force the constant into a register and return that
   register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */

static rtx
avoid_expensive_constant (machine_mode mode, optab binoptab,
                          int opn, rtx x, bool unsignedp)
{
  bool speed = optimize_insn_for_speed_p ();

  if (mode != VOIDmode
      && optimize
      && CONSTANT_P (x)
      && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
          > set_src_cost (x, mode, speed)))
    {
      if (CONST_INT_P (x))
        {
          HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
          if (intval != INTVAL (x))
            x = GEN_INT (intval);
        }
      else
        x = convert_modes (mode, VOIDmode, x, unsignedp);
      x = force_reg (mode, x);
    }
  return x;
}

/* Helper function for expand_binop: handle the case where there
   is an insn ICODE that directly implements the indicated operation.
   Returns null if this is not possible.  */
static rtx
expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
                       rtx op0, rtx op1,
                       rtx target, int unsignedp, enum optab_methods methods,
                       rtx_insn *last)
{
  machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
  machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
  machine_mode mode0, mode1, tmp_mode;
  struct expand_operand ops[3];
  bool commutative_p;
  rtx_insn *pat;
  rtx xop0 = op0, xop1 = op1;
  bool canonicalize_op1 = false;

  /* If it is a commutative operator and the modes would match
     if we would swap the operands, we can save the conversions.  */
  commutative_p = commutative_optab_p (binoptab);
  if (commutative_p
      && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
      && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
    std::swap (xop0, xop1);

  /* If we are optimizing, force expensive constants into a register.  */
  xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
  if (!shift_optab_p (binoptab))
    xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
  else
    /* Shifts and rotates often use a different mode for op1 from op0;
       for VOIDmode constants we don't know the mode, so force it
       to be canonicalized using convert_modes.  */
    canonicalize_op1 = true;

  /* In case the insn wants input operands in modes different from
     those of the actual operands, convert the operands.  It would
     seem that we don't need to convert CONST_INTs, but we do, so
     that they're properly zero-extended, sign-extended or truncated
     for their mode.  */

  mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
  if (xmode0 != VOIDmode && xmode0 != mode0)
    {
      xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
      mode0 = xmode0;
    }

  mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
           ? GET_MODE (xop1) : mode);
  if (xmode1 != VOIDmode && xmode1 != mode1)
    {
      xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
      mode1 = xmode1;
    }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_p
      && swap_commutative_operands_with_target (target, xop0, xop1))
    std::swap (xop0, xop1);

  /* Now, if insn's predicates don't allow our operands, put them into
     pseudo regs.  */

  if (binoptab == vec_pack_trunc_optab
      || binoptab == vec_pack_usat_optab
      || binoptab == vec_pack_ssat_optab
      || binoptab == vec_pack_ufix_trunc_optab
      || binoptab == vec_pack_sfix_trunc_optab
      || binoptab == vec_packu_float_optab
      || binoptab == vec_packs_float_optab)
    {
      /* The mode of the result is different from the mode of the
         arguments.  */
      tmp_mode = insn_data[(int) icode].operand[0].mode;
      if (VECTOR_MODE_P (mode)
          && maybe_ne (GET_MODE_NUNITS (tmp_mode), 2 * GET_MODE_NUNITS (mode)))
        {
          delete_insns_since (last);
          return NULL_RTX;
        }
    }
  else
    tmp_mode = mode;

  create_output_operand (&ops[0], target, tmp_mode);
  create_input_operand (&ops[1], xop0, mode0);
  create_input_operand (&ops[2], xop1, mode1);
  pat = maybe_gen_insn (icode, 3, ops);
  if (pat)
    {
      /* If PAT is composed of more than one insn, try to add an appropriate
         REG_EQUAL note to it.  If we can't because TEMP conflicts with an
         operand, call expand_binop again, this time without a target.  */
      if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
          && ! add_equal_note (pat, ops[0].value,
                               optab_to_code (binoptab),
                               ops[1].value, ops[2].value))
        {
          delete_insns_since (last);
          return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
                               unsignedp, methods);
        }

      emit_insn (pat);
      return ops[0].value;
    }
  delete_insns_since (last);
  return NULL_RTX;
}

/* Generate code to perform an operation specified by BINOPTAB
   on operands OP0 and OP1, with result having machine-mode MODE.

   UNSIGNEDP is for the case where we have to widen the operands
   to perform the operation.  It says to use zero-extension.

   If TARGET is nonzero, the value
   is generated there, if it is convenient to do so.
   In all cases an rtx is returned for the locus of the value;
   this may or may not be TARGET.  */

rtx
expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
              rtx target, int unsignedp, enum optab_methods methods)
{
  enum optab_methods next_methods
    = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
       ? OPTAB_WIDEN : methods);
  enum mode_class mclass;
  enum insn_code icode;
  machine_mode wider_mode;
  scalar_int_mode int_mode;
  rtx libfunc;
  rtx temp;
  rtx_insn *entry_last = get_last_insn ();
  rtx_insn *last;

  mclass = GET_MODE_CLASS (mode);

  /* If subtracting an integer constant, convert this into an addition of
     the negated constant.  */

  if (binoptab == sub_optab && CONST_INT_P (op1))
    {
      op1 = negate_rtx (mode, op1);
      binoptab = add_optab;
    }
  /* For shifts, constant invalid op1 might be expanded from different
     mode than MODE.  As those are invalid, force them to a register
     to avoid further problems during expansion.  */
  else if (CONST_INT_P (op1)
           && shift_optab_p (binoptab)
           && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
    {
      op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
      op1 = force_reg (GET_MODE_INNER (mode), op1);
    }

  /* Record where to delete back to if we backtrack.  */
  last = get_last_insn ();

  /* If we can do it with a three-operand insn, do so.  */

  if (methods != OPTAB_MUST_WIDEN)
    {
      if (convert_optab_p (binoptab))
        {
          machine_mode from_mode = widened_mode (mode, op0, op1);
          icode = find_widening_optab_handler (binoptab, mode, from_mode);
        }
      else
        icode = optab_handler (binoptab, mode);
      if (icode != CODE_FOR_nothing)
        {
          temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
                                        target, unsignedp, methods, last);
          if (temp)
            return temp;
        }
    }

  /* If we were trying to rotate, and that didn't work, try rotating
     the other direction before falling back to shifts and bitwise-or.  */
  if (((binoptab == rotl_optab
        && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
       || (binoptab == rotr_optab
           && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
      && is_int_mode (mode, &int_mode))
    {
      optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
      rtx newop1;
      unsigned int bits = GET_MODE_PRECISION (int_mode);

      if (CONST_INT_P (op1))
        newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
      else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
        newop1 = negate_rtx (GET_MODE (op1), op1);
      else
        newop1 = expand_binop (GET_MODE (op1), sub_optab,
                               gen_int_mode (bits, GET_MODE (op1)), op1,
                               NULL_RTX, unsignedp, OPTAB_DIRECT);

      temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
                                    target, unsignedp, methods, last);
      if (temp)
        return temp;
    }

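  /* For the record, the rewrite above relies on the identity (for a mode
     of precision B) rotl (x, n) == rotr (x, (B - n) mod B).  When the
     target truncates shift counts to B - 1 bits, (B - n) mod B equals
     (-n) mod B, which is why negating the count is enough there.  */
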
  /* If this is a multiply, see if we can do a widening operation that
     takes operands of this mode and makes a wider mode.  */

  if (binoptab == smul_optab
      && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
      && (convert_optab_handler ((unsignedp
                                  ? umul_widen_optab
                                  : smul_widen_optab),
                                 wider_mode, mode) != CODE_FOR_nothing))
    {
      /* *_widen_optab needs to determine operand mode, make sure at least
         one operand has non-VOID mode.  */
      if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
        op0 = force_reg (mode, op0);
      temp = expand_binop (wider_mode,
                           unsignedp ? umul_widen_optab : smul_widen_optab,
                           op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);

      if (temp != 0)
        {
          if (GET_MODE_CLASS (mode) == MODE_INT
              && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
            return gen_lowpart (mode, temp);
          else
            return convert_to_mode (mode, temp, unsignedp);
        }
    }

  /* If this is a vector shift by a scalar, see if we can do a vector
     shift by a vector.  If so, broadcast the scalar into a vector.  */
  if (mclass == MODE_VECTOR_INT)
    {
      optab otheroptab = unknown_optab;

      if (binoptab == ashl_optab)
        otheroptab = vashl_optab;
      else if (binoptab == ashr_optab)
        otheroptab = vashr_optab;
      else if (binoptab == lshr_optab)
        otheroptab = vlshr_optab;
      else if (binoptab == rotl_optab)
        otheroptab = vrotl_optab;
      else if (binoptab == rotr_optab)
        otheroptab = vrotr_optab;

      if (otheroptab
          && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
        {
          /* The scalar may have been extended to be too wide.  Truncate
             it back to the proper size to fit in the broadcast vector.  */
          scalar_mode inner_mode = GET_MODE_INNER (mode);
          if (!CONST_INT_P (op1)
              && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
                  > GET_MODE_BITSIZE (inner_mode)))
            op1 = force_reg (inner_mode,
                             simplify_gen_unary (TRUNCATE, inner_mode, op1,
                                                 GET_MODE (op1)));
          rtx vop1 = expand_vector_broadcast (mode, op1);
          if (vop1)
            {
              temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
                                            target, unsignedp, methods, last);
              if (temp)
                return temp;
            }
        }
    }

  /* Look for a wider mode of the same class for which we think we
     can open-code the operation.  Check for a widening multiply at the
     wider mode as well.  */

  if (CLASS_HAS_WIDER_MODES_P (mclass)
      && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
    FOR_EACH_WIDER_MODE (wider_mode, mode)
      {
        machine_mode next_mode;
        if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
            || (binoptab == smul_optab
                && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
                && (find_widening_optab_handler ((unsignedp
                                                  ? umul_widen_optab
                                                  : smul_widen_optab),
                                                 next_mode, mode)
                    != CODE_FOR_nothing)))
          {
            rtx xop0 = op0, xop1 = op1;
            int no_extend = 0;

            /* For certain integer operations, we need not actually extend
               the narrow operands, as long as we will truncate
               the results to the same narrowness.  */

            if ((binoptab == ior_optab || binoptab == and_optab
                 || binoptab == xor_optab
                 || binoptab == add_optab || binoptab == sub_optab
                 || binoptab == smul_optab || binoptab == ashl_optab)
                && mclass == MODE_INT)
              {
                no_extend = 1;
                xop0 = avoid_expensive_constant (mode, binoptab, 0,
                                                 xop0, unsignedp);
                if (binoptab != ashl_optab)
                  xop1 = avoid_expensive_constant (mode, binoptab, 1,
                                                   xop1, unsignedp);
              }

            xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);

            /* The second operand of a shift must always be extended.  */
            xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
                                  no_extend && binoptab != ashl_optab);

            temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
                                 unsignedp, OPTAB_DIRECT);
            if (temp)
              {
                if (mclass != MODE_INT
                    || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
                  {
                    if (target == 0)
                      target = gen_reg_rtx (mode);
                    convert_move (target, temp, 0);
                    return target;
                  }
                else
                  return gen_lowpart (mode, temp);
              }
            else
              delete_insns_since (last);
          }
      }

  /* If operation is commutative,
     try to make the first operand a register.
     Even better, try to make it the same as the target.
     Also try to make the last operand a constant.  */
  if (commutative_optab_p (binoptab)
      && swap_commutative_operands_with_target (target, op0, op1))
    std::swap (op0, op1);

  /* These can be done a word at a time.  */
  if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
      && is_int_mode (mode, &int_mode)
      && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
    {
      int i;
      rtx_insn *insns;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  */
      if (target == 0
          || target == op0
          || target == op1
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      /* Do the actual arithmetic.  */
      enum machine_mode op0_mode = CONSTANT_P (op0) ? int_mode : VOIDmode;
      enum machine_mode op1_mode = CONSTANT_P (op1) ? int_mode : VOIDmode;
      for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
        {
          rtx target_piece = operand_subword (target, i, 1, int_mode);
          rtx x = expand_binop (word_mode, binoptab,
                                operand_subword_force (op0, i, op0_mode),
                                operand_subword_force (op1, i, op1_mode),
                                target_piece, unsignedp, next_methods);

          if (x == 0)
            break;

          if (target_piece != x)
            emit_move_insn (target_piece, x);
        }

      insns = get_insns ();
      end_sequence ();

      if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
        {
          emit_insn (insns);
          return target;
        }
    }

  /* Synthesize double word shifts from single word shifts.  */
  if ((binoptab == lshr_optab || binoptab == ashl_optab
       || binoptab == ashr_optab)
      && is_int_mode (mode, &int_mode)
      && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
      && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
      && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
      scalar_int_mode op1_mode;

      double_shift_mask = targetm.shift_truncation_mask (int_mode);
      shift_mask = targetm.shift_truncation_mask (word_mode);
      op1_mode = (GET_MODE (op1) != VOIDmode
                  ? as_a <scalar_int_mode> (GET_MODE (op1))
                  : word_mode);

      /* Apply the truncation to constant shifts.  */
      if (double_shift_mask > 0 && CONST_INT_P (op1))
        op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);

      if (op1 == CONST0_RTX (op1_mode))
        return op0;

      /* Make sure that this is a combination that expand_doubleword_shift
         can handle.  See the comments there for details.  */
      if (double_shift_mask == 0
          || (shift_mask == BITS_PER_WORD - 1
              && double_shift_mask == BITS_PER_WORD * 2 - 1))
        {
          rtx_insn *insns;
          rtx into_target, outof_target;
          rtx into_input, outof_input;
          int left_shift, outof_word;

          /* If TARGET is the same as one of the operands, the REG_EQUAL note
             won't be accurate, so use a new target.  */
          if (target == 0
              || target == op0
              || target == op1
              || !valid_multiword_target_p (target))
            target = gen_reg_rtx (int_mode);

          start_sequence ();

          /* OUTOF_* is the word we are shifting bits away from, and
             INTO_* is the word that we are shifting bits towards, thus
             they differ depending on the direction of the shift and
             WORDS_BIG_ENDIAN.  */

          left_shift = binoptab == ashl_optab;
          outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

          outof_target = operand_subword (target, outof_word, 1, int_mode);
          into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

          outof_input = operand_subword_force (op0, outof_word, int_mode);
          into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

          if (expand_doubleword_shift (op1_mode, binoptab,
                                       outof_input, into_input, op1,
                                       outof_target, into_target,
                                       unsignedp, next_methods, shift_mask))
            {
              insns = get_insns ();
              end_sequence ();

              emit_insn (insns);
              return target;
            }
          end_sequence ();
        }
    }

  /* Synthesize double word rotates from single word shifts.  */
  if ((binoptab == rotl_optab || binoptab == rotr_optab)
      && is_int_mode (mode, &int_mode)
      && CONST_INT_P (op1)
      && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
      && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
      && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
    {
      rtx_insn *insns;
      rtx into_target, outof_target;
      rtx into_input, outof_input;
      rtx inter;
      int shift_count, left_shift, outof_word;

      /* If TARGET is the same as one of the operands, the REG_EQUAL note
         won't be accurate, so use a new target.  Do this also if target is not
         a REG, first because having a register instead may open optimization
         opportunities, and second because if target and op0 happen to be MEMs
         designating the same location, we would risk clobbering it too early
         in the code sequence we generate below.  */
      if (target == 0
          || target == op0
          || target == op1
          || !REG_P (target)
          || !valid_multiword_target_p (target))
        target = gen_reg_rtx (int_mode);

      start_sequence ();

      shift_count = INTVAL (op1);

      /* OUTOF_* is the word we are shifting bits away from, and
         INTO_* is the word that we are shifting bits towards, thus
         they differ depending on the direction of the shift and
         WORDS_BIG_ENDIAN.  */

      left_shift = (binoptab == rotl_optab);
      outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;

      outof_target = operand_subword (target, outof_word, 1, int_mode);
      into_target = operand_subword (target, 1 - outof_word, 1, int_mode);

      outof_input = operand_subword_force (op0, outof_word, int_mode);
      into_input = operand_subword_force (op0, 1 - outof_word, int_mode);

      if (shift_count == BITS_PER_WORD)
        {
          /* This is just a word swap.  */
          emit_move_insn (outof_target, into_input);
          emit_move_insn (into_target, outof_input);
          inter = const0_rtx;
        }
      else
        {
          rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
          HOST_WIDE_INT first_shift_count, second_shift_count;
          optab reverse_unsigned_shift, unsigned_shift;

          reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                                    ? lshr_optab : ashl_optab);

          unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
                            ? ashl_optab : lshr_optab);

          if (shift_count > BITS_PER_WORD)
            {
              first_shift_count = shift_count - BITS_PER_WORD;
              second_shift_count = 2 * BITS_PER_WORD - shift_count;
            }
          else
            {
              first_shift_count = BITS_PER_WORD - shift_count;
              second_shift_count = shift_count;
            }
          rtx first_shift_count_rtx
            = gen_int_shift_amount (word_mode, first_shift_count);
          rtx second_shift_count_rtx
            = gen_int_shift_amount (word_mode, second_shift_count);

          into_temp1 = expand_binop (word_mode, unsigned_shift,
                                     outof_input, first_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);
          into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                     into_input, second_shift_count_rtx,
                                     NULL_RTX, unsignedp, next_methods);

          if (into_temp1 != 0 && into_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
                                  into_target, unsignedp, next_methods);
          else
            inter = 0;

          if (inter != 0 && inter != into_target)
            emit_move_insn (into_target, inter);

          outof_temp1 = expand_binop (word_mode, unsigned_shift,
                                      into_input, first_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);
          outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
                                      outof_input, second_shift_count_rtx,
                                      NULL_RTX, unsignedp, next_methods);

          if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
            inter = expand_binop (word_mode, ior_optab,
                                  outof_temp1, outof_temp2,
                                  outof_target, unsignedp, next_methods);

          if (inter != 0 && inter != outof_target)
            emit_move_insn (outof_target, inter);
        }

      insns = get_insns ();
      end_sequence ();

      if (inter != 0)
        {
          emit_insn (insns);
          return target;
        }
    }

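  /* For the record, with 32-bit words and a constant rotate count
     0 < c < 32, the word-mode sequence built above computes the usual

         out_hi = (in_hi << c) | (in_lo >> (32 - c));
         out_lo = (in_lo << c) | (in_hi >> (32 - c));

     for a left rotate; counts in (32, 64) reduce to this with the shift
     directions swapped, and c == 32 is the plain word swap.  */
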
  /* These can be done a word at a time by propagating carries.  */
  if ((binoptab == add_optab || binoptab == sub_optab)
      && is_int_mode (mode, &int_mode)
      && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
      && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
    {
      unsigned int i;
      optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
      const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
      rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
      rtx xop0, xop1, xtarget;

      /* We can handle either a 1 or -1 value for the carry.  If
         STORE_FLAG_VALUE is one of those, use it.  Otherwise, use 1 since
         it is the one easiest to get.  */
#if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
      int normalizep = STORE_FLAG_VALUE;
#else
      int normalizep = 1;
#endif

      /* Prepare the operands.  */
      xop0 = force_reg (int_mode, op0);
      xop1 = force_reg (int_mode, op1);

      xtarget = gen_reg_rtx (int_mode);

      if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
        target = xtarget;

      /* Indicate for flow that the entire target reg is being set.  */
      if (REG_P (target))
        emit_clobber (xtarget);

      /* Do the actual arithmetic.  */
      for (i = 0; i < nwords; i++)
        {
          int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
          rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
          rtx op0_piece = operand_subword_force (xop0, index, int_mode);
          rtx op1_piece = operand_subword_force (xop1, index, int_mode);
          rtx x;

          /* Main add/subtract of the input operands.  */
          x = expand_binop (word_mode, binoptab,
                            op0_piece, op1_piece,
                            target_piece, unsignedp, next_methods);
          if (x == 0)
            break;

          if (i + 1 < nwords)
            {
              /* Store carry from main add/subtract.  */
              carry_out = gen_reg_rtx (word_mode);
              carry_out = emit_store_flag_force (carry_out,
                                                 (binoptab == add_optab
                                                  ? LT : GT),
                                                 x, op0_piece,
                                                 word_mode, 1, normalizep);
            }

          if (i > 0)
            {
              rtx newx;

              /* Add/subtract previous carry to main result.  */
              newx = expand_binop (word_mode,
                                   normalizep == 1 ? binoptab : otheroptab,
                                   x, carry_in,
                                   NULL_RTX, 1, next_methods);

              if (i + 1 < nwords)
                {
                  /* Get out carry from adding/subtracting carry in.  */
                  rtx carry_tmp = gen_reg_rtx (word_mode);
                  carry_tmp = emit_store_flag_force (carry_tmp,
                                                     (binoptab == add_optab
                                                      ? LT : GT),
                                                     newx, x,
                                                     word_mode, 1, normalizep);

                  /* Logical-ior the two possible carries together.  */
                  carry_out = expand_binop (word_mode, ior_optab,
                                            carry_out, carry_tmp,
                                            carry_out, 0, next_methods);
                  if (carry_out == 0)
                    break;
                }
              emit_move_insn (target_piece, newx);
            }
          else
            {
              if (x != target_piece)
                emit_move_insn (target_piece, x);
            }

          carry_in = carry_out;
        }

      if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
        {
          if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
              || ! rtx_equal_p (target, xtarget))
            {
              rtx_insn *temp = emit_move_insn (target, xtarget);

              set_dst_reg_note (temp, REG_EQUAL,
                                gen_rtx_fmt_ee (optab_to_code (binoptab),
                                                int_mode, copy_rtx (xop0),
                                                copy_rtx (xop1)),
                                target);
            }
          else
            target = xtarget;

          return target;
        }

      else
        delete_insns_since (last);
    }

1727 /* Attempt to synthesize double word multiplies using a sequence of word
1728 mode multiplications. We first attempt to generate a sequence using a
1729 more efficient unsigned widening multiply, and if that fails we then
1730 try using a signed widening multiply. */
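/* Editorial note: with W = BITS_PER_WORD, writing x = xh*2^W + xl and
   y = yh*2^W + yl gives

       x * y mod 2^(2*W) = widen (xl * yl) + ((xh*yl + xl*yh) << W)

   since the xh*yh term falls entirely outside the double-word result.
   A C sketch for 32-bit words (hypothetical helper, for illustration):

       unsigned long long
       mul_double (unsigned int xl, unsigned int xh,
                   unsigned int yl, unsigned int yh)
       {
         unsigned long long low = (unsigned long long) xl * yl;
         unsigned int cross = xh * yl + xl * yh;   // mod 2^32 is enough
         return low + ((unsigned long long) cross << 32);
       }
 */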
1732 if (binoptab == smul_optab
1733 && is_int_mode (mode, &int_mode)
1734 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1735 && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1736 && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1738 rtx product = NULL_RTX;
1739 if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
1740 != CODE_FOR_nothing)
1742 product = expand_doubleword_mult (int_mode, op0, op1, target,
1743 true, methods);
1744 if (!product)
1745 delete_insns_since (last);
1748 if (product == NULL_RTX
1749 && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
1750 != CODE_FOR_nothing))
1752 product = expand_doubleword_mult (int_mode, op0, op1, target,
1753 false, methods);
1754 if (!product)
1755 delete_insns_since (last);
1758 if (product != NULL_RTX)
1760 if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1762 rtx_insn *move = emit_move_insn (target ? target : product,
1763 product);
1764 set_dst_reg_note (move,
1765 REG_EQUAL,
1766 gen_rtx_fmt_ee (MULT, int_mode,
1767 copy_rtx (op0),
1768 copy_rtx (op1)),
1769 target ? target : product);
1771 return product;
1775 /* It can't be open-coded in this mode.
1776 Use a library call if one is available and caller says that's ok. */
1778 libfunc = optab_libfunc (binoptab, mode);
1779 if (libfunc
1780 && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1782 rtx_insn *insns;
1783 rtx op1x = op1;
1784 machine_mode op1_mode = mode;
1785 rtx value;
1787 start_sequence ();
1789 if (shift_optab_p (binoptab))
1791 op1_mode = targetm.libgcc_shift_count_mode ();
1792 /* Specify unsigned here,
1793 since negative shift counts are meaningless. */
1794 op1x = convert_to_mode (op1_mode, op1, 1);
1797 if (GET_MODE (op0) != VOIDmode
1798 && GET_MODE (op0) != mode)
1799 op0 = convert_to_mode (mode, op0, unsignedp);
1801 /* Pass 1 for NO_QUEUE so we don't lose any increments
1802 if the libcall is cse'd or moved. */
1803 value = emit_library_call_value (libfunc,
1804 NULL_RTX, LCT_CONST, mode,
1805 op0, mode, op1x, op1_mode);
1807 insns = get_insns ();
1808 end_sequence ();
1810 bool trapv = trapv_binoptab_p (binoptab);
1811 target = gen_reg_rtx (mode);
1812 emit_libcall_block_1 (insns, target, value,
1813 trapv ? NULL_RTX
1814 : gen_rtx_fmt_ee (optab_to_code (binoptab),
1815 mode, op0, op1), trapv);
1817 return target;
1820 delete_insns_since (last);
1822 /* It can't be done in this mode. Can we do it in a wider mode? */
1824 if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1825 || methods == OPTAB_MUST_WIDEN))
1827 /* Caller says, don't even try. */
1828 delete_insns_since (entry_last);
1829 return 0;
1832 /* Compute the value of METHODS to pass to recursive calls.
1833 Don't allow widening to be tried recursively. */
1835 methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1837 /* Look for a wider mode of the same class for which it appears we can do
1838 the operation. */
1840 if (CLASS_HAS_WIDER_MODES_P (mclass))
1842 /* This code doesn't make sense for conversion optabs, since we
1843 wouldn't then want to extend the operands to be the same size
1844 as the result. */
1845 gcc_assert (!convert_optab_p (binoptab));
1846 FOR_EACH_WIDER_MODE (wider_mode, mode)
1848 if (optab_handler (binoptab, wider_mode)
1849 || (methods == OPTAB_LIB
1850 && optab_libfunc (binoptab, wider_mode)))
1852 rtx xop0 = op0, xop1 = op1;
1853 int no_extend = 0;
1855 /* For certain integer operations, we need not actually extend
1856 the narrow operands, as long as we will truncate
1857 the results to the same narrowness. */
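/* Editorial example: for a QImode addition done in SImode, the low
   eight bits of the wide sum depend only on the low eight bits of the
   inputs, so

       (unsigned char) ((unsigned int) a + (unsigned int) b)
           == (unsigned char) (a + b)

   and garbage in the high bits of the widened operands is harmless.
   This does not hold for operations such as division or right shifts,
   which read the high bits, so those take real extensions.  */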
1859 if ((binoptab == ior_optab || binoptab == and_optab
1860 || binoptab == xor_optab
1861 || binoptab == add_optab || binoptab == sub_optab
1862 || binoptab == smul_optab || binoptab == ashl_optab)
1863 && mclass == MODE_INT)
1864 no_extend = 1;
1866 xop0 = widen_operand (xop0, wider_mode, mode,
1867 unsignedp, no_extend);
1869 /* The second operand of a shift must always be extended. */
1870 xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1871 no_extend && binoptab != ashl_optab);
1873 temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1874 unsignedp, methods);
1875 if (temp)
1877 if (mclass != MODE_INT
1878 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1880 if (target == 0)
1881 target = gen_reg_rtx (mode);
1882 convert_move (target, temp, 0);
1883 return target;
1885 else
1886 return gen_lowpart (mode, temp);
1888 else
1889 delete_insns_since (last);
1894 delete_insns_since (entry_last);
1895 return 0;
1898 /* Expand a binary operator which has both signed and unsigned forms.
1899 UOPTAB is the optab for unsigned operations, and SOPTAB is for
1900 signed operations.
1902 If we widen unsigned operands, we may use a signed wider operation instead
1903 of an unsigned wider operation, since the result would be the same. */
1905 rtx
1906 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1907 rtx op0, rtx op1, rtx target, int unsignedp,
1908 enum optab_methods methods)
1910 rtx temp;
1911 optab direct_optab = unsignedp ? uoptab : soptab;
1912 bool save_enable;
1914 /* Do it without widening, if possible. */
1915 temp = expand_binop (mode, direct_optab, op0, op1, target,
1916 unsignedp, OPTAB_DIRECT);
1917 if (temp || methods == OPTAB_DIRECT)
1918 return temp;
1920 /* Try widening to a signed int. Disable any direct use of any
1921 signed insn in the current mode. */
1922 save_enable = swap_optab_enable (soptab, mode, false);
1924 temp = expand_binop (mode, soptab, op0, op1, target,
1925 unsignedp, OPTAB_WIDEN);
1927 /* For unsigned operands, try widening to an unsigned int. */
1928 if (!temp && unsignedp)
1929 temp = expand_binop (mode, uoptab, op0, op1, target,
1930 unsignedp, OPTAB_WIDEN);
1931 if (temp || methods == OPTAB_WIDEN)
1932 goto egress;
1934 /* Use the right width libcall if that exists. */
1935 temp = expand_binop (mode, direct_optab, op0, op1, target,
1936 unsignedp, OPTAB_LIB);
1937 if (temp || methods == OPTAB_LIB)
1938 goto egress;
1940 /* Must widen and use a libcall; try either signed or unsigned. */
1941 temp = expand_binop (mode, soptab, op0, op1, target,
1942 unsignedp, methods);
1943 if (!temp && unsignedp)
1944 temp = expand_binop (mode, uoptab, op0, op1, target,
1945 unsignedp, methods);
1947 egress:
1948 /* Undo the fiddling above. */
1949 if (save_enable)
1950 swap_optab_enable (soptab, mode, true);
1951 return temp;
1954 /* Generate code to perform an operation specified by UNOPTAB
1955 on operand OP0, with two results to TARG0 and TARG1.
1956 We assume that the order of the operands for the instruction
1957 is TARG0, TARG1, OP0.
1959 Either TARG0 or TARG1 may be zero, but what that means is that
1960 the result is not actually wanted. We will generate it into
1961 a dummy pseudo-reg and discard it. They may not both be zero.
1963 Returns 1 if this operation can be performed; 0 if not. */
1965 int
1966 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1967 int unsignedp)
1969 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1970 enum mode_class mclass;
1971 machine_mode wider_mode;
1972 rtx_insn *entry_last = get_last_insn ();
1973 rtx_insn *last;
1975 mclass = GET_MODE_CLASS (mode);
1977 if (!targ0)
1978 targ0 = gen_reg_rtx (mode);
1979 if (!targ1)
1980 targ1 = gen_reg_rtx (mode);
1982 /* Record where to go back to if we fail. */
1983 last = get_last_insn ();
1985 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1987 struct expand_operand ops[3];
1988 enum insn_code icode = optab_handler (unoptab, mode);
1990 create_fixed_operand (&ops[0], targ0);
1991 create_fixed_operand (&ops[1], targ1);
1992 create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1993 if (maybe_expand_insn (icode, 3, ops))
1994 return 1;
1997 /* It can't be done in this mode. Can we do it in a wider mode? */
1999 if (CLASS_HAS_WIDER_MODES_P (mclass))
2001 FOR_EACH_WIDER_MODE (wider_mode, mode)
2003 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2005 rtx t0 = gen_reg_rtx (wider_mode);
2006 rtx t1 = gen_reg_rtx (wider_mode);
2007 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2009 if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2011 convert_move (targ0, t0, unsignedp);
2012 convert_move (targ1, t1, unsignedp);
2013 return 1;
2015 else
2016 delete_insns_since (last);
2021 delete_insns_since (entry_last);
2022 return 0;
2025 /* Generate code to perform an operation specified by BINOPTAB
2026 on operands OP0 and OP1, with two results to TARG0 and TARG1.
2027 We assume that the order of the operands for the instruction
2028 is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2029 [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2031 Either TARG0 or TARG1 may be zero, but what that means is that
2032 the result is not actually wanted. We will generate it into
2033 a dummy pseudo-reg and discard it. They may not both be zero.
2035 Returns 1 if this operation can be performed; 0 if not. */
2037 int
2038 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2039 int unsignedp)
2041 machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2042 enum mode_class mclass;
2043 machine_mode wider_mode;
2044 rtx_insn *entry_last = get_last_insn ();
2045 rtx_insn *last;
2047 mclass = GET_MODE_CLASS (mode);
2049 if (!targ0)
2050 targ0 = gen_reg_rtx (mode);
2051 if (!targ1)
2052 targ1 = gen_reg_rtx (mode);
2054 /* Record where to go back to if we fail. */
2055 last = get_last_insn ();
2057 if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2059 struct expand_operand ops[4];
2060 enum insn_code icode = optab_handler (binoptab, mode);
2061 machine_mode mode0 = insn_data[icode].operand[1].mode;
2062 machine_mode mode1 = insn_data[icode].operand[2].mode;
2063 rtx xop0 = op0, xop1 = op1;
2065 /* If we are optimizing, force expensive constants into a register. */
2066 xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2067 xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2069 create_fixed_operand (&ops[0], targ0);
2070 create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2071 create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2072 create_fixed_operand (&ops[3], targ1);
2073 if (maybe_expand_insn (icode, 4, ops))
2074 return 1;
2075 delete_insns_since (last);
2078 /* It can't be done in this mode. Can we do it in a wider mode? */
2080 if (CLASS_HAS_WIDER_MODES_P (mclass))
2082 FOR_EACH_WIDER_MODE (wider_mode, mode)
2084 if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2086 rtx t0 = gen_reg_rtx (wider_mode);
2087 rtx t1 = gen_reg_rtx (wider_mode);
2088 rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2089 rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2091 if (expand_twoval_binop (binoptab, cop0, cop1,
2092 t0, t1, unsignedp))
2094 convert_move (targ0, t0, unsignedp);
2095 convert_move (targ1, t1, unsignedp);
2096 return 1;
2098 else
2099 delete_insns_since (last);
2104 delete_insns_since (entry_last);
2105 return 0;
2108 /* Expand the two-valued library call indicated by BINOPTAB, but
2109 preserve only one of the values. If TARG0 is non-NULL, the first
2110 value is placed into TARG0; otherwise the second value is placed
2111 into TARG1. Exactly one of TARG0 and TARG1 must be non-NULL. The
2112 value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2113 This routine assumes that the value returned by the library call is
2114 as if the return value were of an integral mode twice as wide as the
2115 mode of OP0. Returns 1 if the call was successful. */
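/* Editorial illustration with a hypothetical helper, not a libgcc API:
   a divmod-style libcall for 32-bit operands might behave as

       unsigned long long
       divmod32 (unsigned int a, unsigned int b)
       {
         return (unsigned long long) (a / b)              // first value
                | ((unsigned long long) (a % b) << 32);   // second value
       }

   and the subreg offset chosen below picks out whichever half the
   caller asked for via TARG0 or TARG1.  */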
2117 bool
2118 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2119 rtx targ0, rtx targ1, enum rtx_code code)
2121 machine_mode mode;
2122 machine_mode libval_mode;
2123 rtx libval;
2124 rtx_insn *insns;
2125 rtx libfunc;
2127 /* Exactly one of TARG0 or TARG1 should be non-NULL. */
2128 gcc_assert (!targ0 != !targ1);
2130 mode = GET_MODE (op0);
2131 libfunc = optab_libfunc (binoptab, mode);
2132 if (!libfunc)
2133 return false;
2135 /* The value returned by the library function will have twice as
2136 many bits as the nominal MODE. */
2137 libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2138 start_sequence ();
2139 libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2140 libval_mode,
2141 op0, mode,
2142 op1, mode);
2143 /* Get the part of LIBVAL containing the value that we want. */
2144 libval = simplify_gen_subreg (mode, libval, libval_mode,
2145 targ0 ? 0 : GET_MODE_SIZE (mode));
2146 insns = get_insns ();
2147 end_sequence ();
2148 /* Move the result into the desired location. */
2149 emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2150 gen_rtx_fmt_ee (code, mode, op0, op1));
2152 return true;
2156 /* Wrapper around expand_unop which takes an rtx code to specify
2157 the operation to perform, not an optab pointer. All other
2158 arguments are the same. */
2159 rtx
2160 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2161 rtx target, int unsignedp)
2163 optab unop = code_to_optab (code);
2164 gcc_assert (unop);
2166 return expand_unop (mode, unop, op0, target, unsignedp);
2169 /* Try calculating
2170 (clz:narrow x)
2171 as
2172 (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2174 A similar operation can be used for clrsb. UNOPTAB says which operation
2175 we are trying to expand. */
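/* Editorial example, assuming a 32-bit unsigned int: a 16-bit clz
   synthesized from a 32-bit one,

       unsigned int
       clz16 (unsigned short x)        // undefined at x == 0
       {
         return __builtin_clz ((unsigned int) x) - 16;
       }

   i.e. subtract the difference in precision, as the code below does.  */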
2176 static rtx
2177 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2179 opt_scalar_int_mode wider_mode_iter;
2180 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2182 scalar_int_mode wider_mode = wider_mode_iter.require ();
2183 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2185 rtx xop0, temp;
2186 rtx_insn *last;
2188 last = get_last_insn ();
2190 if (target == 0)
2191 target = gen_reg_rtx (mode);
2192 xop0 = widen_operand (op0, wider_mode, mode,
2193 unoptab != clrsb_optab, false);
2194 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2195 unoptab != clrsb_optab);
2196 if (temp != 0)
2197 temp = expand_binop
2198 (wider_mode, sub_optab, temp,
2199 gen_int_mode (GET_MODE_PRECISION (wider_mode)
2200 - GET_MODE_PRECISION (mode),
2201 wider_mode),
2202 target, true, OPTAB_DIRECT);
2203 if (temp == 0)
2204 delete_insns_since (last);
2206 return temp;
2209 return 0;
2212 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2213 quantities, choosing which based on whether the high word is nonzero. */
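/* Editorial sketch of the branchy sequence built here:

       unsigned int
       clz64 (unsigned long long x)    // undefined at x == 0
       {
         unsigned int hi = x >> 32, lo = (unsigned int) x;
         return hi ? __builtin_clz (hi) : 32 + __builtin_clz (lo);
       }
 */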
2214 static rtx
2215 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2217 rtx xop0 = force_reg (mode, op0);
2218 rtx subhi = gen_highpart (word_mode, xop0);
2219 rtx sublo = gen_lowpart (word_mode, xop0);
2220 rtx_code_label *hi0_label = gen_label_rtx ();
2221 rtx_code_label *after_label = gen_label_rtx ();
2222 rtx_insn *seq;
2223 rtx temp, result;
2225 /* If we were not given a target, use a word_mode register, not a
2226 'mode' register. The result will fit, and nobody is expecting
2227 anything bigger (the return type of __builtin_clz* is int). */
2228 if (!target)
2229 target = gen_reg_rtx (word_mode);
2231 /* In any case, write to a word_mode scratch in both branches of the
2232 conditional, so we can ensure there is a single move insn setting
2233 'target' to tag a REG_EQUAL note on. */
2234 result = gen_reg_rtx (word_mode);
2236 start_sequence ();
2238 /* If the high word is not equal to zero,
2239 then clz of the full value is clz of the high word. */
2240 emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2241 word_mode, true, hi0_label);
2243 temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2244 if (!temp)
2245 goto fail;
2247 if (temp != result)
2248 convert_move (result, temp, true);
2250 emit_jump_insn (targetm.gen_jump (after_label));
2251 emit_barrier ();
2253 /* Else clz of the full value is clz of the low word plus the number
2254 of bits in the high word. */
2255 emit_label (hi0_label);
2257 temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2258 if (!temp)
2259 goto fail;
2260 temp = expand_binop (word_mode, add_optab, temp,
2261 gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2262 result, true, OPTAB_DIRECT);
2263 if (!temp)
2264 goto fail;
2265 if (temp != result)
2266 convert_move (result, temp, true);
2268 emit_label (after_label);
2269 convert_move (target, result, true);
2271 seq = get_insns ();
2272 end_sequence ();
2274 add_equal_note (seq, target, CLZ, xop0, 0);
2275 emit_insn (seq);
2276 return target;
2278 fail:
2279 end_sequence ();
2280 return 0;
2283 /* Try calculating popcount of a double-word quantity as two popcount's of
2284 word-sized quantities and summing up the results. */
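/* Editorial sketch:

       unsigned int
       popcount64 (unsigned long long x)
       {
         return __builtin_popcount ((unsigned int) x)
                + __builtin_popcount ((unsigned int) (x >> 32));
       }
 */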
2285 static rtx
2286 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2288 rtx t0, t1, t;
2289 rtx_insn *seq;
2291 start_sequence ();
2293 t0 = expand_unop_direct (word_mode, popcount_optab,
2294 operand_subword_force (op0, 0, mode), NULL_RTX,
2295 true);
2296 t1 = expand_unop_direct (word_mode, popcount_optab,
2297 operand_subword_force (op0, 1, mode), NULL_RTX,
2298 true);
2299 if (!t0 || !t1)
2301 end_sequence ();
2302 return NULL_RTX;
2305 /* If we were not given a target, use a word_mode register, not a
2306 'mode' register. The result will fit, and nobody is expecting
2307 anything bigger (the return type of __builtin_popcount* is int). */
2308 if (!target)
2309 target = gen_reg_rtx (word_mode);
2311 t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2313 seq = get_insns ();
2314 end_sequence ();
2316 add_equal_note (seq, t, POPCOUNT, op0, 0);
2317 emit_insn (seq);
2318 return t;
2321 /* Try calculating
2322 (parity:wide x)
2323 as
2324 (parity:narrow (low (x) ^ high (x))). */
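/* Editorial sketch: parity of a concatenation is the xor of the
   parities, so the two halves can be folded together first:

       unsigned int
       parity64 (unsigned long long x)
       {
         return __builtin_parity ((unsigned int) x
                                  ^ (unsigned int) (x >> 32));
       }
 */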
2325 static rtx
2326 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2328 rtx t = expand_binop (word_mode, xor_optab,
2329 operand_subword_force (op0, 0, mode),
2330 operand_subword_force (op0, 1, mode),
2331 NULL_RTX, 0, OPTAB_DIRECT);
2332 return expand_unop (word_mode, parity_optab, t, target, true);
2335 /* Try calculating
2336 (bswap:narrow x)
2337 as
2338 (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))). */
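/* Editorial example: a 16-bit bswap via a 32-bit one; the wide bswap
   moves the narrow value's bytes to the top, and the logical right
   shift by the precision difference brings them back down:

       unsigned short
       bswap16 (unsigned short x)
       {
         return __builtin_bswap32 (x) >> 16;
       }
 */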
2339 static rtx
2340 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2342 rtx x;
2343 rtx_insn *last;
2344 opt_scalar_int_mode wider_mode_iter;
2346 FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2347 if (optab_handler (bswap_optab, wider_mode_iter.require ())
2348 != CODE_FOR_nothing)
2349 break;
2351 if (!wider_mode_iter.exists ())
2352 return NULL_RTX;
2354 scalar_int_mode wider_mode = wider_mode_iter.require ();
2355 last = get_last_insn ();
2357 x = widen_operand (op0, wider_mode, mode, true, true);
2358 x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2360 gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2361 && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2362 if (x != 0)
2363 x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2364 GET_MODE_BITSIZE (wider_mode)
2365 - GET_MODE_BITSIZE (mode),
2366 NULL_RTX, true);
2368 if (x != 0)
2370 if (target == 0)
2371 target = gen_reg_rtx (mode);
2372 emit_move_insn (target, gen_lowpart (mode, x));
2374 else
2375 delete_insns_since (last);
2377 return target;
2380 /* Try calculating bswap as two bswaps of two word-sized operands. */
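/* Editorial sketch: byte-swap each word and exchange the two words:

       unsigned long long
       bswap64 (unsigned long long x)
       {
         unsigned int lo = (unsigned int) x, hi = x >> 32;
         return ((unsigned long long) __builtin_bswap32 (lo) << 32)
                | __builtin_bswap32 (hi);
       }
 */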
2382 static rtx
2383 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2385 rtx t0, t1;
2387 t1 = expand_unop (word_mode, bswap_optab,
2388 operand_subword_force (op, 0, mode), NULL_RTX, true);
2389 t0 = expand_unop (word_mode, bswap_optab,
2390 operand_subword_force (op, 1, mode), NULL_RTX, true);
2392 if (target == 0 || !valid_multiword_target_p (target))
2393 target = gen_reg_rtx (mode);
2394 if (REG_P (target))
2395 emit_clobber (target);
2396 emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2397 emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2399 return target;
2402 /* Try calculating (parity x) as (and (popcount x) 1), where
2403 popcount can also be done in a wider mode. */
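/* Editorial example:

       unsigned int
       parity32 (unsigned int x)
       {
         return __builtin_popcount (x) & 1;
       }
 */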
2404 static rtx
2405 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2407 enum mode_class mclass = GET_MODE_CLASS (mode);
2408 opt_scalar_int_mode wider_mode_iter;
2409 FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2411 scalar_int_mode wider_mode = wider_mode_iter.require ();
2412 if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2414 rtx xop0, temp;
2415 rtx_insn *last;
2417 last = get_last_insn ();
2419 if (target == 0 || GET_MODE (target) != wider_mode)
2420 target = gen_reg_rtx (wider_mode);
2422 xop0 = widen_operand (op0, wider_mode, mode, true, false);
2423 temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2424 true);
2425 if (temp != 0)
2426 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2427 target, true, OPTAB_DIRECT);
2429 if (temp)
2431 if (mclass != MODE_INT
2432 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2433 return convert_to_mode (mode, temp, 0);
2434 else
2435 return gen_lowpart (mode, temp);
2437 else
2438 delete_insns_since (last);
2441 return 0;
2444 /* Try calculating ctz(x) as K - clz(x & -x),
2445 where K is GET_MODE_PRECISION(mode) - 1.
2447 Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2448 don't have to worry about what the hardware does in that case. (If
2449 the clz instruction produces the usual value at 0, which is K, the
2450 result of this code sequence will be -1; expand_ffs, below, relies
2451 on this. It might be nice to have it be K instead, for consistency
2452 with the (very few) processors that provide a ctz with a defined
2453 value, but that would take one more instruction, and it would be
2454 less convenient for expand_ffs anyway.) */
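/* Editorial example for 32 bits: x & -x isolates the lowest set bit,
   a power of two 2^k whose clz is 31 - k:

       unsigned int
       ctz32 (unsigned int x)          // undefined at x == 0
       {
         return 31 - __builtin_clz (x & -x);
       }

   E.g. x = 84 (1010100 in binary) gives x & -x = 4, clz = 29, result 2.  */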
2456 static rtx
2457 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2459 rtx_insn *seq;
2460 rtx temp;
2462 if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2463 return 0;
2465 start_sequence ();
2467 temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2468 if (temp)
2469 temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2470 true, OPTAB_DIRECT);
2471 if (temp)
2472 temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2473 if (temp)
2474 temp = expand_binop (mode, sub_optab,
2475 gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2476 temp, target,
2477 true, OPTAB_DIRECT);
2478 if (temp == 0)
2480 end_sequence ();
2481 return 0;
2484 seq = get_insns ();
2485 end_sequence ();
2487 add_equal_note (seq, temp, CTZ, op0, 0);
2488 emit_insn (seq);
2489 return temp;
2493 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2494 else with the sequence used by expand_clz.
2496 The ffs builtin promises to return zero for a zero value and ctz/clz
2497 may have an undefined value in that case. If they do not give us a
2498 convenient value, we have to generate a test and branch. */
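/* Editorial sketch of the general case, with the explicit zero test:

       unsigned int
       ffs32 (unsigned int x)
       {
         return x ? __builtin_ctz (x) + 1 : 0;
       }

   When the ctz sequence happens to yield -1 at zero, the final +1
   already produces 0 and the test-and-branch can be omitted.  */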
2499 static rtx
2500 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2502 HOST_WIDE_INT val = 0;
2503 bool defined_at_zero = false;
2504 rtx temp;
2505 rtx_insn *seq;
2507 if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2509 start_sequence ();
2511 temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2512 if (!temp)
2513 goto fail;
2515 defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2517 else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2519 start_sequence ();
2520 temp = expand_ctz (mode, op0, 0);
2521 if (!temp)
2522 goto fail;
2524 if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2526 defined_at_zero = true;
2527 val = (GET_MODE_PRECISION (mode) - 1) - val;
2530 else
2531 return 0;
2533 if (defined_at_zero && val == -1)
2534 /* No correction needed at zero. */;
2535 else
2537 /* We don't try to do anything clever with the situation found
2538 on some processors (eg Alpha) where ctz(0:mode) ==
2539 bitsize(mode). If someone can think of a way to send N to -1
2540 and leave alone all values in the range 0..N-1 (where N is a
2541 power of two), cheaper than this test-and-branch, please add it.
2543 The test-and-branch is done after the operation itself, in case
2544 the operation sets condition codes that can be recycled for this.
2545 (This is true on i386, for instance.) */
2547 rtx_code_label *nonzero_label = gen_label_rtx ();
2548 emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2549 mode, true, nonzero_label);
2551 convert_move (temp, GEN_INT (-1), false);
2552 emit_label (nonzero_label);
2555 /* temp now has a value in the range -1..bitsize-1. ffs is supposed
2556 to produce a value in the range 0..bitsize. */
2557 temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2558 target, false, OPTAB_DIRECT);
2559 if (!temp)
2560 goto fail;
2562 seq = get_insns ();
2563 end_sequence ();
2565 add_equal_note (seq, temp, FFS, op0, 0);
2566 emit_insn (seq);
2567 return temp;
2569 fail:
2570 end_sequence ();
2571 return 0;
2574 /* Extract the OMODE lowpart from VAL, which has IMODE. Under certain
2575 conditions, VAL may already be a SUBREG against which we cannot generate
2576 a further SUBREG. In this case, we expect forcing the value into a
2577 register will work around the situation. */
2579 static rtx
2580 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2581 machine_mode imode)
2583 rtx ret;
2584 ret = lowpart_subreg (omode, val, imode);
2585 if (ret == NULL)
2587 val = force_reg (imode, val);
2588 ret = lowpart_subreg (omode, val, imode);
2589 gcc_assert (ret != NULL);
2591 return ret;
2594 /* Expand a floating point absolute value or negation operation via a
2595 logical operation on the sign bit. */
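/* Editorial example for IEEE binary32, assuming a 32-bit unsigned int:

       float
       neg_bits (float x)
       {
         union { float f; unsigned int i; } u = { x };
         u.i ^= 0x80000000u;     // NEG flips the sign bit;
         return u.f;             // ABS would AND with ~0x80000000u instead
       }
 */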
2597 static rtx
2598 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2599 rtx op0, rtx target)
2601 const struct real_format *fmt;
2602 int bitpos, word, nwords, i;
2603 scalar_int_mode imode;
2604 rtx temp;
2605 rtx_insn *insns;
2607 /* The format has to have a simple sign bit. */
2608 fmt = REAL_MODE_FORMAT (mode);
2609 if (fmt == NULL)
2610 return NULL_RTX;
2612 bitpos = fmt->signbit_rw;
2613 if (bitpos < 0)
2614 return NULL_RTX;
2616 /* Don't create negative zeros if the format doesn't support them. */
2617 if (code == NEG && !fmt->has_signed_zero)
2618 return NULL_RTX;
2620 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2622 if (!int_mode_for_mode (mode).exists (&imode))
2623 return NULL_RTX;
2624 word = 0;
2625 nwords = 1;
2627 else
2629 imode = word_mode;
2631 if (FLOAT_WORDS_BIG_ENDIAN)
2632 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2633 else
2634 word = bitpos / BITS_PER_WORD;
2635 bitpos = bitpos % BITS_PER_WORD;
2636 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2639 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2640 if (code == ABS)
2641 mask = ~mask;
2643 if (target == 0
2644 || target == op0
2645 || (nwords > 1 && !valid_multiword_target_p (target)))
2646 target = gen_reg_rtx (mode);
2648 if (nwords > 1)
2650 start_sequence ();
2652 for (i = 0; i < nwords; ++i)
2654 rtx targ_piece = operand_subword (target, i, 1, mode);
2655 rtx op0_piece = operand_subword_force (op0, i, mode);
2657 if (i == word)
2659 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2660 op0_piece,
2661 immed_wide_int_const (mask, imode),
2662 targ_piece, 1, OPTAB_LIB_WIDEN);
2663 if (temp != targ_piece)
2664 emit_move_insn (targ_piece, temp);
2666 else
2667 emit_move_insn (targ_piece, op0_piece);
2670 insns = get_insns ();
2671 end_sequence ();
2673 emit_insn (insns);
2675 else
2677 temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2678 gen_lowpart (imode, op0),
2679 immed_wide_int_const (mask, imode),
2680 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2681 target = lowpart_subreg_maybe_copy (mode, temp, imode);
2683 set_dst_reg_note (get_last_insn (), REG_EQUAL,
2684 gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2685 target);
2688 return target;
2691 /* As expand_unop, but will fail rather than attempt the operation in a
2692 different mode or with a libcall. */
2693 static rtx
2694 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2695 int unsignedp)
2697 if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2699 struct expand_operand ops[2];
2700 enum insn_code icode = optab_handler (unoptab, mode);
2701 rtx_insn *last = get_last_insn ();
2702 rtx_insn *pat;
2704 create_output_operand (&ops[0], target, mode);
2705 create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2706 pat = maybe_gen_insn (icode, 2, ops);
2707 if (pat)
2709 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2710 && ! add_equal_note (pat, ops[0].value,
2711 optab_to_code (unoptab),
2712 ops[1].value, NULL_RTX))
2714 delete_insns_since (last);
2715 return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2718 emit_insn (pat);
2720 return ops[0].value;
2723 return 0;
2726 /* Generate code to perform an operation specified by UNOPTAB
2727 on operand OP0, with result having machine-mode MODE.
2729 UNSIGNEDP is for the case where we have to widen the operands
2730 to perform the operation. It says to use zero-extension.
2732 If TARGET is nonzero, the value
2733 is generated there, if it is convenient to do so.
2734 In all cases an rtx is returned for the locus of the value;
2735 this may or may not be TARGET. */
2737 rtx
2738 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2739 int unsignedp)
2741 enum mode_class mclass = GET_MODE_CLASS (mode);
2742 machine_mode wider_mode;
2743 scalar_int_mode int_mode;
2744 scalar_float_mode float_mode;
2745 rtx temp;
2746 rtx libfunc;
2748 temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2749 if (temp)
2750 return temp;
2752 /* It can't be done in this mode. Can we open-code it in a wider mode? */
2754 /* Widening (or narrowing) clz needs special treatment. */
2755 if (unoptab == clz_optab)
2757 if (is_a <scalar_int_mode> (mode, &int_mode))
2759 temp = widen_leading (int_mode, op0, target, unoptab);
2760 if (temp)
2761 return temp;
2763 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2764 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2766 temp = expand_doubleword_clz (int_mode, op0, target);
2767 if (temp)
2768 return temp;
2772 goto try_libcall;
2775 if (unoptab == clrsb_optab)
2777 if (is_a <scalar_int_mode> (mode, &int_mode))
2779 temp = widen_leading (int_mode, op0, target, unoptab);
2780 if (temp)
2781 return temp;
2783 goto try_libcall;
2786 if (unoptab == popcount_optab
2787 && is_a <scalar_int_mode> (mode, &int_mode)
2788 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2789 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2790 && optimize_insn_for_speed_p ())
2792 temp = expand_doubleword_popcount (int_mode, op0, target);
2793 if (temp)
2794 return temp;
2797 if (unoptab == parity_optab
2798 && is_a <scalar_int_mode> (mode, &int_mode)
2799 && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2800 && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2801 || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2802 && optimize_insn_for_speed_p ())
2804 temp = expand_doubleword_parity (int_mode, op0, target);
2805 if (temp)
2806 return temp;
2809 /* Widening (or narrowing) bswap needs special treatment. */
2810 if (unoptab == bswap_optab)
2812 /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2813 or ROTATERT. First try these directly; if this fails, then try the
2814 obvious pair of shifts with allowed widening, as this will probably
2815 always be more efficient than the other fallback methods. */
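/* Editorial example: for 16 bits, a rotate by 8 in either direction
   swaps the two bytes, and so does the shift pair:

       unsigned short
       bswap16 (unsigned short x)
       {
         return (unsigned short) ((x << 8) | (x >> 8));
       }
 */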
2816 if (mode == HImode)
2818 rtx_insn *last;
2819 rtx temp1, temp2;
2821 if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2823 temp = expand_binop (mode, rotl_optab, op0,
2824 gen_int_shift_amount (mode, 8),
2825 target, unsignedp, OPTAB_DIRECT);
2826 if (temp)
2827 return temp;
2830 if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2832 temp = expand_binop (mode, rotr_optab, op0,
2833 gen_int_shift_amount (mode, 8),
2834 target, unsignedp, OPTAB_DIRECT);
2835 if (temp)
2836 return temp;
2839 last = get_last_insn ();
2841 temp1 = expand_binop (mode, ashl_optab, op0,
2842 gen_int_shift_amount (mode, 8), NULL_RTX,
2843 unsignedp, OPTAB_WIDEN);
2844 temp2 = expand_binop (mode, lshr_optab, op0,
2845 gen_int_shift_amount (mode, 8), NULL_RTX,
2846 unsignedp, OPTAB_WIDEN);
2847 if (temp1 && temp2)
2849 temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2850 unsignedp, OPTAB_WIDEN);
2851 if (temp)
2852 return temp;
2855 delete_insns_since (last);
2858 if (is_a <scalar_int_mode> (mode, &int_mode))
2860 temp = widen_bswap (int_mode, op0, target);
2861 if (temp)
2862 return temp;
2864 if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2865 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2867 temp = expand_doubleword_bswap (mode, op0, target);
2868 if (temp)
2869 return temp;
2873 goto try_libcall;
2876 if (CLASS_HAS_WIDER_MODES_P (mclass))
2877 FOR_EACH_WIDER_MODE (wider_mode, mode)
2879 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2881 rtx xop0 = op0;
2882 rtx_insn *last = get_last_insn ();
2884 /* For certain operations, we need not actually extend
2885 the narrow operand, as long as we will truncate the
2886 results to the same narrowness. */
2888 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2889 (unoptab == neg_optab
2890 || unoptab == one_cmpl_optab)
2891 && mclass == MODE_INT);
2893 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2894 unsignedp);
2896 if (temp)
2898 if (mclass != MODE_INT
2899 || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2901 if (target == 0)
2902 target = gen_reg_rtx (mode);
2903 convert_move (target, temp, 0);
2904 return target;
2906 else
2907 return gen_lowpart (mode, temp);
2909 else
2910 delete_insns_since (last);
2914 /* These can be done a word at a time. */
2915 if (unoptab == one_cmpl_optab
2916 && is_int_mode (mode, &int_mode)
2917 && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2918 && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2920 int i;
2921 rtx_insn *insns;
2923 if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2924 target = gen_reg_rtx (int_mode);
2926 start_sequence ();
2928 /* Do the actual arithmetic. */
2929 for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2931 rtx target_piece = operand_subword (target, i, 1, int_mode);
2932 rtx x = expand_unop (word_mode, unoptab,
2933 operand_subword_force (op0, i, int_mode),
2934 target_piece, unsignedp);
2936 if (target_piece != x)
2937 emit_move_insn (target_piece, x);
2940 insns = get_insns ();
2941 end_sequence ();
2943 emit_insn (insns);
2944 return target;
2947 if (optab_to_code (unoptab) == NEG)
2949 /* Try negating floating point values by flipping the sign bit. */
2950 if (is_a <scalar_float_mode> (mode, &float_mode))
2952 temp = expand_absneg_bit (NEG, float_mode, op0, target);
2953 if (temp)
2954 return temp;
2957 /* If there is no negation pattern, and we have no negative zero,
2958 try subtracting from zero. */
2959 if (!HONOR_SIGNED_ZEROS (mode))
2961 temp = expand_binop (mode, (unoptab == negv_optab
2962 ? subv_optab : sub_optab),
2963 CONST0_RTX (mode), op0, target,
2964 unsignedp, OPTAB_DIRECT);
2965 if (temp)
2966 return temp;
2970 /* Try calculating parity (x) as popcount (x) % 2. */
2971 if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2973 temp = expand_parity (int_mode, op0, target);
2974 if (temp)
2975 return temp;
2978 /* Try implementing ffs (x) in terms of clz (x). */
2979 if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2981 temp = expand_ffs (int_mode, op0, target);
2982 if (temp)
2983 return temp;
2986 /* Try implementing ctz (x) in terms of clz (x). */
2987 if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2989 temp = expand_ctz (int_mode, op0, target);
2990 if (temp)
2991 return temp;
2994 try_libcall:
2995 /* Now try a library call in this mode. */
2996 libfunc = optab_libfunc (unoptab, mode);
2997 if (libfunc)
2999 rtx_insn *insns;
3000 rtx value;
3001 rtx eq_value;
3002 machine_mode outmode = mode;
3004 /* All of these functions return small values. Thus we choose to
3005 have them return something that isn't a double-word. */
3006 if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3007 || unoptab == clrsb_optab || unoptab == popcount_optab
3008 || unoptab == parity_optab)
3009 outmode
3010 = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3011 optab_libfunc (unoptab, mode)));
3013 start_sequence ();
3015 /* Pass 1 for NO_QUEUE so we don't lose any increments
3016 if the libcall is cse'd or moved. */
3017 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3018 op0, mode);
3019 insns = get_insns ();
3020 end_sequence ();
3022 target = gen_reg_rtx (outmode);
3023 bool trapv = trapv_unoptab_p (unoptab);
3024 if (trapv)
3025 eq_value = NULL_RTX;
3026 else
3028 eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3029 if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3030 eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3031 else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3032 eq_value = simplify_gen_unary (ZERO_EXTEND,
3033 outmode, eq_value, mode);
3035 emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3037 return target;
3040 /* It can't be done in this mode. Can we do it in a wider mode? */
3042 if (CLASS_HAS_WIDER_MODES_P (mclass))
3044 FOR_EACH_WIDER_MODE (wider_mode, mode)
3046 if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3047 || optab_libfunc (unoptab, wider_mode))
3049 rtx xop0 = op0;
3050 rtx_insn *last = get_last_insn ();
3052 /* For certain operations, we need not actually extend
3053 the narrow operand, as long as we will truncate the
3054 results to the same narrowness. */
3055 xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3056 (unoptab == neg_optab
3057 || unoptab == one_cmpl_optab
3058 || unoptab == bswap_optab)
3059 && mclass == MODE_INT);
3061 temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3062 unsignedp);
3064 /* If we are generating clz using wider mode, adjust the
3065 result. Similarly for clrsb. */
3066 if ((unoptab == clz_optab || unoptab == clrsb_optab)
3067 && temp != 0)
3069 scalar_int_mode wider_int_mode
3070 = as_a <scalar_int_mode> (wider_mode);
3071 int_mode = as_a <scalar_int_mode> (mode);
3072 temp = expand_binop
3073 (wider_mode, sub_optab, temp,
3074 gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3075 - GET_MODE_PRECISION (int_mode),
3076 wider_int_mode),
3077 target, true, OPTAB_DIRECT);
3080 /* Likewise for bswap. */
3081 if (unoptab == bswap_optab && temp != 0)
3083 scalar_int_mode wider_int_mode
3084 = as_a <scalar_int_mode> (wider_mode);
3085 int_mode = as_a <scalar_int_mode> (mode);
3086 gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3087 == GET_MODE_BITSIZE (wider_int_mode)
3088 && GET_MODE_PRECISION (int_mode)
3089 == GET_MODE_BITSIZE (int_mode));
3091 temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3092 GET_MODE_BITSIZE (wider_int_mode)
3093 - GET_MODE_BITSIZE (int_mode),
3094 NULL_RTX, true);
3097 if (temp)
3099 if (mclass != MODE_INT)
3101 if (target == 0)
3102 target = gen_reg_rtx (mode);
3103 convert_move (target, temp, 0);
3104 return target;
3106 else
3107 return gen_lowpart (mode, temp);
3109 else
3110 delete_insns_since (last);
3115 /* One final attempt at implementing negation via subtraction,
3116 this time allowing widening of the operand. */
3117 if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3119 rtx temp;
3120 temp = expand_binop (mode,
3121 unoptab == negv_optab ? subv_optab : sub_optab,
3122 CONST0_RTX (mode), op0,
3123 target, unsignedp, OPTAB_LIB_WIDEN);
3124 if (temp)
3125 return temp;
3128 return 0;
3131 /* Emit code to compute the absolute value of OP0, with result to
3132 TARGET if convenient. (TARGET may be 0.) The return value says
3133 where the result actually is to be found.
3135 MODE is the mode of the operand; the mode of the result is
3136 different but can be deduced from MODE. */
3140 rtx
3141 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3142 int result_unsignedp)
3144 rtx temp;
3146 if (GET_MODE_CLASS (mode) != MODE_INT
3147 || ! flag_trapv)
3148 result_unsignedp = 1;
3150 /* First try to do it with a special abs instruction. */
3151 temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3152 op0, target, 0);
3153 if (temp != 0)
3154 return temp;
3156 /* For floating point modes, try clearing the sign bit. */
3157 scalar_float_mode float_mode;
3158 if (is_a <scalar_float_mode> (mode, &float_mode))
3160 temp = expand_absneg_bit (ABS, float_mode, op0, target);
3161 if (temp)
3162 return temp;
3165 /* If we have a MAX insn, we can do this as MAX (x, -x). */
3166 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3167 && !HONOR_SIGNED_ZEROS (mode))
3169 rtx_insn *last = get_last_insn ();
3171 temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3172 op0, NULL_RTX, 0);
3173 if (temp != 0)
3174 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3175 OPTAB_WIDEN);
3177 if (temp != 0)
3178 return temp;
3180 delete_insns_since (last);
3183 /* If this machine has expensive jumps, we can do integer absolute
3184 value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3185 where W is the width of MODE. */
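/* Editorial example for 32-bit int: the arithmetic shift yields s = 0
   for non-negative x and s = -1 otherwise, so (x ^ s) - s negates
   conditionally without a branch:

       int
       abs32 (int x)
       {
         int s = x >> 31;
         return (x ^ s) - s;     // overflows only for INT_MIN, as abs does
       }
 */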
3187 scalar_int_mode int_mode;
3188 if (is_int_mode (mode, &int_mode)
3189 && BRANCH_COST (optimize_insn_for_speed_p (),
3190 false) >= 2)
3192 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3193 GET_MODE_PRECISION (int_mode) - 1,
3194 NULL_RTX, 0);
3196 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3197 OPTAB_LIB_WIDEN);
3198 if (temp != 0)
3199 temp = expand_binop (int_mode,
3200 result_unsignedp ? sub_optab : subv_optab,
3201 temp, extended, target, 0, OPTAB_LIB_WIDEN);
3203 if (temp != 0)
3204 return temp;
3207 return NULL_RTX;
3210 rtx
3211 expand_abs (machine_mode mode, rtx op0, rtx target,
3212 int result_unsignedp, int safe)
3214 rtx temp;
3215 rtx_code_label *op1;
3217 if (GET_MODE_CLASS (mode) != MODE_INT
3218 || ! flag_trapv)
3219 result_unsignedp = 1;
3221 temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3222 if (temp != 0)
3223 return temp;
3225 /* If that does not win, use conditional jump and negate. */
3227 /* It is safe to use the target if it is the same as the source,
3228 provided it is also a pseudo register. */
3229 if (op0 == target && REG_P (op0)
3230 && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3231 safe = 1;
3233 op1 = gen_label_rtx ();
3234 if (target == 0 || ! safe
3235 || GET_MODE (target) != mode
3236 || (MEM_P (target) && MEM_VOLATILE_P (target))
3237 || (REG_P (target)
3238 && REGNO (target) < FIRST_PSEUDO_REGISTER))
3239 target = gen_reg_rtx (mode);
3241 emit_move_insn (target, op0);
3242 NO_DEFER_POP;
3244 do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3245 NULL_RTX, NULL, op1,
3246 profile_probability::uninitialized ());
3248 op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3249 target, target, 0);
3250 if (op0 != target)
3251 emit_move_insn (target, op0);
3252 emit_label (op1);
3253 OK_DEFER_POP;
3254 return target;
3257 /* Emit code to compute the one's complement absolute value of OP0
3258 (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3259 (TARGET may be NULL_RTX.) The return value says where the result
3260 actually is to be found.
3262 MODE is the mode of the operand; the mode of the result is
3263 different but can be deduced from MODE. */
3265 rtx
3266 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3268 rtx temp;
3270 /* Not applicable for floating point modes. */
3271 if (FLOAT_MODE_P (mode))
3272 return NULL_RTX;
3274 /* If we have a MAX insn, we can do this as MAX (x, ~x). */
3275 if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3277 rtx_insn *last = get_last_insn ();
3279 temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3280 if (temp != 0)
3281 temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3282 OPTAB_WIDEN);
3284 if (temp != 0)
3285 return temp;
3287 delete_insns_since (last);
3290 /* If this machine has expensive jumps, we can do one's complement
3291 absolute value of X as (((signed) x >> (W-1)) ^ x). */
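/* Editorial example, the same mask trick minus the final subtraction:

       int
       one_cmpl_abs32 (int x)
       {
         int s = x >> 31;
         return x ^ s;           // x >= 0 ? x : ~x
       }
 */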
3293 scalar_int_mode int_mode;
3294 if (is_int_mode (mode, &int_mode)
3295 && BRANCH_COST (optimize_insn_for_speed_p (),
3296 false) >= 2)
3298 rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3299 GET_MODE_PRECISION (int_mode) - 1,
3300 NULL_RTX, 0);
3302 temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3303 OPTAB_LIB_WIDEN);
3305 if (temp != 0)
3306 return temp;
3309 return NULL_RTX;
3312 /* A subroutine of expand_copysign, perform the copysign operation using the
3313 abs and neg primitives advertised to exist on the target. The assumption
3314 is that we have a split register file, and leaving op0 in fp registers,
3315 and not playing with subregs so much, will help the register allocator. */
3317 static rtx
3318 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3319 int bitpos, bool op0_is_abs)
3321 scalar_int_mode imode;
3322 enum insn_code icode;
3323 rtx sign;
3324 rtx_code_label *label;
3326 if (target == op1)
3327 target = NULL_RTX;
3329 /* Check if the back end provides an insn that handles signbit for the
3330 argument's mode. */
3331 icode = optab_handler (signbit_optab, mode);
3332 if (icode != CODE_FOR_nothing)
3334 imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3335 sign = gen_reg_rtx (imode);
3336 emit_unop_insn (icode, sign, op1, UNKNOWN);
3338 else
3340 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3342 if (!int_mode_for_mode (mode).exists (&imode))
3343 return NULL_RTX;
3344 op1 = gen_lowpart (imode, op1);
3346 else
3348 int word;
3350 imode = word_mode;
3351 if (FLOAT_WORDS_BIG_ENDIAN)
3352 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3353 else
3354 word = bitpos / BITS_PER_WORD;
3355 bitpos = bitpos % BITS_PER_WORD;
3356 op1 = operand_subword_force (op1, word, mode);
3359 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3360 sign = expand_binop (imode, and_optab, op1,
3361 immed_wide_int_const (mask, imode),
3362 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3365 if (!op0_is_abs)
3367 op0 = expand_unop (mode, abs_optab, op0, target, 0);
3368 if (op0 == NULL)
3369 return NULL_RTX;
3370 target = op0;
3372 else
3374 if (target == NULL_RTX)
3375 target = copy_to_reg (op0);
3376 else
3377 emit_move_insn (target, op0);
3380 label = gen_label_rtx ();
3381 emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3383 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3384 op0 = simplify_unary_operation (NEG, mode, op0, mode);
3385 else
3386 op0 = expand_unop (mode, neg_optab, op0, target, 0);
3387 if (op0 != target)
3388 emit_move_insn (target, op0);
3390 emit_label (label);
3392 return target;
3396 /* A subroutine of expand_copysign, perform the entire copysign operation
3397 with integer bitmasks. BITPOS is the position of the sign bit; OP0_IS_ABS
3398 is true if op0 is known to have its sign bit clear. */
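/* Editorial example for IEEE binary32, assuming a 32-bit unsigned int:
   keep OP0's magnitude bits and OP1's sign bit:

       float
       copysign_bits (float x, float y)
       {
         union { float f; unsigned int i; } ux = { x }, uy = { y };
         ux.i = (ux.i & ~0x80000000u) | (uy.i & 0x80000000u);
         return ux.f;
       }
 */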
3400 static rtx
3401 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3402 int bitpos, bool op0_is_abs)
3404 scalar_int_mode imode;
3405 int word, nwords, i;
3406 rtx temp;
3407 rtx_insn *insns;
3409 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3411 if (!int_mode_for_mode (mode).exists (&imode))
3412 return NULL_RTX;
3413 word = 0;
3414 nwords = 1;
3416 else
3418 imode = word_mode;
3420 if (FLOAT_WORDS_BIG_ENDIAN)
3421 word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3422 else
3423 word = bitpos / BITS_PER_WORD;
3424 bitpos = bitpos % BITS_PER_WORD;
3425 nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3428 wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3430 if (target == 0
3431 || target == op0
3432 || target == op1
3433 || (nwords > 1 && !valid_multiword_target_p (target)))
3434 target = gen_reg_rtx (mode);
3436 if (nwords > 1)
3438 start_sequence ();
3440 for (i = 0; i < nwords; ++i)
3442 rtx targ_piece = operand_subword (target, i, 1, mode);
3443 rtx op0_piece = operand_subword_force (op0, i, mode);
3445 if (i == word)
3447 if (!op0_is_abs)
3448 op0_piece
3449 = expand_binop (imode, and_optab, op0_piece,
3450 immed_wide_int_const (~mask, imode),
3451 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3452 op1 = expand_binop (imode, and_optab,
3453 operand_subword_force (op1, i, mode),
3454 immed_wide_int_const (mask, imode),
3455 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3457 temp = expand_binop (imode, ior_optab, op0_piece, op1,
3458 targ_piece, 1, OPTAB_LIB_WIDEN);
3459 if (temp != targ_piece)
3460 emit_move_insn (targ_piece, temp);
3462 else
3463 emit_move_insn (targ_piece, op0_piece);
3466 insns = get_insns ();
3467 end_sequence ();
3469 emit_insn (insns);
3471 else
3473 op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3474 immed_wide_int_const (mask, imode),
3475 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3477 op0 = gen_lowpart (imode, op0);
3478 if (!op0_is_abs)
3479 op0 = expand_binop (imode, and_optab, op0,
3480 immed_wide_int_const (~mask, imode),
3481 NULL_RTX, 1, OPTAB_LIB_WIDEN);
3483 temp = expand_binop (imode, ior_optab, op0, op1,
3484 gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3485 target = lowpart_subreg_maybe_copy (mode, temp, imode);
3488 return target;
3491 /* Expand the C99 copysign operation. OP0 and OP1 must be the same
3492 scalar floating point mode. Return NULL if we do not know how to
3493 expand the operation inline. */
3495 rtx
3496 expand_copysign (rtx op0, rtx op1, rtx target)
3498 scalar_float_mode mode;
3499 const struct real_format *fmt;
3500 bool op0_is_abs;
3501 rtx temp;
3503 mode = as_a <scalar_float_mode> (GET_MODE (op0));
3504 gcc_assert (GET_MODE (op1) == mode);
3506 /* First try to do it with a special instruction. */
3507 temp = expand_binop (mode, copysign_optab, op0, op1,
3508 target, 0, OPTAB_DIRECT);
3509 if (temp)
3510 return temp;
3512 fmt = REAL_MODE_FORMAT (mode);
3513 if (fmt == NULL || !fmt->has_signed_zero)
3514 return NULL_RTX;
3516 op0_is_abs = false;
3517 if (CONST_DOUBLE_AS_FLOAT_P (op0))
3519 if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3520 op0 = simplify_unary_operation (ABS, mode, op0, mode);
3521 op0_is_abs = true;
3524 if (fmt->signbit_ro >= 0
3525 && (CONST_DOUBLE_AS_FLOAT_P (op0)
3526 || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3527 && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3529 temp = expand_copysign_absneg (mode, op0, op1, target,
3530 fmt->signbit_ro, op0_is_abs);
3531 if (temp)
3532 return temp;
3535 if (fmt->signbit_rw < 0)
3536 return NULL_RTX;
3537 return expand_copysign_bit (mode, op0, op1, target,
3538 fmt->signbit_rw, op0_is_abs);
3541 /* Generate an instruction whose insn-code is INSN_CODE,
3542 with two operands: an output TARGET and an input OP0.
3543 TARGET *must* be nonzero, and the output is always stored there.
3544 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3545 the value that is stored into TARGET.
3547 Return false if expansion failed. */
3549 bool
3550 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3551 enum rtx_code code)
3553 struct expand_operand ops[2];
3554 rtx_insn *pat;
3556 create_output_operand (&ops[0], target, GET_MODE (target));
3557 create_input_operand (&ops[1], op0, GET_MODE (op0));
3558 pat = maybe_gen_insn (icode, 2, ops);
3559 if (!pat)
3560 return false;
3562 if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3563 && code != UNKNOWN)
3564 add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3566 emit_insn (pat);
3568 if (ops[0].value != target)
3569 emit_move_insn (target, ops[0].value);
3570 return true;
3572 /* Generate an instruction whose insn-code is INSN_CODE,
3573 with two operands: an output TARGET and an input OP0.
3574 TARGET *must* be nonzero, and the output is always stored there.
3575 CODE is an rtx code such that (CODE OP0) is an rtx that describes
3576 the value that is stored into TARGET. */
3578 void
3579 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3581 bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3582 gcc_assert (ok);
3585 struct no_conflict_data
3587 rtx target;
3588 rtx_insn *first, *insn;
3589 bool must_stay;
3592 /* Called via note_stores by emit_libcall_block. Set P->must_stay if
3593 the currently examined clobber / store has to stay in the list of
3594 insns that constitute the actual libcall block. */
3595 static void
3596 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3598 struct no_conflict_data *p = (struct no_conflict_data *) p0;
3600 /* If this insn directly contributes to setting the target, it must stay. */
3601 if (reg_overlap_mentioned_p (p->target, dest))
3602 p->must_stay = true;
3603 /* If we haven't committed to keeping any other insns in the list yet,
3604 there is nothing more to check. */
3605 else if (p->insn == p->first)
3606 return;
3607 /* If this insn sets / clobbers a register that feeds one of the insns
3608 already in the list, this insn has to stay too. */
3609 else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3610 || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3611 || reg_used_between_p (dest, p->first, p->insn)
3612 /* Likewise if this insn depends on a register set by a previous
3613 insn in the list, or if it sets a result (presumably a hard
3614 register) that is set or clobbered by a previous insn.
3615 N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3616 SET_DEST perform the former check on the address, and the latter
3617 check on the MEM. */
3618 || (GET_CODE (set) == SET
3619 && (modified_in_p (SET_SRC (set), p->first)
3620 || modified_in_p (SET_DEST (set), p->first)
3621 || modified_between_p (SET_SRC (set), p->first, p->insn)
3622 || modified_between_p (SET_DEST (set), p->first, p->insn))))
3623 p->must_stay = true;
3627 /* Emit code to make a call to a constant function or a library call.
3629 INSNS is a list containing all insns emitted in the call.
3630 These insns leave the result in RESULT. Our job is to copy RESULT
3631 to TARGET, which is logically equivalent to EQUIV.
3633 We first emit any insns that set a pseudo on the assumption that these are
3634 loading constants into registers; doing so allows them to be safely cse'ed
3635 between blocks. Then we emit all the other insns in the block, followed by
3636 an insn to move RESULT to TARGET. This last insn will have a REG_EQUAL
3637 note with an operand of EQUIV. */
3639 static void
3640 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3641 bool equiv_may_trap)
3643 rtx final_dest = target;
3644 rtx_insn *next, *last, *insn;
3646 /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3647 into a MEM later. Protect the libcall block from this change. */
3648 if (! REG_P (target) || REG_USERVAR_P (target))
3649 target = gen_reg_rtx (GET_MODE (target));
3651 /* If we're using non-call exceptions, a libcall corresponding to an
3652 operation that may trap may also trap. */
3653 /* ??? See the comment in front of make_reg_eh_region_note. */
3654 if (cfun->can_throw_non_call_exceptions
3655 && (equiv_may_trap || may_trap_p (equiv)))
3657 for (insn = insns; insn; insn = NEXT_INSN (insn))
3658 if (CALL_P (insn))
3660 rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3661 if (note)
3663 int lp_nr = INTVAL (XEXP (note, 0));
3664 if (lp_nr == 0 || lp_nr == INT_MIN)
3665 remove_note (insn, note);
3669 else
3671 /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3672 reg note to indicate that this call cannot throw or execute a nonlocal
3673 goto (unless there is already a REG_EH_REGION note, in which case
3674 we update it). */
3675 for (insn = insns; insn; insn = NEXT_INSN (insn))
3676 if (CALL_P (insn))
3677 make_reg_eh_region_note_nothrow_nononlocal (insn);
3680 /* First emit all insns that set pseudos. Remove them from the list as
3681 we go. Avoid insns that set pseudos which were referenced in previous
3682 insns. These can be generated by move_by_pieces, for example,
3683 to update an address. Similarly, avoid insns that reference things
3684 set in previous insns. */
3686 for (insn = insns; insn; insn = next)
3688 rtx set = single_set (insn);
3690 next = NEXT_INSN (insn);
3692 if (set != 0 && REG_P (SET_DEST (set))
3693 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3695 struct no_conflict_data data;
3697 data.target = const0_rtx;
3698 data.first = insns;
3699 data.insn = insn;
3700 data.must_stay = 0;
3701 note_stores (PATTERN (insn), no_conflict_move_test, &data);
3702 if (! data.must_stay)
3704 if (PREV_INSN (insn))
3705 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3706 else
3707 insns = next;
3709 if (next)
3710 SET_PREV_INSN (next) = PREV_INSN (insn);
3712 add_insn (insn);
3716 /* Some ports use a loop to copy large arguments onto the stack.
3717 Don't move anything outside such a loop. */
3718 if (LABEL_P (insn))
3719 break;
3722 /* Write the remaining insns followed by the final copy. */
3723 for (insn = insns; insn; insn = next)
3725 next = NEXT_INSN (insn);
3727 add_insn (insn);
3730 last = emit_move_insn (target, result);
3731 if (equiv)
3732 set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3734 if (final_dest != target)
3735 emit_move_insn (final_dest, target);
3738 void
3739 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3741 emit_libcall_block_1 (insns, target, result, equiv, false);
3744 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3745 PURPOSE describes how this comparison will be used. CODE is the rtx
3746 comparison code we will be using.
3748 ??? Actually, CODE is slightly weaker than that. A target is still
3749 required to implement all of the normal bcc operations, but not
3750 required to implement all (or any) of the unordered bcc operations. */
3753 can_compare_p (enum rtx_code code, machine_mode mode,
3754 enum can_compare_purpose purpose)
3756 rtx test;
3757 test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3760 enum insn_code icode;
3762 if (purpose == ccp_jump
3763 && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3764 && insn_operand_matches (icode, 0, test))
3765 return 1;
3766 if (purpose == ccp_store_flag
3767 && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3768 && insn_operand_matches (icode, 1, test))
3769 return 1;
3770 if (purpose == ccp_cmov
3771 && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3772 return 1;
3774 mode = GET_MODE_WIDER_MODE (mode).else_void ();
3775 PUT_MODE (test, mode);
3777 while (mode != VOIDmode);
3779 return 0;
3782 /* This function is called when we are going to emit a compare instruction that
3783 compares the values found in X and Y, using the rtl operator COMPARISON.
3785 If they have mode BLKmode, then SIZE specifies the size of both operands.
3787 UNSIGNEDP nonzero says that the operands are unsigned;
3788 this matters if they need to be widened (as given by METHODS).
3790 *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3791 if we failed to produce one.
3793 *PMODE is the mode of the inputs (in case they are const_int).
3795 This function performs all the setup necessary so that the caller only has
3796 to emit a single comparison insn. This setup can involve doing a BLKmode
3797 comparison or emitting a library call to perform the comparison if no insn
3798 is available to handle it.
3799 The values which are passed in through pointers can be modified; the caller
3800 should perform the comparison on the modified values. Constant
3801 comparisons must have already been folded. */
3803 static void
3804 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3805 int unsignedp, enum optab_methods methods,
3806 rtx *ptest, machine_mode *pmode)
3808 machine_mode mode = *pmode;
3809 rtx libfunc, test;
3810 machine_mode cmp_mode;
3811 enum mode_class mclass;
3813 /* The other methods are not needed. */
3814 gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3815 || methods == OPTAB_LIB_WIDEN);
3817 if (CONST_SCALAR_INT_P (y))
3818 canonicalize_comparison (mode, &comparison, &y);
3820 /* If we are optimizing, force expensive constants into a register. */
3821 if (CONSTANT_P (x) && optimize
3822 && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3823 > COSTS_N_INSNS (1)))
3824 x = force_reg (mode, x);
3826 if (CONSTANT_P (y) && optimize
3827 && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3828 > COSTS_N_INSNS (1)))
3829 y = force_reg (mode, y);
3831 #if HAVE_cc0
3832 /* Make sure we have a canonical comparison. The RTL
3833 documentation states that canonical comparisons are required only
3834 for targets which have cc0. */
3835 gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3836 #endif
3838 /* Don't let both operands fail to indicate the mode. */
3839 if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3840 x = force_reg (mode, x);
3841 if (mode == VOIDmode)
3842 mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3844 /* Handle all BLKmode compares. */
3846 if (mode == BLKmode)
3848 machine_mode result_mode;
3849 enum insn_code cmp_code;
3850 rtx result;
3851 rtx opalign
3852 = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3854 gcc_assert (size);
3856 /* Try to use a memory block compare insn - cmpmem, cmpstr
3857 or cmpstrn will do. */
3858 opt_scalar_int_mode cmp_mode_iter;
3859 FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3861 scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3862 cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3863 if (cmp_code == CODE_FOR_nothing)
3864 cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3865 if (cmp_code == CODE_FOR_nothing)
3866 cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3867 if (cmp_code == CODE_FOR_nothing)
3868 continue;
3870 /* Must make sure the size fits the insn's mode. */
3871 if (CONST_INT_P (size)
3872 ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3873 : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3874 > GET_MODE_BITSIZE (cmp_mode)))
3875 continue;
3877 result_mode = insn_data[cmp_code].operand[0].mode;
3878 result = gen_reg_rtx (result_mode);
3879 size = convert_to_mode (cmp_mode, size, 1);
3880 emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3882 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3883 *pmode = result_mode;
3884 return;
3887 if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3888 goto fail;
3890 /* Otherwise call a library function. */
3891 result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3893 x = result;
3894 y = const0_rtx;
3895 mode = TYPE_MODE (integer_type_node);
3896 methods = OPTAB_LIB_WIDEN;
3897 unsignedp = false;
3900 /* Don't allow operands to the compare to trap, as that can put the
3901 compare and branch in different basic blocks. */
3902 if (cfun->can_throw_non_call_exceptions)
3904 if (may_trap_p (x))
3905 x = copy_to_reg (x);
3906 if (may_trap_p (y))
3907 y = copy_to_reg (y);
3910 if (GET_MODE_CLASS (mode) == MODE_CC)
3912 enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3913 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3914 gcc_assert (icode != CODE_FOR_nothing
3915 && insn_operand_matches (icode, 0, test));
3916 *ptest = test;
3917 return;
3920 mclass = GET_MODE_CLASS (mode);
3921 test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3922 FOR_EACH_MODE_FROM (cmp_mode, mode)
3924 enum insn_code icode;
3925 icode = optab_handler (cbranch_optab, cmp_mode);
3926 if (icode != CODE_FOR_nothing
3927 && insn_operand_matches (icode, 0, test))
3929 rtx_insn *last = get_last_insn ();
3930 rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3931 rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3932 if (op0 && op1
3933 && insn_operand_matches (icode, 1, op0)
3934 && insn_operand_matches (icode, 2, op1))
3936 XEXP (test, 0) = op0;
3937 XEXP (test, 1) = op1;
3938 *ptest = test;
3939 *pmode = cmp_mode;
3940 return;
3942 delete_insns_since (last);
3945 if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3946 break;
3949 if (methods != OPTAB_LIB_WIDEN)
3950 goto fail;
3952 if (SCALAR_FLOAT_MODE_P (mode))
3954 /* Small trick if UNORDERED isn't implemented by the hardware. */
3955 if (comparison == UNORDERED && rtx_equal_p (x, y))
3957 prepare_cmp_insn (x, y, UNLT, NULL_RTX, unsignedp, OPTAB_WIDEN,
3958 ptest, pmode);
3959 if (*ptest)
3960 return;
3963 prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3965 else
3967 rtx result;
3968 machine_mode ret_mode;
3970 /* Handle a libcall just for the mode we are using. */
3971 libfunc = optab_libfunc (cmp_optab, mode);
3972 gcc_assert (libfunc);
3974 /* If we want unsigned, and this mode has a distinct unsigned
3975 comparison routine, use that. */
3976 if (unsignedp)
3978 rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3979 if (ulibfunc)
3980 libfunc = ulibfunc;
3983 ret_mode = targetm.libgcc_cmp_return_mode ();
3984 result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3985 ret_mode, x, mode, y, mode);
3987 /* There are two kinds of comparison routines. Biased routines
3988 return 0/1/2, and unbiased routines return -1/0/1. Other parts
3989 of gcc expect that the comparison operation is equivalent
3990 to the modified comparison. For signed comparisons compare the
3991 result against 1 in the biased case, and zero in the unbiased
3992 case. For unsigned comparisons always compare against 1 after
3993 biasing the unbiased result by adding 1. This gives us a way to
3994 represent LTU.
3995 The comparisons in the fixed-point helper library are always
3996 biased. */
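/* For example, to test X LTU Y with an unbiased helper whose result R
   is in {-1, 0, 1} (R == -1 iff X < Y): R + 1 is in {0, 1, 2}, and
   (R + 1) LTU 1 holds exactly when R == -1. A biased helper already
   returns {0, 1, 2} and is compared against 1 directly. */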
3997 x = result;
3998 y = const1_rtx;
4000 if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4002 if (unsignedp)
4003 x = plus_constant (ret_mode, result, 1);
4004 else
4005 y = const0_rtx;
4008 *pmode = ret_mode;
4009 prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4010 ptest, pmode);
4013 return;
4015 fail:
4016 *ptest = NULL_RTX;
4019 /* Before emitting an insn with code ICODE, make sure that X, which is going
4020 to be used for operand OPNUM of the insn, is converted from mode MODE to
4021 WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4022 that it is accepted by the operand predicate. Return the new value. */
4025 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4026 machine_mode wider_mode, int unsignedp)
4028 if (mode != wider_mode)
4029 x = convert_modes (wider_mode, mode, x, unsignedp);
4031 if (!insn_operand_matches (icode, opnum, x))
4033 machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4034 if (reload_completed)
4035 return NULL_RTX;
4036 if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4037 return NULL_RTX;
4038 x = copy_to_mode_reg (op_mode, x);
4041 return x;
4044 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4045 we can do the branch. */
4047 static void
4048 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4049 profile_probability prob)
4051 machine_mode optab_mode;
4052 enum mode_class mclass;
4053 enum insn_code icode;
4054 rtx_insn *insn;
4056 mclass = GET_MODE_CLASS (mode);
4057 optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4058 icode = optab_handler (cbranch_optab, optab_mode);
4060 gcc_assert (icode != CODE_FOR_nothing);
4061 gcc_assert (insn_operand_matches (icode, 0, test));
4062 insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4063 XEXP (test, 1), label));
4064 if (prob.initialized_p ()
4065 && profile_status_for_fn (cfun) != PROFILE_ABSENT
4066 && insn
4067 && JUMP_P (insn)
4068 && any_condjump_p (insn)
4069 && !find_reg_note (insn, REG_BR_PROB, 0))
4070 add_reg_br_prob_note (insn, prob);
4073 /* Generate code to compare X with Y so that the condition codes are
4074 set and to jump to LABEL if the condition is true. If X is a
4075 constant and Y is not a constant, then the comparison is swapped to
4076 ensure that the comparison RTL has the canonical form.
4078 UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4079 need to be widened. UNSIGNEDP is also used to select the proper
4080 branch condition code.
4082 If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4084 MODE is the mode of the inputs (in case they are const_int).
4086 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4087 It will be potentially converted into an unsigned variant based on
4088 UNSIGNEDP to select a proper jump instruction.
4090 PROB is the probability of jumping to LABEL. */
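/* A minimal usage sketch (operands are hypothetical): to branch to
   LABEL when pseudo REG0 is unsigned-less-than REG1 in SImode:

       emit_cmp_and_jump_insns (reg0, reg1, LT, NULL_RTX, SImode,
                                1, label, profile_probability::even ());

   With UNSIGNEDP == 1 the LT is turned into LTU before emitting. */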
4092 void
4093 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4094 machine_mode mode, int unsignedp, rtx label,
4095 profile_probability prob)
4097 rtx op0 = x, op1 = y;
4098 rtx test;
4100 /* Swap operands and condition to ensure canonical RTL. */
4101 if (swap_commutative_operands_p (x, y)
4102 && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4104 op0 = y, op1 = x;
4105 comparison = swap_condition (comparison);
4108 /* If OP0 is still a constant, then both X and Y must be constants
4109 or the opposite comparison is not supported. Force X into a register
4110 to create canonical RTL. */
4111 if (CONSTANT_P (op0))
4112 op0 = force_reg (mode, op0);
4114 if (unsignedp)
4115 comparison = unsigned_condition (comparison);
4117 prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4118 &test, &mode);
4119 emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4123 /* Emit a library call comparison between floating point X and Y.
4124 COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.). */
4126 static void
4127 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4128 rtx *ptest, machine_mode *pmode)
4130 enum rtx_code swapped = swap_condition (comparison);
4131 enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4132 machine_mode orig_mode = GET_MODE (x);
4133 machine_mode mode;
4134 rtx true_rtx, false_rtx;
4135 rtx value, target, equiv;
4136 rtx_insn *insns;
4137 rtx libfunc = 0;
4138 bool reversed_p = false;
4139 scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4141 FOR_EACH_MODE_FROM (mode, orig_mode)
4143 if (code_to_optab (comparison)
4144 && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4145 break;
4147 if (code_to_optab (swapped)
4148 && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4150 std::swap (x, y);
4151 comparison = swapped;
4152 break;
4155 if (code_to_optab (reversed)
4156 && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4158 comparison = reversed;
4159 reversed_p = true;
4160 break;
4164 gcc_assert (mode != VOIDmode);
4166 if (mode != orig_mode)
4168 x = convert_to_mode (mode, x, 0);
4169 y = convert_to_mode (mode, y, 0);
4172 /* Attach a REG_EQUAL note describing the semantics of the libcall to
4173 the RTL. This allows the RTL optimizers to delete the libcall if the
4174 condition can be determined at compile-time. */
4175 if (comparison == UNORDERED
4176 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4178 true_rtx = const_true_rtx;
4179 false_rtx = const0_rtx;
4181 else
4183 switch (comparison)
4185 case EQ:
4186 true_rtx = const0_rtx;
4187 false_rtx = const_true_rtx;
4188 break;
4190 case NE:
4191 true_rtx = const_true_rtx;
4192 false_rtx = const0_rtx;
4193 break;
4195 case GT:
4196 true_rtx = const1_rtx;
4197 false_rtx = const0_rtx;
4198 break;
4200 case GE:
4201 true_rtx = const0_rtx;
4202 false_rtx = constm1_rtx;
4203 break;
4205 case LT:
4206 true_rtx = constm1_rtx;
4207 false_rtx = const0_rtx;
4208 break;
4210 case LE:
4211 true_rtx = const0_rtx;
4212 false_rtx = const1_rtx;
4213 break;
4215 default:
4216 gcc_unreachable ();
4220 if (comparison == UNORDERED)
4222 rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4223 equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4224 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4225 temp, const_true_rtx, equiv);
4227 else
4229 equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4230 if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4231 equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4232 equiv, true_rtx, false_rtx);
4235 start_sequence ();
4236 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4237 cmp_mode, x, mode, y, mode);
4238 insns = get_insns ();
4239 end_sequence ();
4241 target = gen_reg_rtx (cmp_mode);
4242 emit_libcall_block (insns, target, value, equiv);
4244 if (comparison == UNORDERED
4245 || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4246 || reversed_p)
4247 *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4248 else
4249 *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4251 *pmode = cmp_mode;
4254 /* Generate code to indirectly jump to a location given in the rtx LOC. */
4256 void
4257 emit_indirect_jump (rtx loc)
4259 if (!targetm.have_indirect_jump ())
4260 sorry ("indirect jumps are not available on this target");
4261 else
4263 struct expand_operand ops[1];
4264 create_address_operand (&ops[0], loc);
4265 expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4266 emit_barrier ();
4271 /* Emit a conditional move instruction if the machine supports one for that
4272 condition and machine mode.
4274 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4275 the mode to use should they be constants. If it is VOIDmode, they cannot
4276 both be constants.
4278 OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4279 should be stored there. MODE is the mode to use should they be constants.
4280 If it is VOIDmode, they cannot both be constants.
4282 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4283 is not supported. */
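/* A minimal usage sketch (operands are hypothetical): to compute
   TARGET = (A < B) ? C : D on signed SImode values:

       rtx t = emit_conditional_move (target, LT, a, b, SImode,
                                      c, d, SImode, 0);

   Callers must cope with a NULL_RTX return, falling back to an
   explicit compare-and-branch sequence when no movcc pattern fits. */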
4286 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4287 machine_mode cmode, rtx op2, rtx op3,
4288 machine_mode mode, int unsignedp)
4290 rtx comparison;
4291 rtx_insn *last;
4292 enum insn_code icode;
4293 enum rtx_code reversed;
4295 /* If the two source operands are identical, that's just a move. */
4297 if (rtx_equal_p (op2, op3))
4299 if (!target)
4300 target = gen_reg_rtx (mode);
4302 emit_move_insn (target, op3);
4303 return target;
4306 /* If one operand is constant, make it the second one. Only do this
4307 if the other operand is not constant as well. */
4309 if (swap_commutative_operands_p (op0, op1))
4311 std::swap (op0, op1);
4312 code = swap_condition (code);
4315 /* get_condition will prefer to generate LT and GT even if the old
4316 comparison was against zero, so undo that canonicalization here since
4317 comparisons against zero are cheaper. */
4318 if (code == LT && op1 == const1_rtx)
4319 code = LE, op1 = const0_rtx;
4320 else if (code == GT && op1 == constm1_rtx)
4321 code = GE, op1 = const0_rtx;
4323 if (cmode == VOIDmode)
4324 cmode = GET_MODE (op0);
4326 enum rtx_code orig_code = code;
4327 bool swapped = false;
4328 if (swap_commutative_operands_p (op2, op3)
4329 && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4330 != UNKNOWN))
4332 std::swap (op2, op3);
4333 code = reversed;
4334 swapped = true;
4337 if (mode == VOIDmode)
4338 mode = GET_MODE (op2);
4340 icode = direct_optab_handler (movcc_optab, mode);
4342 if (icode == CODE_FOR_nothing)
4343 return NULL_RTX;
4345 if (!target)
4346 target = gen_reg_rtx (mode);
4348 for (int pass = 0; ; pass++)
4350 code = unsignedp ? unsigned_condition (code) : code;
4351 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4353 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4354 punt and let the caller figure out how best to deal with this
4355 situation. */
4356 if (COMPARISON_P (comparison))
4358 saved_pending_stack_adjust save;
4359 save_pending_stack_adjust (&save);
4360 last = get_last_insn ();
4361 do_pending_stack_adjust ();
4362 machine_mode cmpmode = cmode;
4363 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4364 GET_CODE (comparison), NULL_RTX, unsignedp,
4365 OPTAB_WIDEN, &comparison, &cmpmode);
4366 if (comparison)
4368 struct expand_operand ops[4];
4370 create_output_operand (&ops[0], target, mode);
4371 create_fixed_operand (&ops[1], comparison);
4372 create_input_operand (&ops[2], op2, mode);
4373 create_input_operand (&ops[3], op3, mode);
4374 if (maybe_expand_insn (icode, 4, ops))
4376 if (ops[0].value != target)
4377 convert_move (target, ops[0].value, false);
4378 return target;
4381 delete_insns_since (last);
4382 restore_pending_stack_adjust (&save);
4385 if (pass == 1)
4386 return NULL_RTX;
4388 /* If the preferred op2/op3 order is not usable, retry with the other
4389 operand order; perhaps it will expand successfully. */
4390 if (swapped)
4391 code = orig_code;
4392 else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4393 NULL))
4394 != UNKNOWN)
4395 code = reversed;
4396 else
4397 return NULL_RTX;
4398 std::swap (op2, op3);
4403 /* Emit a conditional negate or bitwise complement using the
4404 negcc or notcc optabs if available. Return NULL_RTX if such operations
4405 are not available. Otherwise return the RTX holding the result.
4406 TARGET is the desired destination of the result. COMP is the comparison
4407 on which to negate. If COND is true move into TARGET the negation
4408 or bitwise complement of OP1. Otherwise move OP2 into TARGET.
4409 CODE is either NEG or NOT. MODE is the machine mode in which the
4410 operation is performed. */
4413 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4414 machine_mode mode, rtx cond, rtx op1,
4415 rtx op2)
4417 optab op = unknown_optab;
4418 if (code == NEG)
4419 op = negcc_optab;
4420 else if (code == NOT)
4421 op = notcc_optab;
4422 else
4423 gcc_unreachable ();
4425 insn_code icode = direct_optab_handler (op, mode);
4427 if (icode == CODE_FOR_nothing)
4428 return NULL_RTX;
4430 if (!target)
4431 target = gen_reg_rtx (mode);
4433 rtx_insn *last = get_last_insn ();
4434 struct expand_operand ops[4];
4436 create_output_operand (&ops[0], target, mode);
4437 create_fixed_operand (&ops[1], cond);
4438 create_input_operand (&ops[2], op1, mode);
4439 create_input_operand (&ops[3], op2, mode);
4441 if (maybe_expand_insn (icode, 4, ops))
4443 if (ops[0].value != target)
4444 convert_move (target, ops[0].value, false);
4446 return target;
4448 delete_insns_since (last);
4449 return NULL_RTX;
4452 /* Emit a conditional addition instruction if the machine supports one for that
4453 condition and machine mode.
4455 OP0 and OP1 are the operands that should be compared using CODE. CMODE is
4456 the mode to use should they be constants. If it is VOIDmode, they cannot
4457 both be constants.
4459 OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4460 should be stored there. MODE is the mode to use should they be constants.
4461 If it is VOIDmode, they cannot both be constants.
4463 The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4464 is not supported. */
4467 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4468 machine_mode cmode, rtx op2, rtx op3,
4469 machine_mode mode, int unsignedp)
4471 rtx comparison;
4472 rtx_insn *last;
4473 enum insn_code icode;
4475 /* If one operand is constant, make it the second one. Only do this
4476 if the other operand is not constant as well. */
4478 if (swap_commutative_operands_p (op0, op1))
4480 std::swap (op0, op1);
4481 code = swap_condition (code);
4484 /* get_condition will prefer to generate LT and GT even if the old
4485 comparison was against zero, so undo that canonicalization here since
4486 comparisons against zero are cheaper. */
4487 if (code == LT && op1 == const1_rtx)
4488 code = LE, op1 = const0_rtx;
4489 else if (code == GT && op1 == constm1_rtx)
4490 code = GE, op1 = const0_rtx;
4492 if (cmode == VOIDmode)
4493 cmode = GET_MODE (op0);
4495 if (mode == VOIDmode)
4496 mode = GET_MODE (op2);
4498 icode = optab_handler (addcc_optab, mode);
4500 if (icode == CODE_FOR_nothing)
4501 return 0;
4503 if (!target)
4504 target = gen_reg_rtx (mode);
4506 code = unsignedp ? unsigned_condition (code) : code;
4507 comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4509 /* We can get const0_rtx or const_true_rtx in some circumstances. Just
4510 return NULL and let the caller figure out how best to deal with this
4511 situation. */
4512 if (!COMPARISON_P (comparison))
4513 return NULL_RTX;
4515 do_pending_stack_adjust ();
4516 last = get_last_insn ();
4517 prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4518 GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4519 &comparison, &cmode);
4520 if (comparison)
4522 struct expand_operand ops[4];
4524 create_output_operand (&ops[0], target, mode);
4525 create_fixed_operand (&ops[1], comparison);
4526 create_input_operand (&ops[2], op2, mode);
4527 create_input_operand (&ops[3], op3, mode);
4528 if (maybe_expand_insn (icode, 4, ops))
4530 if (ops[0].value != target)
4531 convert_move (target, ops[0].value, false);
4532 return target;
4535 delete_insns_since (last);
4536 return NULL_RTX;
4539 /* These functions attempt to generate an insn body, rather than
4540 emitting the insn, but if the gen function already emits them, we
4541 make no attempt to turn them back into naked patterns. */
4543 /* Generate and return an insn body to add Y to X. */
4545 rtx_insn *
4546 gen_add2_insn (rtx x, rtx y)
4548 enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4550 gcc_assert (insn_operand_matches (icode, 0, x));
4551 gcc_assert (insn_operand_matches (icode, 1, x));
4552 gcc_assert (insn_operand_matches (icode, 2, y));
4554 return GEN_FCN (icode) (x, x, y);
4557 /* Generate and return an insn body to add r1 and c,
4558 storing the result in r0. */
4560 rtx_insn *
4561 gen_add3_insn (rtx r0, rtx r1, rtx c)
4563 enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4565 if (icode == CODE_FOR_nothing
4566 || !insn_operand_matches (icode, 0, r0)
4567 || !insn_operand_matches (icode, 1, r1)
4568 || !insn_operand_matches (icode, 2, c))
4569 return NULL;
4571 return GEN_FCN (icode) (r0, r1, c);
4575 have_add2_insn (rtx x, rtx y)
4577 enum insn_code icode;
4579 gcc_assert (GET_MODE (x) != VOIDmode);
4581 icode = optab_handler (add_optab, GET_MODE (x));
4583 if (icode == CODE_FOR_nothing)
4584 return 0;
4586 if (!insn_operand_matches (icode, 0, x)
4587 || !insn_operand_matches (icode, 1, x)
4588 || !insn_operand_matches (icode, 2, y))
4589 return 0;
4591 return 1;
4594 /* Generate and return an insn body to add Y and Z, storing the result in X. */
4596 rtx_insn *
4597 gen_addptr3_insn (rtx x, rtx y, rtx z)
4599 enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4601 gcc_assert (insn_operand_matches (icode, 0, x));
4602 gcc_assert (insn_operand_matches (icode, 1, y));
4603 gcc_assert (insn_operand_matches (icode, 2, z));
4605 return GEN_FCN (icode) (x, y, z);
4608 /* Return true if the target implements an addptr pattern and X, Y,
4609 and Z are valid for the pattern predicates. */
4612 have_addptr3_insn (rtx x, rtx y, rtx z)
4614 enum insn_code icode;
4616 gcc_assert (GET_MODE (x) != VOIDmode);
4618 icode = optab_handler (addptr3_optab, GET_MODE (x));
4620 if (icode == CODE_FOR_nothing)
4621 return 0;
4623 if (!insn_operand_matches (icode, 0, x)
4624 || !insn_operand_matches (icode, 1, y)
4625 || !insn_operand_matches (icode, 2, z))
4626 return 0;
4628 return 1;
4631 /* Generate and return an insn body to subtract Y from X. */
4633 rtx_insn *
4634 gen_sub2_insn (rtx x, rtx y)
4636 enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4638 gcc_assert (insn_operand_matches (icode, 0, x));
4639 gcc_assert (insn_operand_matches (icode, 1, x));
4640 gcc_assert (insn_operand_matches (icode, 2, y));
4642 return GEN_FCN (icode) (x, x, y);
4645 /* Generate and return an insn body to subtract c from r1,
4646 storing the result in r0. */
4648 rtx_insn *
4649 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4651 enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4653 if (icode == CODE_FOR_nothing
4654 || !insn_operand_matches (icode, 0, r0)
4655 || !insn_operand_matches (icode, 1, r1)
4656 || !insn_operand_matches (icode, 2, c))
4657 return NULL;
4659 return GEN_FCN (icode) (r0, r1, c);
4663 have_sub2_insn (rtx x, rtx y)
4665 enum insn_code icode;
4667 gcc_assert (GET_MODE (x) != VOIDmode);
4669 icode = optab_handler (sub_optab, GET_MODE (x));
4671 if (icode == CODE_FOR_nothing)
4672 return 0;
4674 if (!insn_operand_matches (icode, 0, x)
4675 || !insn_operand_matches (icode, 1, x)
4676 || !insn_operand_matches (icode, 2, y))
4677 return 0;
4679 return 1;
4682 /* Generate the body of an insn to extend Y (with mode MFROM)
4683 into X (with mode MTO). Do zero-extension if UNSIGNEDP is nonzero. */
4685 rtx_insn *
4686 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4687 machine_mode mfrom, int unsignedp)
4689 enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4690 return GEN_FCN (icode) (x, y);
4693 /* Generate code to convert FROM to floating point
4694 and store in TO. FROM must be fixed point and not VOIDmode.
4695 UNSIGNEDP nonzero means regard FROM as unsigned.
4696 Normally this is done by correcting the final value
4697 if it is negative. */
4699 void
4700 expand_float (rtx to, rtx from, int unsignedp)
4702 enum insn_code icode;
4703 rtx target = to;
4704 scalar_mode from_mode, to_mode;
4705 machine_mode fmode, imode;
4706 bool can_do_signed = false;
4708 /* Crash now, because we won't be able to decide which mode to use. */
4709 gcc_assert (GET_MODE (from) != VOIDmode);
4711 /* Look for an insn to do the conversion. Do it in the specified
4712 modes if possible; otherwise convert either input, output or both to
4713 wider mode. If the integer mode is wider than the mode of FROM,
4714 we can do the conversion signed even if the input is unsigned. */
4716 FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4717 FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4719 int doing_unsigned = unsignedp;
4721 if (fmode != GET_MODE (to)
4722 && (significand_size (fmode)
4723 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
4724 continue;
4726 icode = can_float_p (fmode, imode, unsignedp);
4727 if (icode == CODE_FOR_nothing && unsignedp)
4729 enum insn_code scode = can_float_p (fmode, imode, 0);
4730 if (scode != CODE_FOR_nothing)
4731 can_do_signed = true;
4732 if (imode != GET_MODE (from))
4733 icode = scode, doing_unsigned = 0;
4736 if (icode != CODE_FOR_nothing)
4738 if (imode != GET_MODE (from))
4739 from = convert_to_mode (imode, from, unsignedp);
4741 if (fmode != GET_MODE (to))
4742 target = gen_reg_rtx (fmode);
4744 emit_unop_insn (icode, target, from,
4745 doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4747 if (target != to)
4748 convert_move (to, target, 0);
4749 return;
4753 /* Unsigned integer, and no way to convert directly. Convert as signed,
4754 then unconditionally adjust the result. */
4755 if (unsignedp
4756 && can_do_signed
4757 && is_a <scalar_mode> (GET_MODE (to), &to_mode)
4758 && is_a <scalar_mode> (GET_MODE (from), &from_mode))
4760 opt_scalar_mode fmode_iter;
4761 rtx_code_label *label = gen_label_rtx ();
4762 rtx temp;
4763 REAL_VALUE_TYPE offset;
4765 /* Look for a usable floating mode FMODE wider than the source and at
4766 least as wide as the target. Using FMODE will avoid rounding woes
4767 with unsigned values greater than the signed maximum value. */
4769 FOR_EACH_MODE_FROM (fmode_iter, to_mode)
4771 scalar_mode fmode = fmode_iter.require ();
4772 if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
4773 && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
4774 break;
4777 if (!fmode_iter.exists (&fmode))
4779 /* There is no such mode. Pretend the target is wide enough. */
4780 fmode = to_mode;
4782 /* Avoid double-rounding when TO is narrower than FROM. */
4783 if ((significand_size (fmode) + 1)
4784 < GET_MODE_PRECISION (from_mode))
4786 rtx temp1;
4787 rtx_code_label *neglabel = gen_label_rtx ();
4789 /* Don't use TARGET if it isn't a register, is a hard register,
4790 or is the wrong mode. */
4791 if (!REG_P (target)
4792 || REGNO (target) < FIRST_PSEUDO_REGISTER
4793 || GET_MODE (target) != fmode)
4794 target = gen_reg_rtx (fmode);
4796 imode = from_mode;
4797 do_pending_stack_adjust ();
4799 /* Test whether the sign bit is set. */
4800 emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4801 0, neglabel);
4803 /* The sign bit is not set. Convert as signed. */
4804 expand_float (target, from, 0);
4805 emit_jump_insn (targetm.gen_jump (label));
4806 emit_barrier ();
4808 /* The sign bit is set.
4809 Convert to a usable (positive signed) value by shifting right
4810 one bit, while remembering if a nonzero bit was shifted
4811 out; i.e., compute (from & 1) | (from >> 1). */
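/* A rough scalar model of this path for 64-bit FROM (illustrative
   names, not actual variables):

       uint64_t u = ...;                    sign bit is known to be set
       uint64_t half = (u & 1) | (u >> 1);  halve, keeping the low bit
       double d = (double) (int64_t) half;  signed conversion is now safe
       d = d + d;                           undo the halving

   OR-ing in the shifted-out bit keeps the final rounding correct. */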
4813 emit_label (neglabel);
4814 temp = expand_binop (imode, and_optab, from, const1_rtx,
4815 NULL_RTX, 1, OPTAB_LIB_WIDEN);
4816 temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4817 temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4818 OPTAB_LIB_WIDEN);
4819 expand_float (target, temp, 0);
4821 /* Multiply by 2 to undo the shift above. */
4822 temp = expand_binop (fmode, add_optab, target, target,
4823 target, 0, OPTAB_LIB_WIDEN);
4824 if (temp != target)
4825 emit_move_insn (target, temp);
4827 do_pending_stack_adjust ();
4828 emit_label (label);
4829 goto done;
4833 /* If we are about to do some arithmetic to correct for an
4834 unsigned operand, do it in a pseudo-register. */
4836 if (to_mode != fmode
4837 || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4838 target = gen_reg_rtx (fmode);
4840 /* Convert as signed integer to floating. */
4841 expand_float (target, from, 0);
4843 /* If FROM is negative (and therefore TO is negative),
4844 correct its value by 2**bitwidth. */
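/* E.g. for 32-bit FROM, the unsigned value 4294967295 converts as
   signed to -1.0; adding 2**32 yields the correct 4294967295.0. */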
4846 do_pending_stack_adjust ();
4847 emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
4848 0, label);
4851 real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
4852 temp = expand_binop (fmode, add_optab, target,
4853 const_double_from_real_value (offset, fmode),
4854 target, 0, OPTAB_LIB_WIDEN);
4855 if (temp != target)
4856 emit_move_insn (target, temp);
4858 do_pending_stack_adjust ();
4859 emit_label (label);
4860 goto done;
4863 /* No hardware instruction available; call a library routine. */
4865 rtx libfunc;
4866 rtx_insn *insns;
4867 rtx value;
4868 convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4870 if (is_narrower_int_mode (GET_MODE (from), SImode))
4871 from = convert_to_mode (SImode, from, unsignedp);
4873 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4874 gcc_assert (libfunc);
4876 start_sequence ();
4878 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4879 GET_MODE (to), from, GET_MODE (from));
4880 insns = get_insns ();
4881 end_sequence ();
4883 emit_libcall_block (insns, target, value,
4884 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4885 GET_MODE (to), from));
4888 done:
4890 /* Copy result to requested destination
4891 if we have been computing in a temp location. */
4893 if (target != to)
4895 if (GET_MODE (target) == GET_MODE (to))
4896 emit_move_insn (to, target);
4897 else
4898 convert_move (to, target, 0);
4902 /* Generate code to convert FROM to fixed point and store in TO. FROM
4903 must be floating point. */
4905 void
4906 expand_fix (rtx to, rtx from, int unsignedp)
4908 enum insn_code icode;
4909 rtx target = to;
4910 machine_mode fmode, imode;
4911 opt_scalar_mode fmode_iter;
4912 bool must_trunc = false;
4914 /* We first try to find a pair of modes, one real and one integer, at
4915 least as wide as FROM and TO, respectively, in which we can open-code
4916 this conversion. If the integer mode is wider than the mode of TO,
4917 we can do the conversion either signed or unsigned. */
4919 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4920 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4922 int doing_unsigned = unsignedp;
4924 icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4925 if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4926 icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4928 if (icode != CODE_FOR_nothing)
4930 rtx_insn *last = get_last_insn ();
4931 if (fmode != GET_MODE (from))
4932 from = convert_to_mode (fmode, from, 0);
4934 if (must_trunc)
4936 rtx temp = gen_reg_rtx (GET_MODE (from));
4937 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4938 temp, 0);
4941 if (imode != GET_MODE (to))
4942 target = gen_reg_rtx (imode);
4944 if (maybe_emit_unop_insn (icode, target, from,
4945 doing_unsigned ? UNSIGNED_FIX : FIX))
4947 if (target != to)
4948 convert_move (to, target, unsignedp);
4949 return;
4951 delete_insns_since (last);
4955 /* For an unsigned conversion, there is one more way to do it.
4956 If we have a signed conversion, we generate code that compares
4957 the real value to the largest representable positive number. If it
4958 is smaller, the conversion is done normally. Otherwise, subtract
4959 one plus the highest signed number, convert, and add it back.
4961 We only need to check all real modes, since we know we didn't find
4962 anything with a wider integer mode.
4964 This code used to extend the FP value into a mode wider than the destination.
4965 This is needed for decimal float modes which cannot accurately
4966 represent one plus the highest signed number of the same size, but
4967 not for binary modes. Consider, for instance, conversion from SFmode
4968 into DImode.
4970 The hot path through the code is dealing with inputs smaller than 2^63
4971 and doing just the conversion, so there are no bits to lose.
4973 In the other path we know the value is positive in the range 2^63..2^64-1
4974 inclusive (for any other input, overflow happens and the result is undefined).
4975 So we know that the most significant bit set in the mantissa corresponds to
4976 2^63. The subtraction of 2^63 should not generate any rounding as it
4977 simply clears out that bit. The rest is trivial. */
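/* A scalar model of a DFmode to 64-bit conversion (illustrative only):

       if (x < 9223372036854775808.0)              x below 2^63
         result = (uint64_t) (int64_t) x;          plain signed fix
       else
         result = (uint64_t) (int64_t) (x - 9223372036854775808.0)
                  ^ (1ULL << 63);                  re-add 2^63 via XOR

   The XOR restores the high bit without any signed overflow. */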
4979 scalar_int_mode to_mode;
4980 if (unsignedp
4981 && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
4982 && HWI_COMPUTABLE_MODE_P (to_mode))
4983 FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
4985 scalar_mode fmode = fmode_iter.require ();
4986 if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
4987 0, &must_trunc)
4988 && (!DECIMAL_FLOAT_MODE_P (fmode)
4989 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
4991 int bitsize;
4992 REAL_VALUE_TYPE offset;
4993 rtx limit;
4994 rtx_code_label *lab1, *lab2;
4995 rtx_insn *insn;
4997 bitsize = GET_MODE_PRECISION (to_mode);
4998 real_2expN (&offset, bitsize - 1, fmode);
4999 limit = const_double_from_real_value (offset, fmode);
5000 lab1 = gen_label_rtx ();
5001 lab2 = gen_label_rtx ();
5003 if (fmode != GET_MODE (from))
5004 from = convert_to_mode (fmode, from, 0);
5006 /* See if we need to do the subtraction. */
5007 do_pending_stack_adjust ();
5008 emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
5009 GET_MODE (from), 0, lab1);
5011 /* If not, do the signed "fix" and branch around fixup code. */
5012 expand_fix (to, from, 0);
5013 emit_jump_insn (targetm.gen_jump (lab2));
5014 emit_barrier ();
5016 /* Otherwise, subtract 2**(N-1), convert to signed number,
5017 then add 2**(N-1). Do the addition using XOR since this
5018 will often generate better code. */
5019 emit_label (lab1);
5020 target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5021 NULL_RTX, 0, OPTAB_LIB_WIDEN);
5022 expand_fix (to, target, 0);
5023 target = expand_binop (to_mode, xor_optab, to,
5024 gen_int_mode
5025 (HOST_WIDE_INT_1 << (bitsize - 1),
5026 to_mode),
5027 to, 1, OPTAB_LIB_WIDEN);
5029 if (target != to)
5030 emit_move_insn (to, target);
5032 emit_label (lab2);
5034 if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5036 /* Make a place for a REG_NOTE and add it. */
5037 insn = emit_move_insn (to, to);
5038 set_dst_reg_note (insn, REG_EQUAL,
5039 gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5040 copy_rtx (from)),
5041 to);
5044 return;
5048 /* We can't do it with an insn, so use a library call. But first ensure
5049 that the mode of TO is at least as wide as SImode, since those are the
5050 only library calls we know about. */
5052 if (is_narrower_int_mode (GET_MODE (to), SImode))
5054 target = gen_reg_rtx (SImode);
5056 expand_fix (target, from, unsignedp);
5058 else
5060 rtx_insn *insns;
5061 rtx value;
5062 rtx libfunc;
5064 convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5065 libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5066 gcc_assert (libfunc);
5068 start_sequence ();
5070 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5071 GET_MODE (to), from, GET_MODE (from));
5072 insns = get_insns ();
5073 end_sequence ();
5075 emit_libcall_block (insns, target, value,
5076 gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5077 GET_MODE (to), from));
5080 if (target != to)
5082 if (GET_MODE (to) == GET_MODE (target))
5083 emit_move_insn (to, target);
5084 else
5085 convert_move (to, target, 0);
5090 /* Promote integer arguments for a libcall if necessary.
5091 emit_library_call_value cannot do the promotion because it does not
5092 know if it should do a signed or unsigned promotion. This is because
5093 there are no tree types defined for libcalls. */
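/* E.g. on a target whose promote_function_mode widens HImode to SImode,
   an HImode ARG is extended here - zero-extended when UINTP is nonzero,
   sign-extended otherwise - before the libcall is emitted. */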
5095 static rtx
5096 prepare_libcall_arg (rtx arg, int uintp)
5098 scalar_int_mode mode;
5099 machine_mode arg_mode;
5100 if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5102 /* If we need to promote the integer function argument we need to do
5103 it here instead of inside emit_library_call_value because in
5104 emit_library_call_value we don't know if we should do a signed or
5105 unsigned promotion. */
5107 int unsigned_p = 0;
5108 arg_mode = promote_function_mode (NULL_TREE, mode,
5109 &unsigned_p, NULL_TREE, 0);
5110 if (arg_mode != mode)
5111 return convert_to_mode (arg_mode, arg, uintp);
5113 return arg;
5116 /* Generate code to convert to or from a fixed-point value and store
5117 the result in TO. If UINTP is true, the integer operand (TO or FROM)
5118 is an unsigned integer. If SATP is true, we need to saturate the result. */
5120 void
5121 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5123 machine_mode to_mode = GET_MODE (to);
5124 machine_mode from_mode = GET_MODE (from);
5125 convert_optab tab;
5126 enum rtx_code this_code;
5127 enum insn_code code;
5128 rtx_insn *insns;
5129 rtx value;
5130 rtx libfunc;
5132 if (to_mode == from_mode)
5134 emit_move_insn (to, from);
5135 return;
5138 if (uintp)
5140 tab = satp ? satfractuns_optab : fractuns_optab;
5141 this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5143 else
5145 tab = satp ? satfract_optab : fract_optab;
5146 this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5148 code = convert_optab_handler (tab, to_mode, from_mode);
5149 if (code != CODE_FOR_nothing)
5151 emit_unop_insn (code, to, from, this_code);
5152 return;
5155 libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5156 gcc_assert (libfunc);
5158 from = prepare_libcall_arg (from, uintp);
5159 from_mode = GET_MODE (from);
5161 start_sequence ();
5162 value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5163 from, from_mode);
5164 insns = get_insns ();
5165 end_sequence ();
5167 emit_libcall_block (insns, to, value,
5168 gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5171 /* Generate code to convert FROM to fixed point and store in TO. FROM
5172 must be floating point, TO must be signed. Use the conversion optab
5173 TAB to do the conversion. */
5175 bool
5176 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5178 enum insn_code icode;
5179 rtx target = to;
5180 machine_mode fmode, imode;
5182 /* We first try to find a pair of modes, one real and one integer, at
5183 least as wide as FROM and TO, respectively, in which we can open-code
5184 this conversion. If the integer mode is wider than the mode of TO,
5185 we can do the conversion either signed or unsigned. */
5187 FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5188 FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5190 icode = convert_optab_handler (tab, imode, fmode);
5191 if (icode != CODE_FOR_nothing)
5193 rtx_insn *last = get_last_insn ();
5194 if (fmode != GET_MODE (from))
5195 from = convert_to_mode (fmode, from, 0);
5197 if (imode != GET_MODE (to))
5198 target = gen_reg_rtx (imode);
5200 if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5202 delete_insns_since (last);
5203 continue;
5205 if (target != to)
5206 convert_move (to, target, 0);
5207 return true;
5211 return false;
5214 /* Report whether we have an instruction to perform the operation
5215 specified by CODE on operands of mode MODE. */
5217 have_insn_for (enum rtx_code code, machine_mode mode)
5219 return (code_to_optab (code)
5220 && (optab_handler (code_to_optab (code), mode)
5221 != CODE_FOR_nothing));
5224 /* Print information about the current contents of the optabs on
5225 STDERR. */
5227 DEBUG_FUNCTION void
5228 debug_optab_libfuncs (void)
5230 int i, j, k;
5232 /* Dump the arithmetic optabs. */
5233 for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5234 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5236 rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5237 if (l)
5239 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5240 fprintf (stderr, "%s\t%s:\t%s\n",
5241 GET_RTX_NAME (optab_to_code ((optab) i)),
5242 GET_MODE_NAME (j),
5243 XSTR (l, 0));
5247 /* Dump the conversion optabs. */
5248 for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5249 for (j = 0; j < NUM_MACHINE_MODES; ++j)
5250 for (k = 0; k < NUM_MACHINE_MODES; ++k)
5252 rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5253 (machine_mode) k);
5254 if (l)
5256 gcc_assert (GET_CODE (l) == SYMBOL_REF);
5257 fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5258 GET_RTX_NAME (optab_to_code ((optab) i)),
5259 GET_MODE_NAME (j),
5260 GET_MODE_NAME (k),
5261 XSTR (l, 0));
5266 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5267 CODE. Return 0 on failure. */
5269 rtx_insn *
5270 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5272 machine_mode mode = GET_MODE (op1);
5273 enum insn_code icode;
5274 rtx_insn *insn;
5275 rtx trap_rtx;
5277 if (mode == VOIDmode)
5278 return 0;
5280 icode = optab_handler (ctrap_optab, mode);
5281 if (icode == CODE_FOR_nothing)
5282 return 0;
5284 /* Some targets only accept a zero trap code. */
5285 if (!insn_operand_matches (icode, 3, tcode))
5286 return 0;
5288 do_pending_stack_adjust ();
5289 start_sequence ();
5290 prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5291 &trap_rtx, &mode);
5292 if (!trap_rtx)
5293 insn = NULL;
5294 else
5295 insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5296 tcode);
5298 /* If that failed, then give up. */
5299 if (insn == 0)
5301 end_sequence ();
5302 return 0;
5305 emit_insn (insn);
5306 insn = get_insns ();
5307 end_sequence ();
5308 return insn;
5311 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5312 or unsigned operation code. */
5314 enum rtx_code
5315 get_rtx_code (enum tree_code tcode, bool unsignedp)
5317 enum rtx_code code;
5318 switch (tcode)
5320 case EQ_EXPR:
5321 code = EQ;
5322 break;
5323 case NE_EXPR:
5324 code = NE;
5325 break;
5326 case LT_EXPR:
5327 code = unsignedp ? LTU : LT;
5328 break;
5329 case LE_EXPR:
5330 code = unsignedp ? LEU : LE;
5331 break;
5332 case GT_EXPR:
5333 code = unsignedp ? GTU : GT;
5334 break;
5335 case GE_EXPR:
5336 code = unsignedp ? GEU : GE;
5337 break;
5339 case UNORDERED_EXPR:
5340 code = UNORDERED;
5341 break;
5342 case ORDERED_EXPR:
5343 code = ORDERED;
5344 break;
5345 case UNLT_EXPR:
5346 code = UNLT;
5347 break;
5348 case UNLE_EXPR:
5349 code = UNLE;
5350 break;
5351 case UNGT_EXPR:
5352 code = UNGT;
5353 break;
5354 case UNGE_EXPR:
5355 code = UNGE;
5356 break;
5357 case UNEQ_EXPR:
5358 code = UNEQ;
5359 break;
5360 case LTGT_EXPR:
5361 code = LTGT;
5362 break;
5364 case BIT_AND_EXPR:
5365 code = AND;
5366 break;
5368 case BIT_IOR_EXPR:
5369 code = IOR;
5370 break;
5372 default:
5373 gcc_unreachable ();
5375 return code;
5378 /* Return a comparison rtx of mode CMP_MODE comparing T_OP0 and T_OP1
5379 with tree code TCODE. Use UNSIGNEDP to select signed or unsigned
5380 operators. OPNO holds the index of the first comparison operand
5381 for insn ICODE. Do not generate the compare instruction itself. */
5383 static rtx
5384 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5385 tree t_op0, tree t_op1, bool unsignedp,
5386 enum insn_code icode, unsigned int opno)
5388 struct expand_operand ops[2];
5389 rtx rtx_op0, rtx_op1;
5390 machine_mode m0, m1;
5391 enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5393 gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5395 /* Expand operands. For vector types with scalar modes, e.g. where int64x1_t
5396 has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5397 cases, use the original mode. */
5398 rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5399 EXPAND_STACK_PARM);
5400 m0 = GET_MODE (rtx_op0);
5401 if (m0 == VOIDmode)
5402 m0 = TYPE_MODE (TREE_TYPE (t_op0));
5404 rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5405 EXPAND_STACK_PARM);
5406 m1 = GET_MODE (rtx_op1);
5407 if (m1 == VOIDmode)
5408 m1 = TYPE_MODE (TREE_TYPE (t_op1));
5410 create_input_operand (&ops[0], rtx_op0, m0);
5411 create_input_operand (&ops[1], rtx_op1, m1);
5412 if (!maybe_legitimize_operands (icode, opno, 2, ops))
5413 gcc_unreachable ();
5414 return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5417 /* Check if vec_perm mask SEL is a constant equivalent to a shift of
5418 the first vec_perm operand, assuming the second operand is a constant
5419 vector of zeros. Return the shift distance in bits if so, or NULL_RTX
5420 if the vec_perm is not a shift. MODE is the mode of the value being
5421 shifted. */
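/* For example, on a 4-element vector the selector {1, 2, 3, 4} with a
   zero second operand reads element I + 1 for each I, the out-of-range
   index 4 reading a zero from the second operand; that is a shift by
   one element, i.e. by GET_MODE_UNIT_BITSIZE (MODE) bits. */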
5422 static rtx
5423 shift_amt_for_vec_perm_mask (machine_mode mode, const vec_perm_indices &sel)
5425 unsigned int bitsize = GET_MODE_UNIT_BITSIZE (mode);
5426 poly_int64 first = sel[0];
5427 if (maybe_ge (sel[0], GET_MODE_NUNITS (mode)))
5428 return NULL_RTX;
5430 if (!sel.series_p (0, 1, first, 1))
5432 unsigned int nelt;
5433 if (!GET_MODE_NUNITS (mode).is_constant (&nelt))
5434 return NULL_RTX;
5435 for (unsigned int i = 1; i < nelt; i++)
5437 poly_int64 expected = i + first;
5438 /* Indices into the second vector are all equivalent. */
5439 if (maybe_lt (sel[i], nelt)
5440 ? maybe_ne (sel[i], expected)
5441 : maybe_lt (expected, nelt))
5442 return NULL_RTX;
5446 return gen_int_shift_amount (mode, first * bitsize);
5449 /* A subroutine of expand_vec_perm_var for expanding one vec_perm insn. */
5451 static rtx
5452 expand_vec_perm_1 (enum insn_code icode, rtx target,
5453 rtx v0, rtx v1, rtx sel)
5455 machine_mode tmode = GET_MODE (target);
5456 machine_mode smode = GET_MODE (sel);
5457 struct expand_operand ops[4];
5459 gcc_assert (GET_MODE_CLASS (smode) == MODE_VECTOR_INT
5460 || mode_for_int_vector (tmode).require () == smode);
5461 create_output_operand (&ops[0], target, tmode);
5462 create_input_operand (&ops[3], sel, smode);
5464 /* Make an effort to preserve v0 == v1. The target expander is able to
5465 rely on this to determine if we're permuting a single input operand. */
5466 if (rtx_equal_p (v0, v1))
5468 if (!insn_operand_matches (icode, 1, v0))
5469 v0 = force_reg (tmode, v0);
5470 gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5471 gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5473 create_fixed_operand (&ops[1], v0);
5474 create_fixed_operand (&ops[2], v0);
5476 else
5478 create_input_operand (&ops[1], v0, tmode);
5479 create_input_operand (&ops[2], v1, tmode);
5482 if (maybe_expand_insn (icode, 4, ops))
5483 return ops[0].value;
5484 return NULL_RTX;
5487 /* Implement a permutation of vectors v0 and v1 using the permutation
5488 vector in SEL and return the result. Use TARGET to hold the result
5489 if nonnull and convenient.
5491 MODE is the mode of the vectors being permuted (V0 and V1). SEL_MODE
5492 is the TYPE_MODE associated with SEL, or BLKmode if SEL isn't known
5493 to have a particular mode. */
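/* A minimal usage sketch (modes and operands are hypothetical): to
   reverse the four elements of a V4SImode vector V:

       vec_perm_builder sel (4, 4, 1);
       for (int i = 0; i < 4; ++i)
         sel.quick_push (3 - i);
       rtx res = expand_vec_perm_const (V4SImode, v, v, sel,
                                        V4SImode, NULL_RTX);

   A NULL_RTX result means no suitable expansion was found. */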
5496 expand_vec_perm_const (machine_mode mode, rtx v0, rtx v1,
5497 const vec_perm_builder &sel, machine_mode sel_mode,
5498 rtx target)
5500 if (!target || !register_operand (target, mode))
5501 target = gen_reg_rtx (mode);
5503 /* Set QIMODE to a different vector mode with byte elements.
5504 If no such mode, or if MODE already has byte elements, use VOIDmode. */
5505 machine_mode qimode;
5506 if (!qimode_for_vec_perm (mode).exists (&qimode))
5507 qimode = VOIDmode;
5509 rtx_insn *last = get_last_insn ();
5511 bool single_arg_p = rtx_equal_p (v0, v1);
5512 /* Always specify two input vectors here and leave the target to handle
5513 cases in which the inputs are equal. Not all backends can cope with
5514 the single-input representation when testing for a double-input
5515 target instruction. */
5516 vec_perm_indices indices (sel, 2, GET_MODE_NUNITS (mode));
5518 /* See if this can be handled with a vec_shr. We only do this if the
5519 second vector is all zeroes. */
5520 insn_code shift_code = optab_handler (vec_shr_optab, mode);
5521 insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5522 ? optab_handler (vec_shr_optab, qimode)
5523 : CODE_FOR_nothing);
5525 if (v1 == CONST0_RTX (GET_MODE (v1))
5526 && (shift_code != CODE_FOR_nothing
5527 || shift_code_qi != CODE_FOR_nothing))
5529 rtx shift_amt = shift_amt_for_vec_perm_mask (mode, indices);
5530 if (shift_amt)
5532 struct expand_operand ops[3];
5533 if (shift_code != CODE_FOR_nothing)
5535 create_output_operand (&ops[0], target, mode);
5536 create_input_operand (&ops[1], v0, mode);
5537 create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5538 if (maybe_expand_insn (shift_code, 3, ops))
5539 return ops[0].value;
5541 if (shift_code_qi != CODE_FOR_nothing)
5543 rtx tmp = gen_reg_rtx (qimode);
5544 create_output_operand (&ops[0], tmp, qimode);
5545 create_input_operand (&ops[1], gen_lowpart (qimode, v0), qimode);
5546 create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
5547 if (maybe_expand_insn (shift_code_qi, 3, ops))
5548 return gen_lowpart (mode, ops[0].value);
5553 if (targetm.vectorize.vec_perm_const != NULL)
5555 v0 = force_reg (mode, v0);
5556 if (single_arg_p)
5557 v1 = v0;
5558 else
5559 v1 = force_reg (mode, v1);
5561 if (targetm.vectorize.vec_perm_const (mode, target, v0, v1, indices))
5562 return target;
5565 /* Fall back to a constant byte-based permutation. */
5566 vec_perm_indices qimode_indices;
5567 rtx target_qi = NULL_RTX, v0_qi = NULL_RTX, v1_qi = NULL_RTX;
5568 if (qimode != VOIDmode)
5570 qimode_indices.new_expanded_vector (indices, GET_MODE_UNIT_SIZE (mode));
5571 target_qi = gen_reg_rtx (qimode);
5572 v0_qi = gen_lowpart (qimode, v0);
5573 v1_qi = gen_lowpart (qimode, v1);
5574 if (targetm.vectorize.vec_perm_const != NULL
5575 && targetm.vectorize.vec_perm_const (qimode, target_qi, v0_qi,
5576 v1_qi, qimode_indices))
5577 return gen_lowpart (mode, target_qi);
5580 /* Otherwise expand as a fully variable permutation. */
5582 /* The optabs are only defined for selectors with the same width
5583 as the values being permuted. */
5584 machine_mode required_sel_mode;
5585 if (!mode_for_int_vector (mode).exists (&required_sel_mode)
5586 || !VECTOR_MODE_P (required_sel_mode))
5588 delete_insns_since (last);
5589 return NULL_RTX;
5592 /* We know that it is semantically valid to treat SEL as having SEL_MODE.
5593 If that isn't the mode we want then we need to prove that using
5594 REQUIRED_SEL_MODE is OK. */
5595 if (sel_mode != required_sel_mode)
5597 if (!selector_fits_mode_p (required_sel_mode, indices))
5599 delete_insns_since (last);
5600 return NULL_RTX;
5602 sel_mode = required_sel_mode;
5605 insn_code icode = direct_optab_handler (vec_perm_optab, mode);
5606 if (icode != CODE_FOR_nothing)
5608 rtx sel_rtx = vec_perm_indices_to_rtx (sel_mode, indices);
5609 rtx tmp = expand_vec_perm_1 (icode, target, v0, v1, sel_rtx);
5610 if (tmp)
5611 return tmp;
5614 if (qimode != VOIDmode
5615 && selector_fits_mode_p (qimode, qimode_indices))
5617 icode = direct_optab_handler (vec_perm_optab, qimode);
5618 if (icode != CODE_FOR_nothing)
5620 rtx sel_qi = vec_perm_indices_to_rtx (qimode, qimode_indices);
5621 rtx tmp = expand_vec_perm_1 (icode, target_qi, v0_qi, v1_qi, sel_qi);
5622 if (tmp)
5623 return gen_lowpart (mode, tmp);
5627 delete_insns_since (last);
5628 return NULL_RTX;
5631 /* Implement a permutation of vectors v0 and v1 using the permutation
5632 vector in SEL and return the result. Use TARGET to hold the result
5633 if nonnull and convenient.
5635 MODE is the mode of the vectors being permuted (V0 and V1).
5636 SEL must have the integer equivalent of MODE and is known to be
5637 unsuitable for permutes with a constant permutation vector. */
5640 expand_vec_perm_var (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5642 enum insn_code icode;
5643 unsigned int i, u;
5644 rtx tmp, sel_qi;
5646 u = GET_MODE_UNIT_SIZE (mode);
5648 if (!target || GET_MODE (target) != mode)
5649 target = gen_reg_rtx (mode);
5651 icode = direct_optab_handler (vec_perm_optab, mode);
5652 if (icode != CODE_FOR_nothing)
5654 tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5655 if (tmp)
5656 return tmp;
5659 /* As a special case to aid several targets, lower the element-based
5660 permutation to a byte-based permutation and try again. */
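	/* (Illustrative example: for u == 4, e.g. V4SImode elements, element
	   index 2 must become the byte indices {8, 9, 10, 11}.  The shift
	   below turns 2 into 8, the constant byte permutation broadcasts that
	   8 into all four byte positions, and the final addition supplies the
	   offsets {0, 1, 2, 3}.)  */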
5661 machine_mode qimode;
5662 if (!qimode_for_vec_perm (mode).exists (&qimode)
5663 || maybe_gt (GET_MODE_NUNITS (qimode), GET_MODE_MASK (QImode) + 1))
5664 return NULL_RTX;
5665 icode = direct_optab_handler (vec_perm_optab, qimode);
5666 if (icode == CODE_FOR_nothing)
5667 return NULL_RTX;
5669 /* Multiply each element by its byte size. */
5670 machine_mode selmode = GET_MODE (sel);
5671 if (u == 2)
5672 sel = expand_simple_binop (selmode, PLUS, sel, sel,
5673 NULL, 0, OPTAB_DIRECT);
5674 else
5675 sel = expand_simple_binop (selmode, ASHIFT, sel,
5676 gen_int_shift_amount (selmode, exact_log2 (u)),
5677 NULL, 0, OPTAB_DIRECT);
5678 gcc_assert (sel != NULL);
5680 /* Broadcast the low byte of each element into each of its bytes.
5681 The encoding has U interleaved stepped patterns, one for each
5682 byte of an element. */
5683 vec_perm_builder const_sel (GET_MODE_SIZE (mode), u, 3);
5684 unsigned int low_byte_in_u = BYTES_BIG_ENDIAN ? u - 1 : 0;
5685 for (i = 0; i < 3; ++i)
5686 for (unsigned int j = 0; j < u; ++j)
5687 const_sel.quick_push (i * u + low_byte_in_u);
5688 sel = gen_lowpart (qimode, sel);
5689 sel = expand_vec_perm_const (qimode, sel, sel, const_sel, qimode, NULL);
5690 gcc_assert (sel != NULL);
5692 /* Add the byte offset to each byte element. */
5693 /* Note that the indices here are defined in terms of memory ordering,
5694 so there should be no difference between big and little endian. */
5695 rtx_vector_builder byte_indices (qimode, u, 1);
5696 for (i = 0; i < u; ++i)
5697 byte_indices.quick_push (GEN_INT (i));
5698 tmp = byte_indices.build ();
5699 sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5700 sel, 0, OPTAB_DIRECT);
5701 gcc_assert (sel_qi != NULL);
5703 tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5704 tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5705 gen_lowpart (qimode, v1), sel_qi);
5706 if (tmp)
5707 tmp = gen_lowpart (mode, tmp);
5708 return tmp;
5711 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5712 three operands. */
5715 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5716 rtx target)
5718 struct expand_operand ops[4];
5719 machine_mode mode = TYPE_MODE (vec_cond_type);
5720 machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5721 enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5722 rtx mask, rtx_op1, rtx_op2;
5724 if (icode == CODE_FOR_nothing)
5725 return 0;
5727 mask = expand_normal (op0);
5728 rtx_op1 = expand_normal (op1);
5729 rtx_op2 = expand_normal (op2);
5731 mask = force_reg (mask_mode, mask);
5732 rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5734 create_output_operand (&ops[0], target, mode);
5735 create_input_operand (&ops[1], rtx_op1, mode);
5736 create_input_operand (&ops[2], rtx_op2, mode);
5737 create_input_operand (&ops[3], mask, mask_mode);
5738 expand_insn (icode, 4, ops);
5740 return ops[0].value;
5743 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5744 three operands. */
5747 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5748 rtx target)
5750 struct expand_operand ops[6];
5751 enum insn_code icode;
5752 rtx comparison, rtx_op1, rtx_op2;
5753 machine_mode mode = TYPE_MODE (vec_cond_type);
5754 machine_mode cmp_op_mode;
5755 bool unsignedp;
5756 tree op0a, op0b;
5757 enum tree_code tcode;
5759 if (COMPARISON_CLASS_P (op0))
5761 op0a = TREE_OPERAND (op0, 0);
5762 op0b = TREE_OPERAND (op0, 1);
5763 tcode = TREE_CODE (op0);
5765 else
5767 gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5768 if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5769 != CODE_FOR_nothing)
5770 return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5771 op2, target);
5772 /* Fake op0 < 0. */
5773 else
5775 gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5776 == MODE_VECTOR_INT);
5777 op0a = op0;
5778 op0b = build_zero_cst (TREE_TYPE (op0));
5779 tcode = LT_EXPR;
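	  /* (Illustrative note: integer vector booleans represent true lanes
	     as -1, so the signed comparison OP0 < 0 tests the sign bit and
	     recovers the mask.)  */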
5782 cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5783 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5786 gcc_assert (known_eq (GET_MODE_SIZE (mode), GET_MODE_SIZE (cmp_op_mode))
5787 && known_eq (GET_MODE_NUNITS (mode),
5788 GET_MODE_NUNITS (cmp_op_mode)));
5790 icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5791 if (icode == CODE_FOR_nothing)
5793 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5794 icode = get_vcond_eq_icode (mode, cmp_op_mode);
5795 if (icode == CODE_FOR_nothing)
5796 return 0;
5799 comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5800 icode, 4);
5801 rtx_op1 = expand_normal (op1);
5802 rtx_op2 = expand_normal (op2);
5804 create_output_operand (&ops[0], target, mode);
5805 create_input_operand (&ops[1], rtx_op1, mode);
5806 create_input_operand (&ops[2], rtx_op2, mode);
5807 create_fixed_operand (&ops[3], comparison);
5808 create_fixed_operand (&ops[4], XEXP (comparison, 0));
5809 create_fixed_operand (&ops[5], XEXP (comparison, 1));
5810 expand_insn (icode, 6, ops);
5811 return ops[0].value;
5814 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
5815 Use TARGET for the result if nonnull and convenient. */
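/* (Illustrative example: VEC_SERIES_EXPR <0, 1> in V4SImode yields the
   vector {0, 1, 2, 3}.)  */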
5818 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
5820 struct expand_operand ops[3];
5821 enum insn_code icode;
5822 machine_mode emode = GET_MODE_INNER (vmode);
5824 icode = direct_optab_handler (vec_series_optab, vmode);
5825 gcc_assert (icode != CODE_FOR_nothing);
5827 create_output_operand (&ops[0], target, vmode);
5828 create_input_operand (&ops[1], op0, emode);
5829 create_input_operand (&ops[2], op1, emode);
5831 expand_insn (icode, 3, ops);
5832 return ops[0].value;
5835 /* Generate insns for a vector comparison into a mask. */
5838 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5840 struct expand_operand ops[4];
5841 enum insn_code icode;
5842 rtx comparison;
5843 machine_mode mask_mode = TYPE_MODE (type);
5844 machine_mode vmode;
5845 bool unsignedp;
5846 tree op0a, op0b;
5847 enum tree_code tcode;
5849 op0a = TREE_OPERAND (exp, 0);
5850 op0b = TREE_OPERAND (exp, 1);
5851 tcode = TREE_CODE (exp);
5853 unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5854 vmode = TYPE_MODE (TREE_TYPE (op0a));
5856 icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5857 if (icode == CODE_FOR_nothing)
5859 if (tcode == EQ_EXPR || tcode == NE_EXPR)
5860 icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5861 if (icode == CODE_FOR_nothing)
5862 return 0;
5865 comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5866 unsignedp, icode, 2);
5867 create_output_operand (&ops[0], target, mask_mode);
5868 create_fixed_operand (&ops[1], comparison);
5869 create_fixed_operand (&ops[2], XEXP (comparison, 0));
5870 create_fixed_operand (&ops[3], XEXP (comparison, 1));
5871 expand_insn (icode, 4, ops);
5872 return ops[0].value;
5875 /* Expand a highpart multiply. */
5878 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5879 rtx target, bool uns_p)
5881 struct expand_operand eops[3];
5882 enum insn_code icode;
5883 int method, i;
5884 machine_mode wmode;
5885 rtx m1, m2;
5886 optab tab1, tab2;
5888 method = can_mult_highpart_p (mode, uns_p);
5889 switch (method)
5891 case 0:
5892 return NULL_RTX;
5893 case 1:
5894 tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5895 return expand_binop (mode, tab1, op0, op1, target, uns_p,
5896 OPTAB_LIB_WIDEN);
5897 case 2:
5898 tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5899 tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5900 break;
5901 case 3:
5902 tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5903 tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5904 if (BYTES_BIG_ENDIAN)
5905 std::swap (tab1, tab2);
5906 break;
5907 default:
5908 gcc_unreachable ();
5911 icode = optab_handler (tab1, mode);
5912 wmode = insn_data[icode].operand[0].mode;
5913 gcc_checking_assert (known_eq (2 * GET_MODE_NUNITS (wmode),
5914 GET_MODE_NUNITS (mode)));
5915 gcc_checking_assert (known_eq (GET_MODE_SIZE (wmode), GET_MODE_SIZE (mode)));
5917 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5918 create_input_operand (&eops[1], op0, mode);
5919 create_input_operand (&eops[2], op1, mode);
5920 expand_insn (icode, 3, eops);
5921 m1 = gen_lowpart (mode, eops[0].value);
5923 create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5924 create_input_operand (&eops[1], op0, mode);
5925 create_input_operand (&eops[2], op1, mode);
5926 expand_insn (optab_handler (tab2, mode), 3, eops);
5927 m2 = gen_lowpart (mode, eops[0].value);
5929 vec_perm_builder sel;
5930 if (method == 2)
5932 /* The encoding has 2 interleaved stepped patterns. */
5933 sel.new_vector (GET_MODE_NUNITS (mode), 2, 3);
5934 for (i = 0; i < 6; ++i)
5935 sel.quick_push (!BYTES_BIG_ENDIAN + (i & ~1)
5936 + ((i & 1) ? GET_MODE_NUNITS (mode) : 0));
5938 else
5940 /* The encoding has a single interleaved stepped pattern. */
5941 sel.new_vector (GET_MODE_NUNITS (mode), 1, 3);
5942 for (i = 0; i < 3; ++i)
5943 sel.quick_push (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
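  /* (Illustrative example: for little-endian V4SImode with V2DImode products,
     method 2 yields the selector {1, 5, 3, 7}: lane 1 of M1 holds the high
     half of A[0]*B[0], lane 1 of M2 (selector value 5) holds the high half
     of A[1]*B[1], and so on.)  */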
5946 return expand_vec_perm_const (mode, m1, m2, sel, BLKmode, target);
5949 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5950 pattern. */
5952 static void
5953 find_cc_set (rtx x, const_rtx pat, void *data)
5955 if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5956 && GET_CODE (pat) == SET)
5958 rtx *p_cc_reg = (rtx *) data;
5959 gcc_assert (!*p_cc_reg);
5960 *p_cc_reg = x;
5964 /* This is a helper function for the other atomic operations. This function
5965 emits a loop that contains SEQ that iterates until a compare-and-swap
5966 operation at the end succeeds. MEM is the memory to be modified. SEQ is
5967 a set of instructions that takes a value from OLD_REG as an input and
5968 produces a value in NEW_REG as an output. Before SEQ, OLD_REG will be
5969 set to the current contents of MEM. After SEQ, a compare-and-swap will
5970 attempt to update MEM with NEW_REG. The function returns true when the
5971 loop was generated successfully. */
5973 static bool
5974 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5976 machine_mode mode = GET_MODE (mem);
5977 rtx_code_label *label;
5978 rtx cmp_reg, success, oldval;
5980 /* The loop we want to generate looks like
5982 cmp_reg = mem;
5983 label:
5984 old_reg = cmp_reg;
5985 seq;
5986 (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5987 if (!success)
5988 goto label;
5990 Note that we only do the plain load from memory once. Subsequent
5991 iterations use the value loaded by the compare-and-swap pattern. */
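  /* As an illustrative C-level sketch (hypothetical, written in terms of the
     documented __atomic builtins), an atomic fetch-and-add expanded through
     this loop behaves like:

	old = *mem;
	do
	  new = old + val;
	while (!__atomic_compare_exchange_n (mem, &old, new, false,
					     __ATOMIC_SEQ_CST,
					     __ATOMIC_RELAXED));

     where the compare-exchange reloads OLD on failure, matching the way
     CMP_REG is refreshed by the compare-and-swap pattern below.  */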
5993 label = gen_label_rtx ();
5994 cmp_reg = gen_reg_rtx (mode);
5996 emit_move_insn (cmp_reg, mem);
5997 emit_label (label);
5998 emit_move_insn (old_reg, cmp_reg);
5999 if (seq)
6000 emit_insn (seq);
6002 success = NULL_RTX;
6003 oldval = cmp_reg;
6004 if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
6005 new_reg, false, MEMMODEL_SYNC_SEQ_CST,
6006 MEMMODEL_RELAXED))
6007 return false;
6009 if (oldval != cmp_reg)
6010 emit_move_insn (cmp_reg, oldval);
6012 /* Mark this jump predicted not taken. */
6013 emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
6014 GET_MODE (success), 1, label,
6015 profile_probability::guessed_never ());
6016 return true;
6020 /* This function tries to emit an atomic_exchange instruction.  VAL is written
6021 to *MEM using memory model MODEL. The previous contents of *MEM are returned,
6022 using TARGET if possible. */
6024 static rtx
6025 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6027 machine_mode mode = GET_MODE (mem);
6028 enum insn_code icode;
6030 /* If the target supports the exchange directly, great. */
6031 icode = direct_optab_handler (atomic_exchange_optab, mode);
6032 if (icode != CODE_FOR_nothing)
6034 struct expand_operand ops[4];
6036 create_output_operand (&ops[0], target, mode);
6037 create_fixed_operand (&ops[1], mem);
6038 create_input_operand (&ops[2], val, mode);
6039 create_integer_operand (&ops[3], model);
6040 if (maybe_expand_insn (icode, 4, ops))
6041 return ops[0].value;
6044 return NULL_RTX;
6047 /* This function tries to implement an atomic exchange operation using
6048 __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
6049 The previous contents of *MEM are returned, using TARGET if possible.
6050 Since this instruction is an acquire barrier only, stronger memory
6051 models may require additional barriers to be emitted. */
6053 static rtx
6054 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
6055 enum memmodel model)
6057 machine_mode mode = GET_MODE (mem);
6058 enum insn_code icode;
6059 rtx_insn *last_insn = get_last_insn ();
6061 icode = optab_handler (sync_lock_test_and_set_optab, mode);
6063 /* Legacy sync_lock_test_and_set is an acquire barrier. If the pattern
6064 exists, and the memory model is stronger than acquire, add a release
6065 barrier before the instruction. */
6067 if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
6068 expand_mem_thread_fence (model);
6070 if (icode != CODE_FOR_nothing)
6072 struct expand_operand ops[3];
6073 create_output_operand (&ops[0], target, mode);
6074 create_fixed_operand (&ops[1], mem);
6075 create_input_operand (&ops[2], val, mode);
6076 if (maybe_expand_insn (icode, 3, ops))
6077 return ops[0].value;
6080 /* If an external test-and-set libcall is provided, use that instead of
6081 any external compare-and-swap that we might get from the compare-and-
6082 swap-loop expansion later. */
6083 if (!can_compare_and_swap_p (mode, false))
6085 rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
6086 if (libfunc != NULL)
6088 rtx addr;
6090 addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6091 return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6092 mode, addr, ptr_mode,
6093 val, mode);
6097 /* If the test_and_set can't be emitted, eliminate any barrier that might
6098 have been emitted. */
6099 delete_insns_since (last_insn);
6100 return NULL_RTX;
6103 /* This function tries to implement an atomic exchange operation using a
6104 compare_and_swap loop. VAL is written to *MEM. The previous contents of
6105 *MEM are returned, using TARGET if possible. No memory model is required
6106 since a compare_and_swap loop is seq-cst. */
6108 static rtx
6109 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6111 machine_mode mode = GET_MODE (mem);
6113 if (can_compare_and_swap_p (mode, true))
6115 if (!target || !register_operand (target, mode))
6116 target = gen_reg_rtx (mode);
6117 if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6118 return target;
6121 return NULL_RTX;
6124 /* This function tries to implement an atomic test-and-set operation
6125 using the atomic_test_and_set instruction pattern. A boolean value
6126 is returned from the operation, using TARGET if possible. */
6128 static rtx
6129 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6131 machine_mode pat_bool_mode;
6132 struct expand_operand ops[3];
6134 if (!targetm.have_atomic_test_and_set ())
6135 return NULL_RTX;
6137 /* While we always get QImode from __atomic_test_and_set, we get
6138 other memory modes from __sync_lock_test_and_set. Note that we
6139 use no endian adjustment here. This matches the 4.6 behavior
6140 in the Sparc backend. */
6141 enum insn_code icode = targetm.code_for_atomic_test_and_set;
6142 gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6143 if (GET_MODE (mem) != QImode)
6144 mem = adjust_address_nv (mem, QImode, 0);
6146 pat_bool_mode = insn_data[icode].operand[0].mode;
6147 create_output_operand (&ops[0], target, pat_bool_mode);
6148 create_fixed_operand (&ops[1], mem);
6149 create_integer_operand (&ops[2], model);
6151 if (maybe_expand_insn (icode, 3, ops))
6152 return ops[0].value;
6153 return NULL_RTX;
6156 /* This function expands the legacy __sync_lock_test_and_set operation, which is
6157 generally an atomic exchange. Some limited targets only allow the
6158 constant 1 to be stored. This is an ACQUIRE operation.
6160 TARGET is an optional place to stick the return value.
6161 MEM is where VAL is stored. */
6164 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6166 rtx ret;
6168 /* Try an atomic_exchange first. */
6169 ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6170 if (ret)
6171 return ret;
6173 ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6174 MEMMODEL_SYNC_ACQUIRE);
6175 if (ret)
6176 return ret;
6178 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6179 if (ret)
6180 return ret;
6182 /* If there are no other options, try atomic_test_and_set if the value
6183 being stored is 1. */
6184 if (val == const1_rtx)
6185 ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6187 return ret;
6190 /* This function expands the atomic test_and_set operation:
6191 atomically store a boolean TRUE into MEM and return the previous value.
6193 MEMMODEL is the memory model variant to use.
6194 TARGET is an optional place to stick the return value. */
6197 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6199 machine_mode mode = GET_MODE (mem);
6200 rtx ret, trueval, subtarget;
6202 ret = maybe_emit_atomic_test_and_set (target, mem, model);
6203 if (ret)
6204 return ret;
6206 /* Be binary compatible with non-default settings of trueval, and different
6207 CPU revisions.  E.g. one revision may have atomic-test-and-set, but
6208 another only has atomic-exchange. */
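  /* (Illustrative example: a target whose test-and-set instruction stores
     0xff, in the style of SPARC's ldstub, would define
     atomic_test_and_set_trueval as 0xff; the result is then normalized back
     to 0/1 at the end of this function.)  */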
6209 if (targetm.atomic_test_and_set_trueval == 1)
6211 trueval = const1_rtx;
6212 subtarget = target ? target : gen_reg_rtx (mode);
6214 else
6216 trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6217 subtarget = gen_reg_rtx (mode);
6220 /* Try the atomic-exchange optab... */
6221 ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6223 /* ... then an atomic-compare-and-swap loop ... */
6224 if (!ret)
6225 ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6227 /* ... before trying the vaguely defined legacy lock_test_and_set. */
6228 if (!ret)
6229 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6231 /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6232 things with the value 1. Thus we try again without trueval. */
6233 if (!ret && targetm.atomic_test_and_set_trueval != 1)
6234 ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6236 /* Failing all else, assume a single threaded environment and simply
6237 perform the operation. */
6238 if (!ret)
6240 /* If the result is ignored, skip the move to target. */
6241 if (subtarget != const0_rtx)
6242 emit_move_insn (subtarget, mem);
6244 emit_move_insn (mem, trueval);
6245 ret = subtarget;
6248 /* Recall that we have to return a boolean value; rectify if trueval
6249 is not exactly one. */
6250 if (targetm.atomic_test_and_set_trueval != 1)
6251 ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6253 return ret;
6256 /* This function expands the atomic exchange operation:
6257 atomically store VAL in MEM and return the previous value in MEM.
6259 MEMMODEL is the memory model variant to use.
6260 TARGET is an optional place to stick the return value. */
6263 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6265 machine_mode mode = GET_MODE (mem);
6266 rtx ret;
6268 /* If loads are not atomic for the required size and we are not called to
6269 provide a __sync builtin, do not do anything so that we stay consistent
6270 with atomic loads of the same size. */
6271 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6272 return NULL_RTX;
6274 ret = maybe_emit_atomic_exchange (target, mem, val, model);
6276 /* Next try a compare-and-swap loop for the exchange. */
6277 if (!ret)
6278 ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6280 return ret;
6283 /* This function expands the atomic compare exchange operation:
6285 *PTARGET_BOOL is an optional place to store the boolean success/failure.
6286 *PTARGET_OVAL is an optional place to store the old value from memory.
6287 Both target parameters may be NULL or const0_rtx to indicate that we do
6288 not care about that return value. Both target parameters are updated on
6289 success to the actual location of the corresponding result.
6291 MEMMODEL is the memory model variant to use.
6293 The return value of the function is true for success. */
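/* (Illustrative note: when expanding __atomic_compare_exchange_n, the builtin
   expander passes PTARGET_BOOL for the success flag and PTARGET_OVAL for the
   loaded value, which it copies back into the "expected" object when the
   operation fails.)  */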
6295 bool
6296 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6297 rtx mem, rtx expected, rtx desired,
6298 bool is_weak, enum memmodel succ_model,
6299 enum memmodel fail_model)
6301 machine_mode mode = GET_MODE (mem);
6302 struct expand_operand ops[8];
6303 enum insn_code icode;
6304 rtx target_oval, target_bool = NULL_RTX;
6305 rtx libfunc;
6307 /* If loads are not atomic for the required size and we are not called to
6308 provide a __sync builtin, do not do anything so that we stay consistent
6309 with atomic loads of the same size. */
6310 if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6311 return false;
6313 /* Load expected into a register for the compare and swap. */
6314 if (MEM_P (expected))
6315 expected = copy_to_reg (expected);
6317 /* Make sure we always have some place to put the return oldval.
6318 Further, make sure that place is distinct from the input expected,
6319 just in case we need that path down below. */
6320 if (ptarget_oval && *ptarget_oval == const0_rtx)
6321 ptarget_oval = NULL;
6323 if (ptarget_oval == NULL
6324 || (target_oval = *ptarget_oval) == NULL
6325 || reg_overlap_mentioned_p (expected, target_oval))
6326 target_oval = gen_reg_rtx (mode);
6328 icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6329 if (icode != CODE_FOR_nothing)
6331 machine_mode bool_mode = insn_data[icode].operand[0].mode;
6333 if (ptarget_bool && *ptarget_bool == const0_rtx)
6334 ptarget_bool = NULL;
6336 /* Make sure we always have a place for the bool operand. */
6337 if (ptarget_bool == NULL
6338 || (target_bool = *ptarget_bool) == NULL
6339 || GET_MODE (target_bool) != bool_mode)
6340 target_bool = gen_reg_rtx (bool_mode);
6342 /* Emit the compare_and_swap. */
6343 create_output_operand (&ops[0], target_bool, bool_mode);
6344 create_output_operand (&ops[1], target_oval, mode);
6345 create_fixed_operand (&ops[2], mem);
6346 create_input_operand (&ops[3], expected, mode);
6347 create_input_operand (&ops[4], desired, mode);
6348 create_integer_operand (&ops[5], is_weak);
6349 create_integer_operand (&ops[6], succ_model);
6350 create_integer_operand (&ops[7], fail_model);
6351 if (maybe_expand_insn (icode, 8, ops))
6353 /* Return success/failure. */
6354 target_bool = ops[0].value;
6355 target_oval = ops[1].value;
6356 goto success;
6360 /* Otherwise fall back to the original __sync_val_compare_and_swap
6361 which is always seq-cst. */
6362 icode = optab_handler (sync_compare_and_swap_optab, mode);
6363 if (icode != CODE_FOR_nothing)
6365 rtx cc_reg;
6367 create_output_operand (&ops[0], target_oval, mode);
6368 create_fixed_operand (&ops[1], mem);
6369 create_input_operand (&ops[2], expected, mode);
6370 create_input_operand (&ops[3], desired, mode);
6371 if (!maybe_expand_insn (icode, 4, ops))
6372 return false;
6374 target_oval = ops[0].value;
6376 /* If the caller isn't interested in the boolean return value,
6377 skip the computation of it. */
6378 if (ptarget_bool == NULL)
6379 goto success;
6381 /* Otherwise, work out if the compare-and-swap succeeded. */
6382 cc_reg = NULL_RTX;
6383 if (have_insn_for (COMPARE, CCmode))
6384 note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6385 if (cc_reg)
6387 target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6388 const0_rtx, VOIDmode, 0, 1);
6389 goto success;
6391 goto success_bool_from_val;
6394 /* Also check for library support for __sync_val_compare_and_swap. */
6395 libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6396 if (libfunc != NULL)
6398 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6399 rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6400 mode, addr, ptr_mode,
6401 expected, mode, desired, mode);
6402 emit_move_insn (target_oval, target);
6404 /* Compute the boolean return value only if requested. */
6405 if (ptarget_bool)
6406 goto success_bool_from_val;
6407 else
6408 goto success;
6411 /* Failure. */
6412 return false;
6414 success_bool_from_val:
6415 target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6416 expected, VOIDmode, 1, 1);
6417 success:
6418 /* Make sure that the oval output winds up where the caller asked. */
6419 if (ptarget_oval)
6420 *ptarget_oval = target_oval;
6421 if (ptarget_bool)
6422 *ptarget_bool = target_bool;
6423 return true;
6426 /* Generate asm volatile("" : : : "memory") as the memory blockage. */
6428 static void
6429 expand_asm_memory_blockage (void)
6431 rtx asm_op, clob;
6433 asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6434 rtvec_alloc (0), rtvec_alloc (0),
6435 rtvec_alloc (0), UNKNOWN_LOCATION);
6436 MEM_VOLATILE_P (asm_op) = 1;
6438 clob = gen_rtx_SCRATCH (VOIDmode);
6439 clob = gen_rtx_MEM (BLKmode, clob);
6440 clob = gen_rtx_CLOBBER (VOIDmode, clob);
6442 emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6445 /* Do not propagate memory accesses across this point. */
6447 static void
6448 expand_memory_blockage (void)
6450 if (targetm.have_memory_blockage ())
6451 emit_insn (targetm.gen_memory_blockage ());
6452 else
6453 expand_asm_memory_blockage ();
6456 /* This routine will either emit the mem_thread_fence pattern or issue a
6457 sync_synchronize to generate a fence for memory model MEMMODEL. */
6459 void
6460 expand_mem_thread_fence (enum memmodel model)
6462 if (is_mm_relaxed (model))
6463 return;
6464 if (targetm.have_mem_thread_fence ())
6466 emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6467 expand_memory_blockage ();
6469 else if (targetm.have_memory_barrier ())
6470 emit_insn (targetm.gen_memory_barrier ());
6471 else if (synchronize_libfunc != NULL_RTX)
6472 emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
6473 else
6474 expand_memory_blockage ();
6477 /* Emit a signal fence with given memory model. */
6479 void
6480 expand_mem_signal_fence (enum memmodel model)
6482 /* No machine barrier is required to implement a signal fence, but
6483 a compiler memory barrier must be issued, except for relaxed MM. */
6484 if (!is_mm_relaxed (model))
6485 expand_memory_blockage ();
6488 /* This function expands the atomic load operation:
6489 return the atomically loaded value in MEM.
6491 MEMMODEL is the memory model variant to use.
6492 TARGET is an optional place to stick the return value. */
6495 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6497 machine_mode mode = GET_MODE (mem);
6498 enum insn_code icode;
6500 /* If the target supports the load directly, great. */
6501 icode = direct_optab_handler (atomic_load_optab, mode);
6502 if (icode != CODE_FOR_nothing)
6504 struct expand_operand ops[3];
6505 rtx_insn *last = get_last_insn ();
6506 if (is_mm_seq_cst (model))
6507 expand_memory_blockage ();
6509 create_output_operand (&ops[0], target, mode);
6510 create_fixed_operand (&ops[1], mem);
6511 create_integer_operand (&ops[2], model);
6512 if (maybe_expand_insn (icode, 3, ops))
6514 if (!is_mm_relaxed (model))
6515 expand_memory_blockage ();
6516 return ops[0].value;
6518 delete_insns_since (last);
6521 /* If the size of the object is greater than word size on this target,
6522 then we assume that a load will not be atomic.  We could try to
6523 emulate a load with a compare-and-swap operation, but the store that
6524 doing so would entail could be incorrect if this is a volatile
6525 atomic load or targets read-only-mapped memory. */
6526 if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
6527 /* If there is no atomic load, leave the library call. */
6528 return NULL_RTX;
6530 /* Otherwise assume loads are atomic, and emit the proper barriers. */
6531 if (!target || target == const0_rtx)
6532 target = gen_reg_rtx (mode);
6534 /* For SEQ_CST, emit a barrier before the load. */
6535 if (is_mm_seq_cst (model))
6536 expand_mem_thread_fence (model);
6538 emit_move_insn (target, mem);
6540 /* Emit the appropriate barrier after the load. */
6541 expand_mem_thread_fence (model);
6543 return target;
6546 /* This function expands the atomic store operation:
6547 Atomically store VAL in MEM.
6548 MEMMODEL is the memory model variant to use.
6549 USE_RELEASE is true if __sync_lock_release can be used as a fallback.
6550 The function returns const0_rtx if a pattern was emitted. */
6553 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6555 machine_mode mode = GET_MODE (mem);
6556 enum insn_code icode;
6557 struct expand_operand ops[3];
6559 /* If the target supports the store directly, great. */
6560 icode = direct_optab_handler (atomic_store_optab, mode);
6561 if (icode != CODE_FOR_nothing)
6563 rtx_insn *last = get_last_insn ();
6564 if (!is_mm_relaxed (model))
6565 expand_memory_blockage ();
6566 create_fixed_operand (&ops[0], mem);
6567 create_input_operand (&ops[1], val, mode);
6568 create_integer_operand (&ops[2], model);
6569 if (maybe_expand_insn (icode, 3, ops))
6571 if (is_mm_seq_cst (model))
6572 expand_memory_blockage ();
6573 return const0_rtx;
6575 delete_insns_since (last);
6578 /* If using __sync_lock_release is a viable alternative, try it.
6579 Note that this will not be set to true if we are expanding a generic
6580 __atomic_store_n. */
6581 if (use_release)
6583 icode = direct_optab_handler (sync_lock_release_optab, mode);
6584 if (icode != CODE_FOR_nothing)
6586 create_fixed_operand (&ops[0], mem);
6587 create_input_operand (&ops[1], const0_rtx, mode);
6588 if (maybe_expand_insn (icode, 2, ops))
6590 /* lock_release is only a release barrier. */
6591 if (is_mm_seq_cst (model))
6592 expand_mem_thread_fence (model);
6593 return const0_rtx;
6598 /* If the size of the object is greater than word size on this target,
6599 a default store will not be atomic. */
6600 if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
6602 /* If loads are atomic or we are called to provide a __sync builtin,
6603 we can try an atomic_exchange and throw away the result.  Otherwise,
6604 don't do anything so that we do not create an inconsistency between
6605 loads and stores. */
6606 if (can_atomic_load_p (mode) || is_mm_sync (model))
6608 rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6609 if (!target)
6610 target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6611 val);
6612 if (target)
6613 return const0_rtx;
6615 return NULL_RTX;
6618 /* Otherwise assume stores are atomic, and emit the proper barriers. */
6619 expand_mem_thread_fence (model);
6621 emit_move_insn (mem, val);
6623 /* For SEQ_CST, also emit a barrier after the store. */
6624 if (is_mm_seq_cst (model))
6625 expand_mem_thread_fence (model);
6627 return const0_rtx;
6631 /* Structure containing the pointers and values required to process the
6632 various forms of the atomic_fetch_op and atomic_op_fetch builtins. */
6634 struct atomic_op_functions
6636 direct_optab mem_fetch_before;
6637 direct_optab mem_fetch_after;
6638 direct_optab mem_no_result;
6639 optab fetch_before;
6640 optab fetch_after;
6641 direct_optab no_result;
6642 enum rtx_code reverse_code;
6646 /* Fill in structure pointed to by OP with the various optab entries for an
6647 operation of type CODE. */
6649 static void
6650 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6652 gcc_assert (op != NULL);
6654 /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6655 in the source code during compilation, and the optab entries are not
6656 computable until runtime. Fill in the values at runtime. */
6657 switch (code)
6659 case PLUS:
6660 op->mem_fetch_before = atomic_fetch_add_optab;
6661 op->mem_fetch_after = atomic_add_fetch_optab;
6662 op->mem_no_result = atomic_add_optab;
6663 op->fetch_before = sync_old_add_optab;
6664 op->fetch_after = sync_new_add_optab;
6665 op->no_result = sync_add_optab;
6666 op->reverse_code = MINUS;
6667 break;
6668 case MINUS:
6669 op->mem_fetch_before = atomic_fetch_sub_optab;
6670 op->mem_fetch_after = atomic_sub_fetch_optab;
6671 op->mem_no_result = atomic_sub_optab;
6672 op->fetch_before = sync_old_sub_optab;
6673 op->fetch_after = sync_new_sub_optab;
6674 op->no_result = sync_sub_optab;
6675 op->reverse_code = PLUS;
6676 break;
6677 case XOR:
6678 op->mem_fetch_before = atomic_fetch_xor_optab;
6679 op->mem_fetch_after = atomic_xor_fetch_optab;
6680 op->mem_no_result = atomic_xor_optab;
6681 op->fetch_before = sync_old_xor_optab;
6682 op->fetch_after = sync_new_xor_optab;
6683 op->no_result = sync_xor_optab;
6684 op->reverse_code = XOR;
6685 break;
6686 case AND:
6687 op->mem_fetch_before = atomic_fetch_and_optab;
6688 op->mem_fetch_after = atomic_and_fetch_optab;
6689 op->mem_no_result = atomic_and_optab;
6690 op->fetch_before = sync_old_and_optab;
6691 op->fetch_after = sync_new_and_optab;
6692 op->no_result = sync_and_optab;
6693 op->reverse_code = UNKNOWN;
6694 break;
6695 case IOR:
6696 op->mem_fetch_before = atomic_fetch_or_optab;
6697 op->mem_fetch_after = atomic_or_fetch_optab;
6698 op->mem_no_result = atomic_or_optab;
6699 op->fetch_before = sync_old_ior_optab;
6700 op->fetch_after = sync_new_ior_optab;
6701 op->no_result = sync_ior_optab;
6702 op->reverse_code = UNKNOWN;
6703 break;
6704 case NOT:
6705 op->mem_fetch_before = atomic_fetch_nand_optab;
6706 op->mem_fetch_after = atomic_nand_fetch_optab;
6707 op->mem_no_result = atomic_nand_optab;
6708 op->fetch_before = sync_old_nand_optab;
6709 op->fetch_after = sync_new_nand_optab;
6710 op->no_result = sync_nand_optab;
6711 op->reverse_code = UNKNOWN;
6712 break;
6713 default:
6714 gcc_unreachable ();
6718 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
6719 using memory order MODEL. If AFTER is true the operation needs to return
6720 the value of *MEM after the operation, otherwise the previous value.
6721 TARGET is an optional place to hold the result.  The result is unused if
6722 it is const0_rtx.
6723 Return the result if there is a better sequence, otherwise NULL_RTX. */
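/* (Illustrative example: __atomic_fetch_and (&x, 0, m) unconditionally stores
   0 and returns the previous value, which is exactly
   __atomic_exchange_n (&x, 0, m); likewise __atomic_fetch_or (&x, -1, m) is
   an exchange of -1.)  */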
6725 static rtx
6726 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6727 enum memmodel model, bool after)
6729 /* If the value is prefetched, or not used, it may be possible to replace
6730 the sequence with a native exchange operation. */
6731 if (!after || target == const0_rtx)
6733 /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m). */
6734 if (code == AND && val == const0_rtx)
6736 if (target == const0_rtx)
6737 target = gen_reg_rtx (GET_MODE (mem));
6738 return maybe_emit_atomic_exchange (target, mem, val, model);
6741 /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m). */
6742 if (code == IOR && val == constm1_rtx)
6744 if (target == const0_rtx)
6745 target = gen_reg_rtx (GET_MODE (mem));
6746 return maybe_emit_atomic_exchange (target, mem, val, model);
6750 return NULL_RTX;
6753 /* Try to emit an instruction for a specific operation variation.
6754 OPTAB contains the OP functions.
6755 TARGET is an optional place to return the result. const0_rtx means unused.
6756 MEM is the memory location to operate on.
6757 VAL is the value to use in the operation.
6758 USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6759 MODEL is the memory model, if used.
6760 AFTER is true if the returned result is the value after the operation. */
6762 static rtx
6763 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6764 rtx val, bool use_memmodel, enum memmodel model, bool after)
6766 machine_mode mode = GET_MODE (mem);
6767 struct expand_operand ops[4];
6768 enum insn_code icode;
6769 int op_counter = 0;
6770 int num_ops;
6772 /* Check to see if there is a result returned. */
6773 if (target == const0_rtx)
6775 if (use_memmodel)
6777 icode = direct_optab_handler (optab->mem_no_result, mode);
6778 create_integer_operand (&ops[2], model);
6779 num_ops = 3;
6781 else
6783 icode = direct_optab_handler (optab->no_result, mode);
6784 num_ops = 2;
6787 /* Otherwise, we need to generate a result. */
6788 else
6790 if (use_memmodel)
6792 icode = direct_optab_handler (after ? optab->mem_fetch_after
6793 : optab->mem_fetch_before, mode);
6794 create_integer_operand (&ops[3], model);
6795 num_ops = 4;
6797 else
6799 icode = optab_handler (after ? optab->fetch_after
6800 : optab->fetch_before, mode);
6801 num_ops = 3;
6803 create_output_operand (&ops[op_counter++], target, mode);
6805 if (icode == CODE_FOR_nothing)
6806 return NULL_RTX;
6808 create_fixed_operand (&ops[op_counter++], mem);
6809 /* VAL may have been promoted to a wider mode. Shrink it if so. */
6810 create_convert_operand_to (&ops[op_counter++], val, mode, true);
6812 if (maybe_expand_insn (icode, num_ops, ops))
6813 return (target == const0_rtx ? const0_rtx : ops[0].value);
6815 return NULL_RTX;
6819 /* This function expands an atomic fetch_OP or OP_fetch operation:
6820 TARGET is an optional place to stick the return value.  const0_rtx indicates
6821 the result is unused.
6822 Atomically fetch MEM, perform the operation with VAL, and store the result back in MEM.
6823 CODE is the operation being performed (OP).
6824 MEMMODEL is the memory model variant to use.
6825 AFTER is true to return the result of the operation (OP_fetch).
6826 AFTER is false to return the value before the operation (fetch_OP).
6828 This function will *only* generate instructions if there is a direct
6829 optab. No compare and swap loops or libcalls will be generated. */
6831 static rtx
6832 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6833 enum rtx_code code, enum memmodel model,
6834 bool after)
6836 machine_mode mode = GET_MODE (mem);
6837 struct atomic_op_functions optab;
6838 rtx result;
6839 bool unused_result = (target == const0_rtx);
6841 get_atomic_op_for_code (&optab, code);
6843 /* Check to see if there are any better instructions. */
6844 result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6845 if (result)
6846 return result;
6848 /* Check for the case where the result isn't used and try those patterns. */
6849 if (unused_result)
6851 /* Try the memory model variant first. */
6852 result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6853 if (result)
6854 return result;
6856 /* Next try the old style without a memory model. */
6857 result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6858 if (result)
6859 return result;
6861 /* There is no no-result pattern, so try patterns with a result. */
6862 target = NULL_RTX;
6865 /* Try the __atomic version. */
6866 result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6867 if (result)
6868 return result;
6870 /* Try the older __sync version. */
6871 result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6872 if (result)
6873 return result;
6875 /* If the fetch value can be calculated from the other variation of fetch,
6876 try that operation. */
6877 if (after || unused_result || optab.reverse_code != UNKNOWN)
6879 /* Try the __atomic version, then the older __sync version. */
6880 result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6881 if (!result)
6882 result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6884 if (result)
6886 /* If the result isn't used, no need to do compensation code. */
6887 if (unused_result)
6888 return result;
6890 /* Issue compensation code.  Fetch_after == fetch_before OP val.
6891 Fetch_before == fetch_after REVERSE_OP val. */
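	  /* (Illustrative example: add_fetch (&x, v) == fetch_add (&x, v) + v,
	     and nand_fetch (&x, v) == ~(fetch_nand (&x, v) & v), which is the
	     NOT special case handled below.)  */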
6892 if (!after)
6893 code = optab.reverse_code;
6894 if (code == NOT)
6896 result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6897 true, OPTAB_LIB_WIDEN);
6898 result = expand_simple_unop (mode, NOT, result, target, true);
6900 else
6901 result = expand_simple_binop (mode, code, result, val, target,
6902 true, OPTAB_LIB_WIDEN);
6903 return result;
6907 /* No direct opcode can be generated. */
6908 return NULL_RTX;
6913 /* This function expands an atomic fetch_OP or OP_fetch operation:
6914 TARGET is an optional place to stick the return value.  const0_rtx indicates
6915 the result is unused.
6916 Atomically fetch MEM, perform the operation with VAL, and store the result back in MEM.
6917 CODE is the operation being performed (OP).
6918 MEMMODEL is the memory model variant to use.
6919 AFTER is true to return the result of the operation (OP_fetch).
6920 AFTER is false to return the value before the operation (fetch_OP). */
6922 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6923 enum memmodel model, bool after)
6925 machine_mode mode = GET_MODE (mem);
6926 rtx result;
6927 bool unused_result = (target == const0_rtx);
6929 /* If loads are not atomic for the required size and we are not called to
6930 provide a __sync builtin, do not do anything so that we stay consistent
6931 with atomic loads of the same size. */
6932 if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6933 return NULL_RTX;
6935 result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6936 after);
6938 if (result)
6939 return result;
6941 /* Add/sub can be implemented by doing the reverse operation with -(val). */
6942 if (code == PLUS || code == MINUS)
6944 rtx tmp;
6945 enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6947 start_sequence ();
6948 tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6949 result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6950 model, after);
6951 if (result)
6953 /* The reverse operation worked, so emit the insns and return. */
6954 tmp = get_insns ();
6955 end_sequence ();
6956 emit_insn (tmp);
6957 return result;
6960 /* The reverse operation did not work, so throw away the negation code and continue. */
6961 end_sequence ();
6964 /* Try the __sync libcalls only if we can't do compare-and-swap inline. */
6965 if (!can_compare_and_swap_p (mode, false))
6967 rtx libfunc;
6968 bool fixup = false;
6969 enum rtx_code orig_code = code;
6970 struct atomic_op_functions optab;
6972 get_atomic_op_for_code (&optab, code);
6973 libfunc = optab_libfunc (after ? optab.fetch_after
6974 : optab.fetch_before, mode);
6975 if (libfunc == NULL
6976 && (after || unused_result || optab.reverse_code != UNKNOWN))
6978 fixup = true;
6979 if (!after)
6980 code = optab.reverse_code;
6981 libfunc = optab_libfunc (after ? optab.fetch_before
6982 : optab.fetch_after, mode);
6984 if (libfunc != NULL)
6986 rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6987 result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6988 addr, ptr_mode, val, mode);
6990 if (!unused_result && fixup)
6991 result = expand_simple_binop (mode, code, result, val, target,
6992 true, OPTAB_LIB_WIDEN);
6993 return result;
6996 /* We need the original code for any further attempts. */
6997 code = orig_code;
7000 /* If nothing else has succeeded, default to a compare and swap loop. */
7001 if (can_compare_and_swap_p (mode, true))
7003 rtx_insn *insn;
7004 rtx t0 = gen_reg_rtx (mode), t1;
7006 start_sequence ();
7008 /* If the result is used, get a register for it. */
7009 if (!unused_result)
7011 if (!target || !register_operand (target, mode))
7012 target = gen_reg_rtx (mode);
7013 /* If fetch_before, copy the value now. */
7014 if (!after)
7015 emit_move_insn (target, t0);
7017 else
7018 target = const0_rtx;
7020 t1 = t0;
7021 if (code == NOT)
7023 t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
7024 true, OPTAB_LIB_WIDEN);
7025 t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
7027 else
7028 t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
7029 OPTAB_LIB_WIDEN);
7031 /* For after, copy the value now. */
7032 if (!unused_result && after)
7033 emit_move_insn (target, t1);
7034 insn = get_insns ();
7035 end_sequence ();
7037 if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
7038 return target;
7041 return NULL_RTX;
7044 /* Return true if OPERAND is suitable for operand number OPNO of
7045 instruction ICODE. */
7047 bool
7048 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
7050 return (!insn_data[(int) icode].operand[opno].predicate
7051 || (insn_data[(int) icode].operand[opno].predicate
7052 (operand, insn_data[(int) icode].operand[opno].mode)));
7055 /* TARGET is a target of a multiword operation that we are going to
7056 implement as a series of word-mode operations. Return true if
7057 TARGET is suitable for this purpose. */
7059 bool
7060 valid_multiword_target_p (rtx target)
7062 machine_mode mode;
7063 int i, size;
7065 mode = GET_MODE (target);
7066 if (!GET_MODE_SIZE (mode).is_constant (&size))
7067 return false;
7068 for (i = 0; i < size; i += UNITS_PER_WORD)
7069 if (!validate_subreg (word_mode, mode, target, i))
7070 return false;
7071 return true;
7074 /* Make OP describe an input operand that has value INTVAL and that has
7075 no inherent mode. This function should only be used for operands that
7076 are always expand-time constants. The backend may request that INTVAL
7077 be copied into a different kind of rtx, but it must specify the mode
7078 of that rtx if so. */
7080 void
7081 create_integer_operand (struct expand_operand *op, poly_int64 intval)
7083 create_expand_operand (op, EXPAND_INTEGER,
7084 gen_int_mode (intval, MAX_MODE_INT),
7085 VOIDmode, false, intval);
7088 /* Like maybe_legitimize_operand, but do not change the code of the
7089 current rtx value. */
7091 static bool
7092 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7093 struct expand_operand *op)
7095 /* See if the operand matches in its current form. */
7096 if (insn_operand_matches (icode, opno, op->value))
7097 return true;
7099 /* If the operand is a memory whose address has no side effects,
7100 try forcing the address into a non-virtual pseudo register.
7101 The check for side effects is important because copy_to_mode_reg
7102 cannot handle things like auto-modified addresses. */
7103 if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7105 rtx addr, mem;
7107 mem = op->value;
7108 addr = XEXP (mem, 0);
7109 if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7110 && !side_effects_p (addr))
7112 rtx_insn *last;
7113 machine_mode mode;
7115 last = get_last_insn ();
7116 mode = get_address_mode (mem);
7117 mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
7118 if (insn_operand_matches (icode, opno, mem))
7120 op->value = mem;
7121 return true;
7123 delete_insns_since (last);
7127 return false;
7130 /* Try to make OP match operand OPNO of instruction ICODE. Return true
7131 on success, storing the new operand value back in OP. */
7133 static bool
7134 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
7135 struct expand_operand *op)
7137 machine_mode mode, imode;
7138 bool old_volatile_ok, result;
7140 mode = op->mode;
7141 switch (op->type)
7143 case EXPAND_FIXED:
7144 old_volatile_ok = volatile_ok;
7145 volatile_ok = true;
7146 result = maybe_legitimize_operand_same_code (icode, opno, op);
7147 volatile_ok = old_volatile_ok;
7148 return result;
7150 case EXPAND_OUTPUT:
7151 gcc_assert (mode != VOIDmode);
7152 if (op->value
7153 && op->value != const0_rtx
7154 && GET_MODE (op->value) == mode
7155 && maybe_legitimize_operand_same_code (icode, opno, op))
7156 return true;
7158 op->value = gen_reg_rtx (mode);
7159 op->target = 0;
7160 break;
7162 case EXPAND_INPUT:
7163 input:
7164 gcc_assert (mode != VOIDmode);
7165 gcc_assert (GET_MODE (op->value) == VOIDmode
7166 || GET_MODE (op->value) == mode);
7167 if (maybe_legitimize_operand_same_code (icode, opno, op))
7168 return true;
7170 op->value = copy_to_mode_reg (mode, op->value);
7171 break;
7173 case EXPAND_CONVERT_TO:
7174 gcc_assert (mode != VOIDmode);
7175 op->value = convert_to_mode (mode, op->value, op->unsigned_p);
7176 goto input;
7178 case EXPAND_CONVERT_FROM:
7179 if (GET_MODE (op->value) != VOIDmode)
7180 mode = GET_MODE (op->value);
7181 else
7182 /* The caller must tell us what mode this value has. */
7183 gcc_assert (mode != VOIDmode);
7185 imode = insn_data[(int) icode].operand[opno].mode;
7186 if (imode != VOIDmode && imode != mode)
7188 op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
7189 mode = imode;
7191 goto input;
7193 case EXPAND_ADDRESS:
7194 op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
7195 op->value);
7196 goto input;
7198 case EXPAND_INTEGER:
7199 mode = insn_data[(int) icode].operand[opno].mode;
7200 if (mode != VOIDmode
7201 && known_eq (trunc_int_for_mode (op->int_value, mode),
7202 op->int_value))
7204 op->value = gen_int_mode (op->int_value, mode);
7205 goto input;
7207 break;
7209 return insn_operand_matches (icode, opno, op->value);
7212 /* Make OP describe an input operand that should have the same value
7213 as VALUE, after any mode conversion that the target might request.
7214 TYPE is the type of VALUE. */
7216 void
7217 create_convert_operand_from_type (struct expand_operand *op,
7218 rtx value, tree type)
7220 create_convert_operand_from (op, value, TYPE_MODE (type),
7221 TYPE_UNSIGNED (type));
7224 /* Return true if the requirements on operands OP1 and OP2 of instruction
7225 ICODE are similar enough for the result of legitimizing OP1 to be
7226 reusable for OP2. OPNO1 and OPNO2 are the operand numbers associated
7227 with OP1 and OP2 respectively. */
7229 static inline bool
7230 can_reuse_operands_p (enum insn_code icode,
7231 unsigned int opno1, unsigned int opno2,
7232 const struct expand_operand *op1,
7233 const struct expand_operand *op2)
7235 /* Check requirements that are common to all types. */
7236 if (op1->type != op2->type
7237 || op1->mode != op2->mode
7238 || (insn_data[(int) icode].operand[opno1].mode
7239 != insn_data[(int) icode].operand[opno2].mode))
7240 return false;
7242 /* Check the requirements for specific types. */
7243 switch (op1->type)
7245 case EXPAND_OUTPUT:
7246 /* Outputs must remain distinct. */
7247 return false;
7249 case EXPAND_FIXED:
7250 case EXPAND_INPUT:
7251 case EXPAND_ADDRESS:
7252 case EXPAND_INTEGER:
7253 return true;
7255 case EXPAND_CONVERT_TO:
7256 case EXPAND_CONVERT_FROM:
7257 return op1->unsigned_p == op2->unsigned_p;
7259 gcc_unreachable ();
7262 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
7263 of instruction ICODE. Return true on success, leaving the new operand
7264 values in the OPS themselves. Emit no code on failure. */
7266 bool
7267 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7268 unsigned int nops, struct expand_operand *ops)
7270 rtx_insn *last = get_last_insn ();
7271 rtx *orig_values = XALLOCAVEC (rtx, nops);
7272 for (unsigned int i = 0; i < nops; i++)
7274 orig_values[i] = ops[i].value;
7276 /* First try reusing the result of an earlier legitimization.
7277 This avoids duplicate rtl and ensures that tied operands
7278 remain tied.
7280 This search is linear, but NOPS is bounded at compile time
7281 to a small number (currently a single digit). */
7282 unsigned int j = 0;
7283 for (; j < i; ++j)
7284 if (can_reuse_operands_p (icode, opno + j, opno + i, &ops[j], &ops[i])
7285 && rtx_equal_p (orig_values[j], orig_values[i])
7286 && ops[j].value
7287 && insn_operand_matches (icode, opno + i, ops[j].value))
7289 ops[i].value = copy_rtx (ops[j].value);
7290 break;
7293 /* Otherwise try legitimizing the operand on its own. */
7294 if (j == i && !maybe_legitimize_operand (icode, opno + i, &ops[i]))
7296 delete_insns_since (last);
7297 return false;
7300 return true;
7303 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7304 as its operands. Return the instruction pattern on success,
7305 and emit any necessary set-up code. Return null and emit no
7306 code on failure. */
7308 rtx_insn *
7309 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7310 struct expand_operand *ops)
7312 gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7313 if (!maybe_legitimize_operands (icode, 0, nops, ops))
7314 return NULL;
7316 switch (nops)
7318 case 1:
7319 return GEN_FCN (icode) (ops[0].value);
7320 case 2:
7321 return GEN_FCN (icode) (ops[0].value, ops[1].value);
7322 case 3:
7323 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7324 case 4:
7325 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7326 ops[3].value);
7327 case 5:
7328 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7329 ops[3].value, ops[4].value);
7330 case 6:
7331 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7332 ops[3].value, ops[4].value, ops[5].value);
7333 case 7:
7334 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7335 ops[3].value, ops[4].value, ops[5].value,
7336 ops[6].value);
7337 case 8:
7338 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7339 ops[3].value, ops[4].value, ops[5].value,
7340 ops[6].value, ops[7].value);
7341 case 9:
7342 return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7343 ops[3].value, ops[4].value, ops[5].value,
7344 ops[6].value, ops[7].value, ops[8].value);
7346 gcc_unreachable ();
7349 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7350 as its operands. Return true on success and emit no code on failure. */
7352 bool
7353 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7354 struct expand_operand *ops)
7356 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7357 if (pat)
7359 emit_insn (pat);
7360 return true;
7362 return false;
7365 /* Like maybe_expand_insn, but for jumps. */
7367 bool
7368 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7369 struct expand_operand *ops)
7371 rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7372 if (pat)
7374 emit_jump_insn (pat);
7375 return true;
7377 return false;
7380 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7381 as its operands. */
7383 void
7384 expand_insn (enum insn_code icode, unsigned int nops,
7385 struct expand_operand *ops)
7387 if (!maybe_expand_insn (icode, nops, ops))
7388 gcc_unreachable ();
7391 /* Like expand_insn, but for jumps. */
7393 void
7394 expand_jump_insn (enum insn_code icode, unsigned int nops,
7395 struct expand_operand *ops)
7397 if (!maybe_expand_jump_insn (icode, nops, ops))
7398 gcc_unreachable ();