gcc/optabs.cc

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2023 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "memmodel.h"
  29 #include "predict.h"
  30 #include "tm_p.h"
  31 #include "optabs.h"
  32 #include "expmed.h"
  33 #include "emit-rtl.h"
  34 #include "recog.h"
  35 #include "diagnostic-core.h"
  36 #include "rtx-vector-builder.h"
  37
  38 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  39    is properly defined.  */
  40 #include "stor-layout.h"
  41 #include "except.h"
  42 #include "dojump.h"
  43 #include "explow.h"
  44 #include "expr.h"
  45 #include "optabs-tree.h"
  46 #include "libfuncs.h"
  47 #include "internal-fn.h"
  48 #include "langhooks.h"
  49 #include "gimple.h"
  50 #include "ssa.h"
  51
  52 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  53                                    machine_mode *);
  54 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  55 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  56
  57 static rtx emit_conditional_move_1 (rtx, rtx, rtx, rtx, machine_mode);
  58
  59 /* Debug facility for use in GDB.  */
  60 void debug_optab_libfuncs (void);
  61 \f
  62 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
  63    the result of operation CODE applied to OP0 (and OP1 if it is a binary
  64    operation).  OP0_MODE is OP0's mode.
  65
  66    If the last insn does not set TARGET, don't do anything, but return true.
  67
  68    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
  69    or OP1, don't add the REG_EQUAL note but return false.  Our caller can then
  70    try again, ensuring that TARGET is not one of the operands.  */
  71
  72 static bool
  73 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0,
  74                 rtx op1, machine_mode op0_mode)
  75 {
  76   rtx_insn *last_insn;
  77   rtx set;
  78   rtx note;
  79
  80   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
  81
  82   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
  83       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
  84       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
  85       && GET_RTX_CLASS (code) != RTX_COMPARE
  86       && GET_RTX_CLASS (code) != RTX_UNARY)
  87     return true;
  88
  89   if (GET_CODE (target) == ZERO_EXTRACT)
  90     return true;
  91
  92   for (last_insn = insns;
  93        NEXT_INSN (last_insn) != NULL_RTX;
  94        last_insn = NEXT_INSN (last_insn))
  95     ;
  96
  97   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
  98      a value changing in the insn, so the note would be invalid for CSE.  */
  99   if (reg_overlap_mentioned_p (target, op0)
 100       || (op1 && reg_overlap_mentioned_p (target, op1)))
 101     {
 102       if (MEM_P (target)
 103           && (rtx_equal_p (target, op0)
 104               || (op1 && rtx_equal_p (target, op1))))
 105         {
 106           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 107              over expanding it as temp = MEM op X, MEM = temp.  If the target
 108              supports MEM = MEM op X instructions, it is sometimes too hard
 109              to reconstruct that form later, especially if X is also a memory,
 110              and due to multiple occurrences of addresses the address might
 111              be forced into register unnecessarily.
 112              Note that not emitting the REG_EQUIV note might inhibit
 113              CSE in some cases.  */
 114           set = single_set (last_insn);
 115           if (set
 116               && GET_CODE (SET_SRC (set)) == code
 117               && MEM_P (SET_DEST (set))
 118               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 119                   || (op1 && rtx_equal_p (SET_DEST (set),
 120                                           XEXP (SET_SRC (set), 1)))))
 121             return true;
 122         }
 123       return false;
 124     }
 125
 126   set = set_for_reg_notes (last_insn);
 127   if (set == NULL_RTX)
 128     return true;
 129
 130   if (! rtx_equal_p (SET_DEST (set), target)
 131       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 132       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 133           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 134     return true;
 135
 136   if (GET_RTX_CLASS (code) == RTX_UNARY)
 137     switch (code)
 138       {
 139       case FFS:
 140       case CLZ:
 141       case CTZ:
 142       case CLRSB:
 143       case POPCOUNT:
 144       case PARITY:
 145       case BSWAP:
 146         if (op0_mode != VOIDmode && GET_MODE (target) != op0_mode)
 147           {
 148             note = gen_rtx_fmt_e (code, op0_mode, copy_rtx (op0));
 149             if (GET_MODE_UNIT_SIZE (op0_mode)
 150                 > GET_MODE_UNIT_SIZE (GET_MODE (target)))
 151               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 152                                          note, op0_mode);
 153             else
 154               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 155                                          note, op0_mode);
 156             break;
 157           }
 158         /* FALLTHRU */
 159       default:
 160         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 161         break;
 162       }
 163   else
 164     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 165
 166   set_unique_reg_note (last_insn, REG_EQUAL, note);
 167
 168   return true;
 169 }
 170 \f
 171 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 172    for a widening operation would be.  In most cases this would be OP0, but if
 173    that's a constant it'll be VOIDmode, which isn't useful.  */
 174
 175 static machine_mode
 176 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 177 {
 178   machine_mode m0 = GET_MODE (op0);
 179   machine_mode m1 = GET_MODE (op1);
 180   machine_mode result;
 181
 182   if (m0 == VOIDmode && m1 == VOIDmode)
 183     return to_mode;
 184   else if (m0 == VOIDmode || GET_MODE_UNIT_SIZE (m0) < GET_MODE_UNIT_SIZE (m1))
 185     result = m1;
 186   else
 187     result = m0;
 188
 189   if (GET_MODE_UNIT_SIZE (result) > GET_MODE_UNIT_SIZE (to_mode))
 190     return to_mode;
 191
 192   return result;
 193 }
 194 \f
 195 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 196    says whether OP is signed or unsigned.  NO_EXTEND is true if we need
 197    not actually do a sign-extend or zero-extend, but can leave the
 198    higher-order bits of the result rtx undefined, for example, in the case
 199    of logical operations, but not right shifts.  */
 200
 201 static rtx
 202 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 203                int unsignedp, bool no_extend)
 204 {
 205   rtx result;
 206   scalar_int_mode int_mode;
 207
 208   /* If we don't have to extend and this is a constant, return it.  */
 209   if (no_extend && GET_MODE (op) == VOIDmode)
 210     return op;
 211
 212   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 213      extend since it will be more efficient to do so unless the signedness of
 214      a promoted object differs from our extension.  */
 215   if (! no_extend
 216       || !is_a <scalar_int_mode> (mode, &int_mode)
 217       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 218           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 219     return convert_modes (mode, oldmode, op, unsignedp);
 220
 221   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 222      SUBREG.  */
 223   if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
 224     return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));
 225
 226   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 227      part to OP.  */
 228
 229   result = gen_reg_rtx (int_mode);
 230   emit_clobber (result);
 231   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 232   return result;
 233 }
 234 \f
 235 /* Expand vector widening operations.
 236
 237    There are two different classes of operations handled here:
 238    1) Operations whose result is wider than all the arguments to the operation.
 239       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 240       In this case OP0 and optionally OP1 would be initialized,
 241       but WIDE_OP wouldn't (not relevant for this case).
 242    2) Operations whose result is of the same size as the last argument to the
 243       operation, but wider than all the other arguments to the operation.
 244       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 245       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 246
 247    E.g, when called to expand the following operations, this is how
 248    the arguments will be initialized:
 249                                 nops    OP0     OP1     WIDE_OP
 250    widening-sum                 2       oprnd0  -       oprnd1
 251    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 252    widening-mult                2       oprnd0  oprnd1  -
 253    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 254
 255 rtx
 256 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 257                            rtx target, int unsignedp)
 258 {
 259   class expand_operand eops[4];
 260   tree oprnd0, oprnd1, oprnd2;
 261   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 262   optab widen_pattern_optab;
 263   enum insn_code icode;
 264   int nops = TREE_CODE_LENGTH (ops->code);
 265   int op;
 266   bool sbool = false;
 267
 268   oprnd0 = ops->op0;
 269   oprnd1 = nops >= 2 ? ops->op1 : NULL_TREE;
 270   oprnd2 = nops >= 3 ? ops->op2 : NULL_TREE;
 271
 272   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 273   if (ops->code == VEC_UNPACK_FIX_TRUNC_HI_EXPR
 274       || ops->code == VEC_UNPACK_FIX_TRUNC_LO_EXPR)
 275     /* The sign is from the result type rather than operand's type
 276        for these ops.  */
 277     widen_pattern_optab
 278       = optab_for_tree_code (ops->code, ops->type, optab_default);
 279   else if ((ops->code == VEC_UNPACK_HI_EXPR
 280             || ops->code == VEC_UNPACK_LO_EXPR)
 281            && VECTOR_BOOLEAN_TYPE_P (ops->type)
 282            && VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (oprnd0))
 283            && TYPE_MODE (ops->type) == TYPE_MODE (TREE_TYPE (oprnd0))
 284            && SCALAR_INT_MODE_P (TYPE_MODE (ops->type)))
 285     {
 286       /* For VEC_UNPACK_{LO,HI}_EXPR if the mode of op0 and result is
 287          the same scalar mode for VECTOR_BOOLEAN_TYPE_P vectors, use
 288          vec_unpacks_sbool_{lo,hi}_optab, so that we can pass in
 289          the pattern number of elements in the wider vector.  */
 290       widen_pattern_optab
 291         = (ops->code == VEC_UNPACK_HI_EXPR
 292            ? vec_unpacks_sbool_hi_optab : vec_unpacks_sbool_lo_optab);
 293       sbool = true;
 294     }
 295   else if (ops->code == DOT_PROD_EXPR)
 296     {
 297       enum optab_subtype subtype = optab_default;
 298       signop sign1 = TYPE_SIGN (TREE_TYPE (oprnd0));
 299       signop sign2 = TYPE_SIGN (TREE_TYPE (oprnd1));
 300       if (sign1 == sign2)
 301         ;
 302       else if (sign1 == SIGNED && sign2 == UNSIGNED)
 303         {
 304           subtype = optab_vector_mixed_sign;
 305           /* Same as optab_vector_mixed_sign but flip the operands.  */
 306           std::swap (op0, op1);
 307         }
 308       else if (sign1 == UNSIGNED && sign2 == SIGNED)
 309         subtype = optab_vector_mixed_sign;
 310       else
 311         gcc_unreachable ();
 312
 313       widen_pattern_optab
 314         = optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), subtype);
 315     }
 316   else
 317     widen_pattern_optab
 318       = optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 319   if (ops->code == WIDEN_MULT_PLUS_EXPR
 320       || ops->code == WIDEN_MULT_MINUS_EXPR)
 321     icode = find_widening_optab_handler (widen_pattern_optab,
 322                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 323                                          tmode0);
 324   else
 325     icode = optab_handler (widen_pattern_optab, tmode0);
 326   gcc_assert (icode != CODE_FOR_nothing);
 327
 328   if (nops >= 2)
 329     tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 330   else if (sbool)
 331     {
 332       nops = 2;
 333       op1 = GEN_INT (TYPE_VECTOR_SUBPARTS (TREE_TYPE (oprnd0)).to_constant ());
 334       tmode1 = tmode0;
 335     }
 336
 337   /* The last operand is of a wider mode than the rest of the operands.  */
 338   if (nops == 2)
 339     wmode = tmode1;
 340   else if (nops == 3)
 341     {
 342       gcc_assert (tmode1 == tmode0);
 343       gcc_assert (op1);
 344       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 345     }
 346
 347   op = 0;
 348   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 349   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 350   if (op1)
 351     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 352   if (wide_op)
 353     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 354   expand_insn (icode, op, eops);
 355   return eops[0].value;
 356 }
 357
 358 /* Generate code to perform an operation specified by TERNARY_OPTAB
 359    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 360
 361    UNSIGNEDP is for the case where we have to widen the operands
 362    to perform the operation.  It says to use zero-extension.
 363
 364    If TARGET is nonzero, the value
 365    is generated there, if it is convenient to do so.
 366    In all cases an rtx is returned for the locus of the value;
 367    this may or may not be TARGET.  */
 368
 369 rtx
 370 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 371                    rtx op1, rtx op2, rtx target, int unsignedp)
 372 {
 373   class expand_operand ops[4];
 374   enum insn_code icode = optab_handler (ternary_optab, mode);
 375
 376   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 377
 378   create_output_operand (&ops[0], target, mode);
 379   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 380   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 381   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 382   expand_insn (icode, 4, ops);
 383   return ops[0].value;
 384 }
 385
 386
 387 /* Like expand_binop, but return a constant rtx if the result can be
 388    calculated at compile time.  The arguments and return value are
 389    otherwise the same as for expand_binop.  */
 390
 391 rtx
 392 simplify_expand_binop (machine_mode mode, optab binoptab,
 393                        rtx op0, rtx op1, rtx target, int unsignedp,
 394                        enum optab_methods methods)
 395 {
 396   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 397     {
 398       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 399                                          mode, op0, op1);
 400       if (x)
 401         return x;
 402     }
 403
 404   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 405 }
 406
 407 /* Like simplify_expand_binop, but always put the result in TARGET.
 408    Return true if the expansion succeeded.  */
 409
 410 bool
 411 force_expand_binop (machine_mode mode, optab binoptab,
 412                     rtx op0, rtx op1, rtx target, int unsignedp,
 413                     enum optab_methods methods)
 414 {
 415   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 416                                  target, unsignedp, methods);
 417   if (x == 0)
 418     return false;
 419   if (x != target)
 420     emit_move_insn (target, x);
 421   return true;
 422 }
 423
 424 /* Create a new vector value in VMODE with all elements set to OP.  The
 425    mode of OP must be the element mode of VMODE.  If OP is a constant,
 426    then the return value will be a constant.  */
 427
 428 rtx
 429 expand_vector_broadcast (machine_mode vmode, rtx op)
 430 {
 431   int n;
 432   rtvec vec;
 433
 434   gcc_checking_assert (VECTOR_MODE_P (vmode));
 435
 436   if (valid_for_const_vector_p (vmode, op))
 437     return gen_const_vec_duplicate (vmode, op);
 438
 439   insn_code icode = optab_handler (vec_duplicate_optab, vmode);
 440   if (icode != CODE_FOR_nothing)
 441     {
 442       class expand_operand ops[2];
 443       create_output_operand (&ops[0], NULL_RTX, vmode);
 444       create_input_operand (&ops[1], op, GET_MODE (op));
 445       expand_insn (icode, 2, ops);
 446       return ops[0].value;
 447     }
 448
 449   if (!GET_MODE_NUNITS (vmode).is_constant (&n))
 450     return NULL;
 451
 452   /* ??? If the target doesn't have a vec_init, then we have no easy way
 453      of performing this operation.  Most of this sort of generic support
 454      is hidden away in the vector lowering support in gimple.  */
 455   icode = convert_optab_handler (vec_init_optab, vmode,
 456                                  GET_MODE_INNER (vmode));
 457   if (icode == CODE_FOR_nothing)
 458     return NULL;
 459
 460   vec = rtvec_alloc (n);
 461   for (int i = 0; i < n; ++i)
 462     RTVEC_ELT (vec, i) = op;
 463   rtx ret = gen_reg_rtx (vmode);
 464   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 465
 466   return ret;
 467 }
 468
 469 /* This subroutine of expand_doubleword_shift handles the cases in which
 470    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 471    value are the same as for the parent routine, except that SUPERWORD_OP1
 472    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 473    INTO_TARGET may be null if the caller has decided to calculate it.  */
 474
 475 static bool
 476 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 477                         rtx outof_target, rtx into_target,
 478                         int unsignedp, enum optab_methods methods)
 479 {
 480   if (into_target != 0)
 481     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 482                              into_target, unsignedp, methods))
 483       return false;
 484
 485   if (outof_target != 0)
 486     {
 487       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 488          of the sign bit, otherwise we must fill it with zeros.  */
 489       if (binoptab != ashr_optab)
 490         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 491       else
 492         if (!force_expand_binop (word_mode, binoptab, outof_input,
 493                                  gen_int_shift_amount (word_mode,
 494                                                        BITS_PER_WORD - 1),
 495                                  outof_target, unsignedp, methods))
 496           return false;
 497     }
 498   return true;
 499 }
 500
 501 /* This subroutine of expand_doubleword_shift handles the cases in which
 502    the effective shift value is < BITS_PER_WORD.  The arguments and return
 503    value are the same as for the parent routine.  */
 504
 505 static bool
 506 expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
 507                       rtx outof_input, rtx into_input, rtx op1,
 508                       rtx outof_target, rtx into_target,
 509                       int unsignedp, enum optab_methods methods,
 510                       unsigned HOST_WIDE_INT shift_mask)
 511 {
 512   optab reverse_unsigned_shift, unsigned_shift;
 513   rtx tmp, carries;
 514
 515   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 516   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 517
 518   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 519      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 520      the opposite direction to BINOPTAB.  */
 521   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 522     {
 523       carries = outof_input;
 524       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 525                                             op1_mode), op1_mode);
 526       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 527                                    0, true, methods);
 528     }
 529   else
 530     {
 531       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 532          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 533          has unknown behavior.  Do a single shift first, then shift by the
 534          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 535          are truncated to the mode size.  */
 536       carries = expand_binop (word_mode, reverse_unsigned_shift,
 537                               outof_input, const1_rtx, 0, unsignedp, methods);
 538       if (shift_mask == BITS_PER_WORD - 1)
 539         {
 540           tmp = immed_wide_int_const
 541             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 542           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 543                                        0, true, methods);
 544         }
 545       else
 546         {
 547           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 548                                                 op1_mode), op1_mode);
 549           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 550                                        0, true, methods);
 551         }
 552     }
 553   if (tmp == 0 || carries == 0)
 554     return false;
 555   carries = expand_binop (word_mode, reverse_unsigned_shift,
 556                           carries, tmp, 0, unsignedp, methods);
 557   if (carries == 0)
 558     return false;
 559
 560   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 561      so the result can go directly into INTO_TARGET if convenient.  */
 562   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 563                       into_target, unsignedp, methods);
 564   if (tmp == 0)
 565     return false;
 566
 567   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 568   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 569                            into_target, unsignedp, methods))
 570     return false;
 571
 572   /* Use a standard word_mode shift for the out-of half.  */
 573   if (outof_target != 0)
 574     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 575                              outof_target, unsignedp, methods))
 576       return false;
 577
 578   return true;
 579 }
 580
 581
 582 /* Try implementing expand_doubleword_shift using conditional moves.
 583    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 584    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 585    are the shift counts to use in the former and latter case.  All other
 586    arguments are the same as the parent routine.  */
 587
 588 static bool
 589 expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
 590                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 591                                   rtx outof_input, rtx into_input,
 592                                   rtx subword_op1, rtx superword_op1,
 593                                   rtx outof_target, rtx into_target,
 594                                   int unsignedp, enum optab_methods methods,
 595                                   unsigned HOST_WIDE_INT shift_mask)
 596 {
 597   rtx outof_superword, into_superword;
 598
 599   /* Put the superword version of the output into OUTOF_SUPERWORD and
 600      INTO_SUPERWORD.  */
 601   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 602   if (outof_target != 0 && subword_op1 == superword_op1)
 603     {
 604       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 605          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 606       into_superword = outof_target;
 607       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 608                                    outof_superword, 0, unsignedp, methods))
 609         return false;
 610     }
 611   else
 612     {
 613       into_superword = gen_reg_rtx (word_mode);
 614       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 615                                    outof_superword, into_superword,
 616                                    unsignedp, methods))
 617         return false;
 618     }
 619
 620   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 621   if (!expand_subword_shift (op1_mode, binoptab,
 622                              outof_input, into_input, subword_op1,
 623                              outof_target, into_target,
 624                              unsignedp, methods, shift_mask))
 625     return false;
 626
 627   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 628      might be the current value of OUTOF_TARGET.  */
 629   if (!emit_conditional_move (into_target, { cmp_code, cmp1, cmp2, op1_mode },
 630                               into_target, into_superword, word_mode, false))
 631     return false;
 632
 633   if (outof_target != 0)
 634     if (!emit_conditional_move (outof_target,
 635                                 { cmp_code, cmp1, cmp2, op1_mode },
 636                                 outof_target, outof_superword,
 637                                 word_mode, false))
 638       return false;
 639
 640   return true;
 641 }
 642
 643 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 644    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 645    input operand; the shift moves bits in the direction OUTOF_INPUT->
 646    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 647    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 648    If OP1 is constant, it will have been truncated as appropriate
 649    and is known to be nonzero.
 650
 651    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 652    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 653    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 654
 655    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 656    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 657    fill with zeros or sign bits as appropriate.
 658
 659    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 660    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 661    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 662    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 663    are undefined.
 664
 665    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
 666    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
 667    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
 668    function wants to calculate it itself.
 669
 670    Return true if the shift could be successfully synthesized.  */
 671
 672 static bool
 673 expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
 674                          rtx outof_input, rtx into_input, rtx op1,
 675                          rtx outof_target, rtx into_target,
 676                          int unsignedp, enum optab_methods methods,
 677                          unsigned HOST_WIDE_INT shift_mask)
 678 {
 679   rtx superword_op1, tmp, cmp1, cmp2;
 680   enum rtx_code cmp_code;
 681
 682   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
 683      fill the result with sign or zero bits as appropriate.  If so, the value
 684      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
 685      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
 686      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
 687
 688      This isn't worthwhile for constant shifts since the optimizers will
 689      cope better with in-range shift counts.  */
 690   if (shift_mask >= BITS_PER_WORD
 691       && outof_target != 0
 692       && !CONSTANT_P (op1))
 693     {
 694       if (!expand_doubleword_shift (op1_mode, binoptab,
 695                                     outof_input, into_input, op1,
 696                                     0, into_target,
 697                                     unsignedp, methods, shift_mask))
 698         return false;
 699       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 700                                outof_target, unsignedp, methods))
 701         return false;
 702       return true;
 703     }
 704
 705   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
 706      is true when the effective shift value is less than BITS_PER_WORD.
 707      Set SUPERWORD_OP1 to the shift count that should be used to shift
 708      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
 709   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
 710   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
 711     {
 712       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
 713          is a subword shift count.  */
 714       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
 715                                     0, true, methods);
 716       cmp2 = CONST0_RTX (op1_mode);
 717       cmp_code = EQ;
 718       superword_op1 = op1;
 719     }
 720   else
 721     {
 722       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
 723       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
 724                                     0, true, methods);
 725       cmp2 = CONST0_RTX (op1_mode);
 726       cmp_code = LT;
 727       superword_op1 = cmp1;
 728     }
 729   if (cmp1 == 0)
 730     return false;
 731
 732   /* If we can compute the condition at compile time, pick the
 733      appropriate subroutine.  */
 734   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
 735   if (tmp != 0 && CONST_INT_P (tmp))
 736     {
 737       if (tmp == const0_rtx)
 738         return expand_superword_shift (binoptab, outof_input, superword_op1,
 739                                        outof_target, into_target,
 740                                        unsignedp, methods);
 741       else
 742         return expand_subword_shift (op1_mode, binoptab,
 743                                      outof_input, into_input, op1,
 744                                      outof_target, into_target,
 745                                      unsignedp, methods, shift_mask);
 746     }
 747
 748   /* Try using conditional moves to generate straight-line code.  */
 749   if (HAVE_conditional_move)
 750     {
 751       rtx_insn *start = get_last_insn ();
 752       if (expand_doubleword_shift_condmove (op1_mode, binoptab,
 753                                             cmp_code, cmp1, cmp2,
 754                                             outof_input, into_input,
 755                                             op1, superword_op1,
 756                                             outof_target, into_target,
 757                                             unsignedp, methods, shift_mask))
 758         return true;
 759       delete_insns_since (start);
 760     }
 761
 762   /* As a last resort, use branches to select the correct alternative.  */
 763   rtx_code_label *subword_label = gen_label_rtx ();
 764   rtx_code_label *done_label = gen_label_rtx ();
 765
 766   NO_DEFER_POP;
 767   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
 768                            0, 0, subword_label,
 769                            profile_probability::uninitialized ());
 770   OK_DEFER_POP;
 771
 772   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 773                                outof_target, into_target,
 774                                unsignedp, methods))
 775     return false;
 776
 777   emit_jump_insn (targetm.gen_jump (done_label));
 778   emit_barrier ();
 779   emit_label (subword_label);
 780
 781   if (!expand_subword_shift (op1_mode, binoptab,
 782                              outof_input, into_input, op1,
 783                              outof_target, into_target,
 784                              unsignedp, methods, shift_mask))
 785     return false;
 786
 787   emit_label (done_label);
 788   return true;
 789 }
 790 \f
 791 /* Subroutine of expand_binop.  Perform a double word multiplication of
 792    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
 793    as the target's word_mode.  This function return NULL_RTX if anything
 794    goes wrong, in which case it may have already emitted instructions
 795    which need to be deleted.
 796
 797    If we want to multiply two two-word values and have normal and widening
 798    multiplies of single-word values, we can do this with three smaller
 799    multiplications.
 800
 801    The multiplication proceeds as follows:
 802                                  _______________________
 803                                 [__op0_high_|__op0_low__]
 804                                  _______________________
 805         *                       [__op1_high_|__op1_low__]
 806         _______________________________________________
 807                                  _______________________
 808     (1)                         [__op0_low__*__op1_low__]
 809                      _______________________
 810     (2a)            [__op0_low__*__op1_high_]
 811                      _______________________
 812     (2b)            [__op0_high_*__op1_low__]
 813          _______________________
 814     (3) [__op0_high_*__op1_high_]
 815
 816
 817   This gives a 4-word result.  Since we are only interested in the
 818   lower 2 words, partial result (3) and the upper words of (2a) and
 819   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
 820   calculated using non-widening multiplication.
 821
 822   (1), however, needs to be calculated with an unsigned widening
 823   multiplication.  If this operation is not directly supported we
 824   try using a signed widening multiplication and adjust the result.
 825   This adjustment works as follows:
 826
 827       If both operands are positive then no adjustment is needed.
 828
 829       If the operands have different signs, for example op0_low < 0 and
 830       op1_low >= 0, the instruction treats the most significant bit of
 831       op0_low as a sign bit instead of a bit with significance
 832       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
 833       with 2**BITS_PER_WORD - op0_low, and two's complements the
 834       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
 835       the result.
 836
 837       Similarly, if both operands are negative, we need to add
 838       (op0_low + op1_low) * 2**BITS_PER_WORD.
 839
 840       We use a trick to adjust quickly.  We logically shift op0_low right
 841       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
 842       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
 843       logical shift exists, we do an arithmetic right shift and subtract
 844       the 0 or -1.  */
 845
 846 static rtx
 847 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
 848                        bool umulp, enum optab_methods methods)
 849 {
 850   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
 851   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
 852   rtx wordm1 = (umulp ? NULL_RTX
 853                 : gen_int_shift_amount (word_mode, BITS_PER_WORD - 1));
 854   rtx product, adjust, product_high, temp;
 855
 856   rtx op0_high = operand_subword_force (op0, high, mode);
 857   rtx op0_low = operand_subword_force (op0, low, mode);
 858   rtx op1_high = operand_subword_force (op1, high, mode);
 859   rtx op1_low = operand_subword_force (op1, low, mode);
 860
 861   /* If we're using an unsigned multiply to directly compute the product
 862      of the low-order words of the operands and perform any required
 863      adjustments of the operands, we begin by trying two more multiplications
 864      and then computing the appropriate sum.
 865
 866      We have checked above that the required addition is provided.
 867      Full-word addition will normally always succeed, especially if
 868      it is provided at all, so we don't worry about its failure.  The
 869      multiplication may well fail, however, so we do handle that.  */
 870
 871   if (!umulp)
 872     {
 873       /* ??? This could be done with emit_store_flag where available.  */
 874       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
 875                            NULL_RTX, 1, methods);
 876       if (temp)
 877         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
 878                                  NULL_RTX, 0, OPTAB_DIRECT);
 879       else
 880         {
 881           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
 882                                NULL_RTX, 0, methods);
 883           if (!temp)
 884             return NULL_RTX;
 885           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
 886                                    NULL_RTX, 0, OPTAB_DIRECT);
 887         }
 888
 889       if (!op0_high)
 890         return NULL_RTX;
 891     }
 892
 893   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
 894                          NULL_RTX, 0, OPTAB_DIRECT);
 895   if (!adjust)
 896     return NULL_RTX;
 897
 898   /* OP0_HIGH should now be dead.  */
 899
 900   if (!umulp)
 901     {
 902       /* ??? This could be done with emit_store_flag where available.  */
 903       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
 904                            NULL_RTX, 1, methods);
 905       if (temp)
 906         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
 907                                  NULL_RTX, 0, OPTAB_DIRECT);
 908       else
 909         {
 910           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
 911                                NULL_RTX, 0, methods);
 912           if (!temp)
 913             return NULL_RTX;
 914           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
 915                                    NULL_RTX, 0, OPTAB_DIRECT);
 916         }
 917
 918       if (!op1_high)
 919         return NULL_RTX;
 920     }
 921
 922   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
 923                        NULL_RTX, 0, OPTAB_DIRECT);
 924   if (!temp)
 925     return NULL_RTX;
 926
 927   /* OP1_HIGH should now be dead.  */
 928
 929   adjust = expand_binop (word_mode, add_optab, adjust, temp,
 930                          NULL_RTX, 0, OPTAB_DIRECT);
 931
 932   if (target && !REG_P (target))
 933     target = NULL_RTX;
 934
 935   /* *_widen_optab needs to determine operand mode, make sure at least
 936      one operand has non-VOID mode.  */
 937   if (GET_MODE (op0_low) == VOIDmode && GET_MODE (op1_low) == VOIDmode)
 938     op0_low = force_reg (word_mode, op0_low);
 939
 940   if (umulp)
 941     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
 942                             target, 1, OPTAB_DIRECT);
 943   else
 944     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
 945                             target, 1, OPTAB_DIRECT);
 946
 947   if (!product)
 948     return NULL_RTX;
 949
 950   product_high = operand_subword (product, high, 1, mode);
 951   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
 952                          NULL_RTX, 0, OPTAB_DIRECT);
 953   emit_move_insn (product_high, adjust);
 954   return product;
 955 }
 956
 957 /* Subroutine of expand_binop.  Optimize unsigned double-word OP0 % OP1 for
 958    constant OP1.  If for some bit in [BITS_PER_WORD / 2, BITS_PER_WORD] range
 959    (prefer higher bits) ((1w << bit) % OP1) == 1, then the modulo can be
 960    computed in word-mode as ((OP0 & (bit - 1)) + ((OP0 >> bit) & (bit - 1))
 961    + (OP0 >> (2 * bit))) % OP1.  Whether we need to sum 2, 3 or 4 values
 962    depends on the bit value, if 2, then carry from the addition needs to be
 963    added too, i.e. like:
 964    sum += __builtin_add_overflow (low, high, &sum)
 965
 966    Optimize signed double-word OP0 % OP1 similarly, just apply some correction
 967    factor to the sum before doing unsigned remainder, in the form of
 968    sum += (((signed) OP0 >> (2 * BITS_PER_WORD - 1)) & const);
 969    then perform unsigned
 970    remainder = sum % OP1;
 971    and finally
 972    remainder += ((signed) OP0 >> (2 * BITS_PER_WORD - 1)) & (1 - OP1);  */
 973
 974 static rtx
 975 expand_doubleword_mod (machine_mode mode, rtx op0, rtx op1, bool unsignedp)
 976 {
 977   if (INTVAL (op1) <= 1 || (INTVAL (op1) & 1) == 0)
 978     return NULL_RTX;
 979
 980   rtx_insn *last = get_last_insn ();
 981   for (int bit = BITS_PER_WORD; bit >= BITS_PER_WORD / 2; bit--)
 982     {
 983       wide_int w = wi::shifted_mask (bit, 1, false, 2 * BITS_PER_WORD);
 984       if (wi::ne_p (wi::umod_trunc (w, INTVAL (op1)), 1))
 985         continue;
 986       rtx sum = NULL_RTX, mask = NULL_RTX;
 987       if (bit == BITS_PER_WORD)
 988         {
 989           /* For signed modulo we need to add correction to the sum
 990              and that might again overflow.  */
 991           if (!unsignedp)
 992             continue;
 993           if (optab_handler (uaddv4_optab, word_mode) == CODE_FOR_nothing)
 994             continue;
 995           tree wtype = lang_hooks.types.type_for_mode (word_mode, 1);
 996           if (wtype == NULL_TREE)
 997             continue;
 998           tree ctype = build_complex_type (wtype);
 999           if (TYPE_MODE (ctype) != GET_MODE_COMPLEX_MODE (word_mode))
1000             continue;
1001           machine_mode cmode = TYPE_MODE (ctype);
1002           rtx op00 = operand_subword_force (op0, 0, mode);
1003           rtx op01 = operand_subword_force (op0, 1, mode);
1004           rtx cres = gen_rtx_CONCAT (cmode, gen_reg_rtx (word_mode),
1005                                      gen_reg_rtx (word_mode));
1006           tree lhs = make_tree (ctype, cres);
1007           tree arg0 = make_tree (wtype, op00);
1008           tree arg1 = make_tree (wtype, op01);
1009           expand_addsub_overflow (UNKNOWN_LOCATION, PLUS_EXPR, lhs, arg0,
1010                                   arg1, true, true, true, false, NULL);
1011           sum = expand_simple_binop (word_mode, PLUS, XEXP (cres, 0),
1012                                      XEXP (cres, 1), NULL_RTX, 1,
1013                                      OPTAB_DIRECT);
1014           if (sum == NULL_RTX)
1015             return NULL_RTX;
1016         }
1017       else
1018         {
1019           /* Code below uses GEN_INT, so we need the masks to be representable
1020              in HOST_WIDE_INTs.  */
1021           if (bit >= HOST_BITS_PER_WIDE_INT)
1022             continue;
1023           /* If op0 is e.g. -1 or -2 unsigned, then the 2 additions might
1024              overflow.  Consider 64-bit -1ULL for word size 32, if we add
1025              0x7fffffffU + 0x7fffffffU + 3U, it wraps around to 1.  */
1026           if (bit == BITS_PER_WORD - 1)
1027             continue;
1028
1029           int count = (2 * BITS_PER_WORD + bit - 1) / bit;
1030           rtx sum_corr = NULL_RTX;
1031
1032           if (!unsignedp)
1033             {
1034               /* For signed modulo, compute it as unsigned modulo of
1035                  sum with a correction added to it if OP0 is negative,
1036                  such that the result can be computed as unsigned
1037                  remainder + ((OP1 >> (2 * BITS_PER_WORD - 1)) & (1 - OP1).  */
1038               w = wi::min_value (2 * BITS_PER_WORD, SIGNED);
1039               wide_int wmod1 = wi::umod_trunc (w, INTVAL (op1));
1040               wide_int wmod2 = wi::smod_trunc (w, INTVAL (op1));
1041               /* wmod2 == -wmod1.  */
1042               wmod2 = wmod2 + (INTVAL (op1) - 1);
1043               if (wi::ne_p (wmod1, wmod2))
1044                 {
1045                   wide_int wcorr = wmod2 - wmod1;
1046                   if (wi::neg_p (w))
1047                     wcorr = wcorr + INTVAL (op1);
1048                   /* Now verify if the count sums can't overflow, and punt
1049                      if they could.  */
1050                   w = wi::mask (bit, false, 2 * BITS_PER_WORD);
1051                   w = w * (count - 1);
1052                   w = w + wi::mask (2 * BITS_PER_WORD - (count - 1) * bit,
1053                                     false, 2 * BITS_PER_WORD);
1054                   w = w + wcorr;
1055                   w = wi::lrshift (w, BITS_PER_WORD);
1056                   if (wi::ne_p (w, 0))
1057                     continue;
1058
1059                   mask = operand_subword_force (op0, WORDS_BIG_ENDIAN ? 0 : 1,
1060                                                 mode);
1061                   mask = expand_simple_binop (word_mode, ASHIFTRT, mask,
1062                                               GEN_INT (BITS_PER_WORD - 1),
1063                                               NULL_RTX, 0, OPTAB_DIRECT);
1064                   if (mask == NULL_RTX)
1065                     return NULL_RTX;
1066                   sum_corr = immed_wide_int_const (wcorr, word_mode);
1067                   sum_corr = expand_simple_binop (word_mode, AND, mask,
1068                                                   sum_corr, NULL_RTX, 1,
1069                                                   OPTAB_DIRECT);
1070                   if (sum_corr == NULL_RTX)
1071                     return NULL_RTX;
1072                 }
1073             }
1074
1075           for (int i = 0; i < count; i++)
1076             {
1077               rtx v = op0;
1078               if (i)
1079                 v = expand_simple_binop (mode, LSHIFTRT, v, GEN_INT (i * bit),
1080                                          NULL_RTX, 1, OPTAB_DIRECT);
1081               if (v == NULL_RTX)
1082                 return NULL_RTX;
1083               v = lowpart_subreg (word_mode, v, mode);
1084               if (v == NULL_RTX)
1085                 return NULL_RTX;
1086               if (i != count - 1)
1087                 v = expand_simple_binop (word_mode, AND, v,
1088                                          GEN_INT ((HOST_WIDE_INT_1U << bit)
1089                                                   - 1), NULL_RTX, 1,
1090                                          OPTAB_DIRECT);
1091               if (v == NULL_RTX)
1092                 return NULL_RTX;
1093               if (sum == NULL_RTX)
1094                 sum = v;
1095               else
1096                 sum = expand_simple_binop (word_mode, PLUS, sum, v, NULL_RTX,
1097                                            1, OPTAB_DIRECT);
1098               if (sum == NULL_RTX)
1099                 return NULL_RTX;
1100             }
1101           if (sum_corr)
1102             {
1103               sum = expand_simple_binop (word_mode, PLUS, sum, sum_corr,
1104                                          NULL_RTX, 1, OPTAB_DIRECT);
1105               if (sum == NULL_RTX)
1106                 return NULL_RTX;
1107             }
1108         }
1109       rtx remainder = expand_divmod (1, TRUNC_MOD_EXPR, word_mode, sum,
1110                                      gen_int_mode (INTVAL (op1), word_mode),
1111                                      NULL_RTX, 1, OPTAB_DIRECT);
1112       if (remainder == NULL_RTX)
1113         return NULL_RTX;
1114
1115       if (!unsignedp)
1116         {
1117           if (mask == NULL_RTX)
1118             {
1119               mask = operand_subword_force (op0, WORDS_BIG_ENDIAN ? 0 : 1,
1120                                             mode);
1121               mask = expand_simple_binop (word_mode, ASHIFTRT, mask,
1122                                           GEN_INT (BITS_PER_WORD - 1),
1123                                           NULL_RTX, 0, OPTAB_DIRECT);
1124               if (mask == NULL_RTX)
1125                 return NULL_RTX;
1126             }
1127           mask = expand_simple_binop (word_mode, AND, mask,
1128                                       gen_int_mode (1 - INTVAL (op1),
1129                                                     word_mode),
1130                                       NULL_RTX, 1, OPTAB_DIRECT);
1131           if (mask == NULL_RTX)
1132             return NULL_RTX;
1133           remainder = expand_simple_binop (word_mode, PLUS, remainder,
1134                                            mask, NULL_RTX, 1, OPTAB_DIRECT);
1135           if (remainder == NULL_RTX)
1136             return NULL_RTX;
1137         }
1138
1139       remainder = convert_modes (mode, word_mode, remainder, unsignedp);
1140       /* Punt if we need any library calls.  */
1141       if (last)
1142         last = NEXT_INSN (last);
1143       else
1144         last = get_insns ();
1145       for (; last; last = NEXT_INSN (last))
1146         if (CALL_P (last))
1147           return NULL_RTX;
1148       return remainder;
1149     }
1150   return NULL_RTX;
1151 }
1152
1153 /* Similarly to the above function, but compute both quotient and remainder.
1154    Quotient can be computed from the remainder as:
1155    rem = op0 % op1;  // Handled using expand_doubleword_mod
1156    quot = (op0 - rem) * inv; // inv is multiplicative inverse of op1 modulo
1157                              // 2 * BITS_PER_WORD
1158
1159    We can also handle cases where op1 is a multiple of power of two constant
1160    and constant handled by expand_doubleword_mod.
1161    op11 = 1 << __builtin_ctz (op1);
1162    op12 = op1 / op11;
1163    rem1 = op0 % op12;  // Handled using expand_doubleword_mod
1164    quot1 = (op0 - rem1) * inv; // inv is multiplicative inverse of op12 modulo
1165                                // 2 * BITS_PER_WORD
1166    rem = (quot1 % op11) * op12 + rem1;
1167    quot = quot1 / op11;  */
1168
1169 rtx
1170 expand_doubleword_divmod (machine_mode mode, rtx op0, rtx op1, rtx *rem,
1171                           bool unsignedp)
1172 {
1173   *rem = NULL_RTX;
1174
1175   /* Negative dividend should have been optimized into positive,
1176      similarly modulo by 1 and modulo by power of two is optimized
1177      differently too.  */
1178   if (INTVAL (op1) <= 1 || pow2p_hwi (INTVAL (op1)))
1179     return NULL_RTX;
1180
1181   rtx op11 = const1_rtx;
1182   rtx op12 = op1;
1183   if ((INTVAL (op1) & 1) == 0)
1184     {
1185       int bit = ctz_hwi (INTVAL (op1));
1186       op11 = GEN_INT (HOST_WIDE_INT_1 << bit);
1187       op12 = GEN_INT (INTVAL (op1) >> bit);
1188     }
1189
1190   rtx rem1 = expand_doubleword_mod (mode, op0, op12, unsignedp);
1191   if (rem1 == NULL_RTX)
1192     return NULL_RTX;
1193
1194   int prec = 2 * BITS_PER_WORD;
1195   wide_int a = wide_int::from (INTVAL (op12), prec + 1, UNSIGNED);
1196   wide_int b = wi::shifted_mask (prec, 1, false, prec + 1);
1197   wide_int m = wide_int::from (wi::mod_inv (a, b), prec, UNSIGNED);
1198   rtx inv = immed_wide_int_const (m, mode);
1199
1200   rtx_insn *last = get_last_insn ();
1201   rtx quot1 = expand_simple_binop (mode, MINUS, op0, rem1,
1202                                    NULL_RTX, unsignedp, OPTAB_DIRECT);
1203   if (quot1 == NULL_RTX)
1204     return NULL_RTX;
1205
1206   quot1 = expand_simple_binop (mode, MULT, quot1, inv,
1207                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1208   if (quot1 == NULL_RTX)
1209     return NULL_RTX;
1210
1211   if (op11 != const1_rtx)
1212     {
1213       rtx rem2 = expand_divmod (1, TRUNC_MOD_EXPR, mode, quot1, op11,
1214                                 NULL_RTX, unsignedp, OPTAB_DIRECT);
1215       if (rem2 == NULL_RTX)
1216         return NULL_RTX;
1217
1218       rem2 = expand_simple_binop (mode, MULT, rem2, op12, NULL_RTX,
1219                                   unsignedp, OPTAB_DIRECT);
1220       if (rem2 == NULL_RTX)
1221         return NULL_RTX;
1222
1223       rem2 = expand_simple_binop (mode, PLUS, rem2, rem1, NULL_RTX,
1224                                   unsignedp, OPTAB_DIRECT);
1225       if (rem2 == NULL_RTX)
1226         return NULL_RTX;
1227
1228       rtx quot2 = expand_divmod (0, TRUNC_DIV_EXPR, mode, quot1, op11,
1229                                  NULL_RTX, unsignedp, OPTAB_DIRECT);
1230       if (quot2 == NULL_RTX)
1231         return NULL_RTX;
1232
1233       rem1 = rem2;
1234       quot1 = quot2;
1235     }
1236
1237   /* Punt if we need any library calls.  */
1238   if (last)
1239     last = NEXT_INSN (last);
1240   else
1241     last = get_insns ();
1242   for (; last; last = NEXT_INSN (last))
1243     if (CALL_P (last))
1244       return NULL_RTX;
1245
1246   *rem = rem1;
1247   return quot1;
1248 }
1249 \f
1250 /* Wrapper around expand_binop which takes an rtx code to specify
1251    the operation to perform, not an optab pointer.  All other
1252    arguments are the same.  */
1253 rtx
1254 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
1255                      rtx op1, rtx target, int unsignedp,
1256                      enum optab_methods methods)
1257 {
1258   optab binop = code_to_optab (code);
1259   gcc_assert (binop);
1260
1261   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1262 }
1263
1264 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1265    binop.  Order them according to commutative_operand_precedence and, if
1266    possible, try to put TARGET or a pseudo first.  */
1267 static bool
1268 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1269 {
1270   int op0_prec = commutative_operand_precedence (op0);
1271   int op1_prec = commutative_operand_precedence (op1);
1272
1273   if (op0_prec < op1_prec)
1274     return true;
1275
1276   if (op0_prec > op1_prec)
1277     return false;
1278
1279   /* With equal precedence, both orders are ok, but it is better if the
1280      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1281   if (target == 0 || REG_P (target))
1282     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1283   else
1284     return rtx_equal_p (op1, target);
1285 }
1286
1287 /* Return true if BINOPTAB implements a shift operation.  */
1288
1289 static bool
1290 shift_optab_p (optab binoptab)
1291 {
1292   switch (optab_to_code (binoptab))
1293     {
1294     case ASHIFT:
1295     case SS_ASHIFT:
1296     case US_ASHIFT:
1297     case ASHIFTRT:
1298     case LSHIFTRT:
1299     case ROTATE:
1300     case ROTATERT:
1301       return true;
1302
1303     default:
1304       return false;
1305     }
1306 }
1307
1308 /* Return true if BINOPTAB implements a commutative binary operation.  */
1309
1310 static bool
1311 commutative_optab_p (optab binoptab)
1312 {
1313   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1314           || binoptab == smul_widen_optab
1315           || binoptab == umul_widen_optab
1316           || binoptab == smul_highpart_optab
1317           || binoptab == umul_highpart_optab
1318           || binoptab == vec_widen_sadd_optab
1319           || binoptab == vec_widen_uadd_optab
1320           || binoptab == vec_widen_sadd_hi_optab
1321           || binoptab == vec_widen_sadd_lo_optab
1322           || binoptab == vec_widen_uadd_hi_optab
1323           || binoptab == vec_widen_uadd_lo_optab
1324           || binoptab == vec_widen_sadd_even_optab
1325           || binoptab == vec_widen_sadd_odd_optab
1326           || binoptab == vec_widen_uadd_even_optab
1327           || binoptab == vec_widen_uadd_odd_optab);
1328 }
1329
1330 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1331    optimizing, and if the operand is a constant that costs more than
1332    1 instruction, force the constant into a register and return that
1333    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1334
1335 static rtx
1336 avoid_expensive_constant (machine_mode mode, optab binoptab,
1337                           int opn, rtx x, bool unsignedp)
1338 {
1339   bool speed = optimize_insn_for_speed_p ();
1340
1341   if (mode != VOIDmode
1342       && optimize
1343       && CONSTANT_P (x)
1344       && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
1345           > set_src_cost (x, mode, speed)))
1346     {
1347       if (CONST_INT_P (x))
1348         {
1349           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1350           if (intval != INTVAL (x))
1351             x = GEN_INT (intval);
1352         }
1353       else
1354         x = convert_modes (mode, VOIDmode, x, unsignedp);
1355       x = force_reg (mode, x);
1356     }
1357   return x;
1358 }
1359
1360 /* Helper function for expand_binop: handle the case where there
1361    is an insn ICODE that directly implements the indicated operation.
1362    Returns null if this is not possible.  */
1363 static rtx
1364 expand_binop_directly (enum insn_code icode, machine_mode mode, optab binoptab,
1365                        rtx op0, rtx op1,
1366                        rtx target, int unsignedp, enum optab_methods methods,
1367                        rtx_insn *last)
1368 {
1369   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1370   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1371   machine_mode mode0, mode1, tmp_mode;
1372   class expand_operand ops[3];
1373   bool commutative_p;
1374   rtx_insn *pat;
1375   rtx xop0 = op0, xop1 = op1;
1376   bool canonicalize_op1 = false;
1377
1378   /* If it is a commutative operator and the modes would match
1379      if we would swap the operands, we can save the conversions.  */
1380   commutative_p = commutative_optab_p (binoptab);
1381   if (commutative_p
1382       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1383       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
1384     std::swap (xop0, xop1);
1385
1386   /* If we are optimizing, force expensive constants into a register.  */
1387   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1388   if (!shift_optab_p (binoptab))
1389     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1390   else
1391     /* Shifts and rotates often use a different mode for op1 from op0;
1392        for VOIDmode constants we don't know the mode, so force it
1393        to be canonicalized using convert_modes.  */
1394     canonicalize_op1 = true;
1395
1396   /* In case the insn wants input operands in modes different from
1397      those of the actual operands, convert the operands.  It would
1398      seem that we don't need to convert CONST_INTs, but we do, so
1399      that they're properly zero-extended, sign-extended or truncated
1400      for their mode.  */
1401
1402   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1403   if (xmode0 != VOIDmode && xmode0 != mode0)
1404     {
1405       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1406       mode0 = xmode0;
1407     }
1408
1409   mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
1410            ? GET_MODE (xop1) : mode);
1411   if (xmode1 != VOIDmode && xmode1 != mode1)
1412     {
1413       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1414       mode1 = xmode1;
1415     }
1416
1417   /* If operation is commutative,
1418      try to make the first operand a register.
1419      Even better, try to make it the same as the target.
1420      Also try to make the last operand a constant.  */
1421   if (commutative_p
1422       && swap_commutative_operands_with_target (target, xop0, xop1))
1423     std::swap (xop0, xop1);
1424
1425   /* Now, if insn's predicates don't allow our operands, put them into
1426      pseudo regs.  */
1427
1428   if (binoptab == vec_pack_trunc_optab
1429       || binoptab == vec_pack_usat_optab
1430       || binoptab == vec_pack_ssat_optab
1431       || binoptab == vec_pack_ufix_trunc_optab
1432       || binoptab == vec_pack_sfix_trunc_optab
1433       || binoptab == vec_packu_float_optab
1434       || binoptab == vec_packs_float_optab)
1435     {
1436       /* The mode of the result is different then the mode of the
1437          arguments.  */
1438       tmp_mode = insn_data[(int) icode].operand[0].mode;
1439       if (VECTOR_MODE_P (mode)
1440           && maybe_ne (GET_MODE_NUNITS (tmp_mode), 2 * GET_MODE_NUNITS (mode)))
1441         {
1442           delete_insns_since (last);
1443           return NULL_RTX;
1444         }
1445     }
1446   else
1447     tmp_mode = mode;
1448
1449   create_output_operand (&ops[0], target, tmp_mode);
1450   create_input_operand (&ops[1], xop0, mode0);
1451   create_input_operand (&ops[2], xop1, mode1);
1452   pat = maybe_gen_insn (icode, 3, ops);
1453   if (pat)
1454     {
1455       /* If PAT is composed of more than one insn, try to add an appropriate
1456          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1457          operand, call expand_binop again, this time without a target.  */
1458       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1459           && ! add_equal_note (pat, ops[0].value,
1460                                optab_to_code (binoptab),
1461                                ops[1].value, ops[2].value, mode0))
1462         {
1463           delete_insns_since (last);
1464           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1465                                unsignedp, methods);
1466         }
1467
1468       emit_insn (pat);
1469       return ops[0].value;
1470     }
1471   delete_insns_since (last);
1472   return NULL_RTX;
1473 }
1474
1475 /* Generate code to perform an operation specified by BINOPTAB
1476    on operands OP0 and OP1, with result having machine-mode MODE.
1477
1478    UNSIGNEDP is for the case where we have to widen the operands
1479    to perform the operation.  It says to use zero-extension.
1480
1481    If TARGET is nonzero, the value
1482    is generated there, if it is convenient to do so.
1483    In all cases an rtx is returned for the locus of the value;
1484    this may or may not be TARGET.  */
1485
1486 rtx
1487 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1488               rtx target, int unsignedp, enum optab_methods methods)
1489 {
1490   enum optab_methods next_methods
1491     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1492        ? OPTAB_WIDEN : methods);
1493   enum mode_class mclass;
1494   enum insn_code icode;
1495   machine_mode wider_mode;
1496   scalar_int_mode int_mode;
1497   rtx libfunc;
1498   rtx temp;
1499   rtx_insn *entry_last = get_last_insn ();
1500   rtx_insn *last;
1501
1502   mclass = GET_MODE_CLASS (mode);
1503
1504   /* If subtracting an integer constant, convert this into an addition of
1505      the negated constant.  */
1506
1507   if (binoptab == sub_optab && CONST_INT_P (op1))
1508     {
1509       op1 = negate_rtx (mode, op1);
1510       binoptab = add_optab;
1511     }
1512   /* For shifts, constant invalid op1 might be expanded from different
1513      mode than MODE.  As those are invalid, force them to a register
1514      to avoid further problems during expansion.  */
1515   else if (CONST_INT_P (op1)
1516            && shift_optab_p (binoptab)
1517            && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
1518     {
1519       op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
1520       op1 = force_reg (GET_MODE_INNER (mode), op1);
1521     }
1522
1523   /* Record where to delete back to if we backtrack.  */
1524   last = get_last_insn ();
1525
1526   /* If we can do it with a three-operand insn, do so.  */
1527
1528   if (methods != OPTAB_MUST_WIDEN)
1529     {
1530       if (convert_optab_p (binoptab))
1531         {
1532           machine_mode from_mode = widened_mode (mode, op0, op1);
1533           icode = find_widening_optab_handler (binoptab, mode, from_mode);
1534         }
1535       else
1536         icode = optab_handler (binoptab, mode);
1537       if (icode != CODE_FOR_nothing)
1538         {
1539           temp = expand_binop_directly (icode, mode, binoptab, op0, op1,
1540                                         target, unsignedp, methods, last);
1541           if (temp)
1542             return temp;
1543         }
1544     }
1545
1546   /* If we were trying to rotate, and that didn't work, try rotating
1547      the other direction before falling back to shifts and bitwise-or.  */
1548   if (((binoptab == rotl_optab
1549         && (icode = optab_handler (rotr_optab, mode)) != CODE_FOR_nothing)
1550        || (binoptab == rotr_optab
1551            && (icode = optab_handler (rotl_optab, mode)) != CODE_FOR_nothing))
1552       && is_int_mode (mode, &int_mode))
1553     {
1554       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1555       rtx newop1;
1556       unsigned int bits = GET_MODE_PRECISION (int_mode);
1557
1558       if (CONST_INT_P (op1))
1559         newop1 = gen_int_shift_amount (int_mode, bits - INTVAL (op1));
1560       else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
1561         newop1 = negate_rtx (GET_MODE (op1), op1);
1562       else
1563         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1564                                gen_int_mode (bits, GET_MODE (op1)), op1,
1565                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1566
1567       temp = expand_binop_directly (icode, int_mode, otheroptab, op0, newop1,
1568                                     target, unsignedp, methods, last);
1569       if (temp)
1570         return temp;
1571     }
1572
1573   /* If this is a multiply, see if we can do a widening operation that
1574      takes operands of this mode and makes a wider mode.  */
1575
1576   if (binoptab == smul_optab
1577       && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
1578       && (convert_optab_handler ((unsignedp
1579                                   ? umul_widen_optab
1580                                   : smul_widen_optab),
1581                                  wider_mode, mode) != CODE_FOR_nothing))
1582     {
1583       /* *_widen_optab needs to determine operand mode, make sure at least
1584          one operand has non-VOID mode.  */
1585       if (GET_MODE (op0) == VOIDmode && GET_MODE (op1) == VOIDmode)
1586         op0 = force_reg (mode, op0);
1587       temp = expand_binop (wider_mode,
1588                            unsignedp ? umul_widen_optab : smul_widen_optab,
1589                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1590
1591       if (temp != 0)
1592         {
1593           if (GET_MODE_CLASS (mode) == MODE_INT
1594               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1595             return gen_lowpart (mode, temp);
1596           else
1597             return convert_to_mode (mode, temp, unsignedp);
1598         }
1599     }
1600
1601   /* If this is a vector shift by a scalar, see if we can do a vector
1602      shift by a vector.  If so, broadcast the scalar into a vector.  */
1603   if (mclass == MODE_VECTOR_INT)
1604     {
1605       optab otheroptab = unknown_optab;
1606
1607       if (binoptab == ashl_optab)
1608         otheroptab = vashl_optab;
1609       else if (binoptab == ashr_optab)
1610         otheroptab = vashr_optab;
1611       else if (binoptab == lshr_optab)
1612         otheroptab = vlshr_optab;
1613       else if (binoptab == rotl_optab)
1614         otheroptab = vrotl_optab;
1615       else if (binoptab == rotr_optab)
1616         otheroptab = vrotr_optab;
1617
1618       if (otheroptab
1619           && (icode = optab_handler (otheroptab, mode)) != CODE_FOR_nothing)
1620         {
1621           /* The scalar may have been extended to be too wide.  Truncate
1622              it back to the proper size to fit in the broadcast vector.  */
1623           scalar_mode inner_mode = GET_MODE_INNER (mode);
1624           if (!CONST_INT_P (op1)
1625               && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
1626                   > GET_MODE_BITSIZE (inner_mode)))
1627             op1 = force_reg (inner_mode,
1628                              simplify_gen_unary (TRUNCATE, inner_mode, op1,
1629                                                  GET_MODE (op1)));
1630           rtx vop1 = expand_vector_broadcast (mode, op1);
1631           if (vop1)
1632             {
1633               temp = expand_binop_directly (icode, mode, otheroptab, op0, vop1,
1634                                             target, unsignedp, methods, last);
1635               if (temp)
1636                 return temp;
1637             }
1638         }
1639     }
1640
1641   /* Look for a wider mode of the same class for which we think we
1642      can open-code the operation.  Check for a widening multiply at the
1643      wider mode as well.  */
1644
1645   if (CLASS_HAS_WIDER_MODES_P (mclass)
1646       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1647     FOR_EACH_WIDER_MODE (wider_mode, mode)
1648       {
1649         machine_mode next_mode;
1650         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1651             || (binoptab == smul_optab
1652                 && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
1653                 && (find_widening_optab_handler ((unsignedp
1654                                                   ? umul_widen_optab
1655                                                   : smul_widen_optab),
1656                                                  next_mode, mode)
1657                     != CODE_FOR_nothing)))
1658           {
1659             rtx xop0 = op0, xop1 = op1;
1660             bool no_extend = false;
1661
1662             /* For certain integer operations, we need not actually extend
1663                the narrow operands, as long as we will truncate
1664                the results to the same narrowness.  */
1665
1666             if ((binoptab == ior_optab || binoptab == and_optab
1667                  || binoptab == xor_optab
1668                  || binoptab == add_optab || binoptab == sub_optab
1669                  || binoptab == smul_optab || binoptab == ashl_optab)
1670                 && mclass == MODE_INT)
1671               {
1672                 no_extend = true;
1673                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1674                                                  xop0, unsignedp);
1675                 if (binoptab != ashl_optab)
1676                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1677                                                    xop1, unsignedp);
1678               }
1679
1680             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1681
1682             /* The second operand of a shift must always be extended.  */
1683             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1684                                   no_extend && binoptab != ashl_optab);
1685
1686             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1687                                  unsignedp, OPTAB_DIRECT);
1688             if (temp)
1689               {
1690                 if (mclass != MODE_INT
1691                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1692                   {
1693                     if (target == 0)
1694                       target = gen_reg_rtx (mode);
1695                     convert_move (target, temp, 0);
1696                     return target;
1697                   }
1698                 else
1699                   return gen_lowpart (mode, temp);
1700               }
1701             else
1702               delete_insns_since (last);
1703           }
1704       }
1705
1706   /* If operation is commutative,
1707      try to make the first operand a register.
1708      Even better, try to make it the same as the target.
1709      Also try to make the last operand a constant.  */
1710   if (commutative_optab_p (binoptab)
1711       && swap_commutative_operands_with_target (target, op0, op1))
1712     std::swap (op0, op1);
1713
1714   /* These can be done a word at a time.  */
1715   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1716       && is_int_mode (mode, &int_mode)
1717       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
1718       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1719     {
1720       int i;
1721       rtx_insn *insns;
1722
1723       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1724          won't be accurate, so use a new target.  */
1725       if (target == 0
1726           || target == op0
1727           || target == op1
1728           || reg_overlap_mentioned_p (target, op0)
1729           || reg_overlap_mentioned_p (target, op1)
1730           || !valid_multiword_target_p (target))
1731         target = gen_reg_rtx (int_mode);
1732
1733       start_sequence ();
1734
1735       /* Do the actual arithmetic.  */
1736       machine_mode op0_mode = GET_MODE (op0);
1737       machine_mode op1_mode = GET_MODE (op1);
1738       if (op0_mode == VOIDmode)
1739         op0_mode = int_mode;
1740       if (op1_mode == VOIDmode)
1741         op1_mode = int_mode;
1742       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
1743         {
1744           rtx target_piece = operand_subword (target, i, 1, int_mode);
1745           rtx x = expand_binop (word_mode, binoptab,
1746                                 operand_subword_force (op0, i, op0_mode),
1747                                 operand_subword_force (op1, i, op1_mode),
1748                                 target_piece, unsignedp, next_methods);
1749
1750           if (x == 0)
1751             break;
1752
1753           if (target_piece != x)
1754             emit_move_insn (target_piece, x);
1755         }
1756
1757       insns = get_insns ();
1758       end_sequence ();
1759
1760       if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
1761         {
1762           emit_insn (insns);
1763           return target;
1764         }
1765     }
1766
1767   /* Synthesize double word shifts from single word shifts.  */
1768   if ((binoptab == lshr_optab || binoptab == ashl_optab
1769        || binoptab == ashr_optab)
1770       && is_int_mode (mode, &int_mode)
1771       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1772       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1773       && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
1774       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1775       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1776       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1777     {
1778       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1779       scalar_int_mode op1_mode;
1780
1781       double_shift_mask = targetm.shift_truncation_mask (int_mode);
1782       shift_mask = targetm.shift_truncation_mask (word_mode);
1783       op1_mode = (GET_MODE (op1) != VOIDmode
1784                   ? as_a <scalar_int_mode> (GET_MODE (op1))
1785                   : word_mode);
1786
1787       /* Apply the truncation to constant shifts.  */
1788       if (double_shift_mask > 0 && CONST_INT_P (op1))
1789         op1 = gen_int_mode (INTVAL (op1) & double_shift_mask, op1_mode);
1790
1791       if (op1 == CONST0_RTX (op1_mode))
1792         return op0;
1793
1794       /* Make sure that this is a combination that expand_doubleword_shift
1795          can handle.  See the comments there for details.  */
1796       if (double_shift_mask == 0
1797           || (shift_mask == BITS_PER_WORD - 1
1798               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1799         {
1800           rtx_insn *insns;
1801           rtx into_target, outof_target;
1802           rtx into_input, outof_input;
1803           int left_shift, outof_word;
1804
1805           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1806              won't be accurate, so use a new target.  */
1807           if (target == 0
1808               || target == op0
1809               || target == op1
1810               || reg_overlap_mentioned_p (target, op0)
1811               || reg_overlap_mentioned_p (target, op1)
1812               || !valid_multiword_target_p (target))
1813             target = gen_reg_rtx (int_mode);
1814
1815           start_sequence ();
1816
1817           /* OUTOF_* is the word we are shifting bits away from, and
1818              INTO_* is the word that we are shifting bits towards, thus
1819              they differ depending on the direction of the shift and
1820              WORDS_BIG_ENDIAN.  */
1821
1822           left_shift = binoptab == ashl_optab;
1823           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1824
1825           outof_target = operand_subword (target, outof_word, 1, int_mode);
1826           into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1827
1828           outof_input = operand_subword_force (op0, outof_word, int_mode);
1829           into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1830
1831           if (expand_doubleword_shift (op1_mode, binoptab,
1832                                        outof_input, into_input, op1,
1833                                        outof_target, into_target,
1834                                        unsignedp, next_methods, shift_mask))
1835             {
1836               insns = get_insns ();
1837               end_sequence ();
1838
1839               emit_insn (insns);
1840               return target;
1841             }
1842           end_sequence ();
1843         }
1844     }
1845
1846   /* Synthesize double word rotates from single word shifts.  */
1847   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1848       && is_int_mode (mode, &int_mode)
1849       && CONST_INT_P (op1)
1850       && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
1851       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1852       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1853     {
1854       rtx_insn *insns;
1855       rtx into_target, outof_target;
1856       rtx into_input, outof_input;
1857       rtx inter;
1858       int shift_count, left_shift, outof_word;
1859
1860       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1861          won't be accurate, so use a new target. Do this also if target is not
1862          a REG, first because having a register instead may open optimization
1863          opportunities, and second because if target and op0 happen to be MEMs
1864          designating the same location, we would risk clobbering it too early
1865          in the code sequence we generate below.  */
1866       if (target == 0
1867           || target == op0
1868           || target == op1
1869           || !REG_P (target)
1870           || reg_overlap_mentioned_p (target, op0)
1871           || reg_overlap_mentioned_p (target, op1)
1872           || !valid_multiword_target_p (target))
1873         target = gen_reg_rtx (int_mode);
1874
1875       start_sequence ();
1876
1877       shift_count = INTVAL (op1);
1878
1879       /* OUTOF_* is the word we are shifting bits away from, and
1880          INTO_* is the word that we are shifting bits towards, thus
1881          they differ depending on the direction of the shift and
1882          WORDS_BIG_ENDIAN.  */
1883
1884       left_shift = (binoptab == rotl_optab);
1885       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1886
1887       outof_target = operand_subword (target, outof_word, 1, int_mode);
1888       into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1889
1890       outof_input = operand_subword_force (op0, outof_word, int_mode);
1891       into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1892
1893       if (shift_count == BITS_PER_WORD)
1894         {
1895           /* This is just a word swap.  */
1896           emit_move_insn (outof_target, into_input);
1897           emit_move_insn (into_target, outof_input);
1898           inter = const0_rtx;
1899         }
1900       else
1901         {
1902           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1903           HOST_WIDE_INT first_shift_count, second_shift_count;
1904           optab reverse_unsigned_shift, unsigned_shift;
1905
1906           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1907                                     ? lshr_optab : ashl_optab);
1908
1909           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1910                             ? ashl_optab : lshr_optab);
1911
1912           if (shift_count > BITS_PER_WORD)
1913             {
1914               first_shift_count = shift_count - BITS_PER_WORD;
1915               second_shift_count = 2 * BITS_PER_WORD - shift_count;
1916             }
1917           else
1918             {
1919               first_shift_count = BITS_PER_WORD - shift_count;
1920               second_shift_count = shift_count;
1921             }
1922           rtx first_shift_count_rtx
1923             = gen_int_shift_amount (word_mode, first_shift_count);
1924           rtx second_shift_count_rtx
1925             = gen_int_shift_amount (word_mode, second_shift_count);
1926
1927           into_temp1 = expand_binop (word_mode, unsigned_shift,
1928                                      outof_input, first_shift_count_rtx,
1929                                      NULL_RTX, unsignedp, next_methods);
1930           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1931                                      into_input, second_shift_count_rtx,
1932                                      NULL_RTX, unsignedp, next_methods);
1933
1934           if (into_temp1 != 0 && into_temp2 != 0)
1935             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1936                                   into_target, unsignedp, next_methods);
1937           else
1938             inter = 0;
1939
1940           if (inter != 0 && inter != into_target)
1941             emit_move_insn (into_target, inter);
1942
1943           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1944                                       into_input, first_shift_count_rtx,
1945                                       NULL_RTX, unsignedp, next_methods);
1946           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1947                                       outof_input, second_shift_count_rtx,
1948                                       NULL_RTX, unsignedp, next_methods);
1949
1950           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1951             inter = expand_binop (word_mode, ior_optab,
1952                                   outof_temp1, outof_temp2,
1953                                   outof_target, unsignedp, next_methods);
1954
1955           if (inter != 0 && inter != outof_target)
1956             emit_move_insn (outof_target, inter);
1957         }
1958
1959       insns = get_insns ();
1960       end_sequence ();
1961
1962       if (inter != 0)
1963         {
1964           emit_insn (insns);
1965           return target;
1966         }
1967     }
1968
1969   /* These can be done a word at a time by propagating carries.  */
1970   if ((binoptab == add_optab || binoptab == sub_optab)
1971       && is_int_mode (mode, &int_mode)
1972       && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
1973       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1974     {
1975       unsigned int i;
1976       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1977       const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
1978       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1979       rtx xop0, xop1, xtarget;
1980
1981       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1982          value is one of those, use it.  Otherwise, use 1 since it is the
1983          one easiest to get.  */
1984 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1985       int normalizep = STORE_FLAG_VALUE;
1986 #else
1987       int normalizep = 1;
1988 #endif
1989
1990       /* Prepare the operands.  */
1991       xop0 = force_reg (int_mode, op0);
1992       xop1 = force_reg (int_mode, op1);
1993
1994       xtarget = gen_reg_rtx (int_mode);
1995
1996       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1997         target = xtarget;
1998
1999       /* Indicate for flow that the entire target reg is being set.  */
2000       if (REG_P (target))
2001         emit_clobber (xtarget);
2002
2003       /* Do the actual arithmetic.  */
2004       for (i = 0; i < nwords; i++)
2005         {
2006           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
2007           rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
2008           rtx op0_piece = operand_subword_force (xop0, index, int_mode);
2009           rtx op1_piece = operand_subword_force (xop1, index, int_mode);
2010           rtx x;
2011
2012           /* Main add/subtract of the input operands.  */
2013           x = expand_binop (word_mode, binoptab,
2014                             op0_piece, op1_piece,
2015                             target_piece, unsignedp, next_methods);
2016           if (x == 0)
2017             break;
2018
2019           if (i + 1 < nwords)
2020             {
2021               /* Store carry from main add/subtract.  */
2022               carry_out = gen_reg_rtx (word_mode);
2023               carry_out = emit_store_flag_force (carry_out,
2024                                                  (binoptab == add_optab
2025                                                   ? LT : GT),
2026                                                  x, op0_piece,
2027                                                  word_mode, 1, normalizep);
2028             }
2029
2030           if (i > 0)
2031             {
2032               rtx newx;
2033
2034               /* Add/subtract previous carry to main result.  */
2035               newx = expand_binop (word_mode,
2036                                    normalizep == 1 ? binoptab : otheroptab,
2037                                    x, carry_in,
2038                                    NULL_RTX, 1, next_methods);
2039
2040               if (i + 1 < nwords)
2041                 {
2042                   /* Get out carry from adding/subtracting carry in.  */
2043                   rtx carry_tmp = gen_reg_rtx (word_mode);
2044                   carry_tmp = emit_store_flag_force (carry_tmp,
2045                                                      (binoptab == add_optab
2046                                                       ? LT : GT),
2047                                                      newx, x,
2048                                                      word_mode, 1, normalizep);
2049
2050                   /* Logical-ior the two poss. carry together.  */
2051                   carry_out = expand_binop (word_mode, ior_optab,
2052                                             carry_out, carry_tmp,
2053                                             carry_out, 0, next_methods);
2054                   if (carry_out == 0)
2055                     break;
2056                 }
2057               emit_move_insn (target_piece, newx);
2058             }
2059           else
2060             {
2061               if (x != target_piece)
2062                 emit_move_insn (target_piece, x);
2063             }
2064
2065           carry_in = carry_out;
2066         }
2067
2068       if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
2069         {
2070           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
2071               || ! rtx_equal_p (target, xtarget))
2072             {
2073               rtx_insn *temp = emit_move_insn (target, xtarget);
2074
2075               set_dst_reg_note (temp, REG_EQUAL,
2076                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2077                                                 int_mode, copy_rtx (xop0),
2078                                                 copy_rtx (xop1)),
2079                                 target);
2080             }
2081           else
2082             target = xtarget;
2083
2084           return target;
2085         }
2086
2087       else
2088         delete_insns_since (last);
2089     }
2090
2091   /* Attempt to synthesize double word multiplies using a sequence of word
2092      mode multiplications.  We first attempt to generate a sequence using a
2093      more efficient unsigned widening multiply, and if that fails we then
2094      try using a signed widening multiply.  */
2095
2096   if (binoptab == smul_optab
2097       && is_int_mode (mode, &int_mode)
2098       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2099       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2100       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2101     {
2102       rtx product = NULL_RTX;
2103       if (convert_optab_handler (umul_widen_optab, int_mode, word_mode)
2104           != CODE_FOR_nothing)
2105         {
2106           product = expand_doubleword_mult (int_mode, op0, op1, target,
2107                                             true, methods);
2108           if (!product)
2109             delete_insns_since (last);
2110         }
2111
2112       if (product == NULL_RTX
2113           && (convert_optab_handler (smul_widen_optab, int_mode, word_mode)
2114               != CODE_FOR_nothing))
2115         {
2116           product = expand_doubleword_mult (int_mode, op0, op1, target,
2117                                             false, methods);
2118           if (!product)
2119             delete_insns_since (last);
2120         }
2121
2122       if (product != NULL_RTX)
2123         {
2124           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
2125             {
2126               rtx_insn *move = emit_move_insn (target ? target : product,
2127                                                product);
2128               set_dst_reg_note (move,
2129                                 REG_EQUAL,
2130                                 gen_rtx_fmt_ee (MULT, int_mode,
2131                                                 copy_rtx (op0),
2132                                                 copy_rtx (op1)),
2133                                 target ? target : product);
2134             }
2135           return product;
2136         }
2137     }
2138
2139   /* Attempt to synthetize double word modulo by constant divisor.  */
2140   if ((binoptab == umod_optab
2141        || binoptab == smod_optab
2142        || binoptab == udiv_optab
2143        || binoptab == sdiv_optab)
2144       && optimize
2145       && CONST_INT_P (op1)
2146       && is_int_mode (mode, &int_mode)
2147       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2148       && optab_handler ((binoptab == umod_optab || binoptab == udiv_optab)
2149                         ? udivmod_optab : sdivmod_optab,
2150                         int_mode) == CODE_FOR_nothing
2151       && optab_handler (and_optab, word_mode) != CODE_FOR_nothing
2152       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing
2153       && optimize_insn_for_speed_p ())
2154     {
2155       rtx res = NULL_RTX;
2156       if ((binoptab == umod_optab || binoptab == smod_optab)
2157           && (INTVAL (op1) & 1) == 0)
2158         res = expand_doubleword_mod (int_mode, op0, op1,
2159                                      binoptab == umod_optab);
2160       else
2161         {
2162           rtx quot = expand_doubleword_divmod (int_mode, op0, op1, &res,
2163                                                binoptab == umod_optab
2164                                                || binoptab == udiv_optab);
2165           if (quot == NULL_RTX)
2166             res = NULL_RTX;
2167           else if (binoptab == udiv_optab || binoptab == sdiv_optab)
2168             res = quot;
2169         }
2170       if (res != NULL_RTX)
2171         {
2172           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
2173             {
2174               rtx_insn *move = emit_move_insn (target ? target : res,
2175                                                res);
2176               set_dst_reg_note (move, REG_EQUAL,
2177                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2178                                                 int_mode, copy_rtx (op0), op1),
2179                                 target ? target : res);
2180             }
2181           return res;
2182         }
2183       else
2184         delete_insns_since (last);
2185     }
2186
2187   /* It can't be open-coded in this mode.
2188      Use a library call if one is available and caller says that's ok.  */
2189
2190   libfunc = optab_libfunc (binoptab, mode);
2191   if (libfunc
2192       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2193     {
2194       rtx_insn *insns;
2195       rtx op1x = op1;
2196       machine_mode op1_mode = mode;
2197       rtx value;
2198
2199       start_sequence ();
2200
2201       if (shift_optab_p (binoptab))
2202         {
2203           op1_mode = targetm.libgcc_shift_count_mode ();
2204           /* Specify unsigned here,
2205              since negative shift counts are meaningless.  */
2206           op1x = convert_to_mode (op1_mode, op1, 1);
2207         }
2208
2209       if (GET_MODE (op0) != VOIDmode
2210           && GET_MODE (op0) != mode)
2211         op0 = convert_to_mode (mode, op0, unsignedp);
2212
2213       /* Pass 1 for NO_QUEUE so we don't lose any increments
2214          if the libcall is cse'd or moved.  */
2215       value = emit_library_call_value (libfunc,
2216                                        NULL_RTX, LCT_CONST, mode,
2217                                        op0, mode, op1x, op1_mode);
2218
2219       insns = get_insns ();
2220       end_sequence ();
2221
2222       bool trapv = trapv_binoptab_p (binoptab);
2223       target = gen_reg_rtx (mode);
2224       emit_libcall_block_1 (insns, target, value,
2225                             trapv ? NULL_RTX
2226                             : gen_rtx_fmt_ee (optab_to_code (binoptab),
2227                                               mode, op0, op1), trapv);
2228
2229       return target;
2230     }
2231
2232   delete_insns_since (last);
2233
2234   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2235
2236   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2237          || methods == OPTAB_MUST_WIDEN))
2238     {
2239       /* Caller says, don't even try.  */
2240       delete_insns_since (entry_last);
2241       return 0;
2242     }
2243
2244   /* Compute the value of METHODS to pass to recursive calls.
2245      Don't allow widening to be tried recursively.  */
2246
2247   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2248
2249   /* Look for a wider mode of the same class for which it appears we can do
2250      the operation.  */
2251
2252   if (CLASS_HAS_WIDER_MODES_P (mclass))
2253     {
2254       /* This code doesn't make sense for conversion optabs, since we
2255          wouldn't then want to extend the operands to be the same size
2256          as the result.  */
2257       gcc_assert (!convert_optab_p (binoptab));
2258       FOR_EACH_WIDER_MODE (wider_mode, mode)
2259         {
2260           if (optab_handler (binoptab, wider_mode)
2261               || (methods == OPTAB_LIB
2262                   && optab_libfunc (binoptab, wider_mode)))
2263             {
2264               rtx xop0 = op0, xop1 = op1;
2265               bool no_extend = false;
2266
2267               /* For certain integer operations, we need not actually extend
2268                  the narrow operands, as long as we will truncate
2269                  the results to the same narrowness.  */
2270
2271               if ((binoptab == ior_optab || binoptab == and_optab
2272                    || binoptab == xor_optab
2273                    || binoptab == add_optab || binoptab == sub_optab
2274                    || binoptab == smul_optab || binoptab == ashl_optab)
2275                   && mclass == MODE_INT)
2276                 no_extend = true;
2277
2278               xop0 = widen_operand (xop0, wider_mode, mode,
2279                                     unsignedp, no_extend);
2280
2281               /* The second operand of a shift must always be extended.  */
2282               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2283                                     no_extend && binoptab != ashl_optab);
2284
2285               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2286                                    unsignedp, methods);
2287               if (temp)
2288                 {
2289                   if (mclass != MODE_INT
2290                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2291                     {
2292                       if (target == 0)
2293                         target = gen_reg_rtx (mode);
2294                       convert_move (target, temp, 0);
2295                       return target;
2296                     }
2297                   else
2298                     return gen_lowpart (mode, temp);
2299                 }
2300               else
2301                 delete_insns_since (last);
2302             }
2303         }
2304     }
2305
2306   delete_insns_since (entry_last);
2307   return 0;
2308 }
2309 \f
2310 /* Expand a binary operator which has both signed and unsigned forms.
2311    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2312    signed operations.
2313
2314    If we widen unsigned operands, we may use a signed wider operation instead
2315    of an unsigned wider operation, since the result would be the same.  */
2316
2317 rtx
2318 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
2319                    rtx op0, rtx op1, rtx target, int unsignedp,
2320                    enum optab_methods methods)
2321 {
2322   rtx temp;
2323   optab direct_optab = unsignedp ? uoptab : soptab;
2324   bool save_enable;
2325
2326   /* Do it without widening, if possible.  */
2327   temp = expand_binop (mode, direct_optab, op0, op1, target,
2328                        unsignedp, OPTAB_DIRECT);
2329   if (temp || methods == OPTAB_DIRECT)
2330     return temp;
2331
2332   /* Try widening to a signed int.  Disable any direct use of any
2333      signed insn in the current mode.  */
2334   save_enable = swap_optab_enable (soptab, mode, false);
2335
2336   temp = expand_binop (mode, soptab, op0, op1, target,
2337                        unsignedp, OPTAB_WIDEN);
2338
2339   /* For unsigned operands, try widening to an unsigned int.  */
2340   if (!temp && unsignedp)
2341     temp = expand_binop (mode, uoptab, op0, op1, target,
2342                          unsignedp, OPTAB_WIDEN);
2343   if (temp || methods == OPTAB_WIDEN)
2344     goto egress;
2345
2346   /* Use the right width libcall if that exists.  */
2347   temp = expand_binop (mode, direct_optab, op0, op1, target,
2348                        unsignedp, OPTAB_LIB);
2349   if (temp || methods == OPTAB_LIB)
2350     goto egress;
2351
2352   /* Must widen and use a libcall, use either signed or unsigned.  */
2353   temp = expand_binop (mode, soptab, op0, op1, target,
2354                        unsignedp, methods);
2355   if (!temp && unsignedp)
2356     temp = expand_binop (mode, uoptab, op0, op1, target,
2357                          unsignedp, methods);
2358
2359  egress:
2360   /* Undo the fiddling above.  */
2361   if (save_enable)
2362     swap_optab_enable (soptab, mode, true);
2363   return temp;
2364 }
2365 \f
2366 /* Generate code to perform an operation specified by UNOPPTAB
2367    on operand OP0, with two results to TARG0 and TARG1.
2368    We assume that the order of the operands for the instruction
2369    is TARG0, TARG1, OP0.
2370
2371    Either TARG0 or TARG1 may be zero, but what that means is that
2372    the result is not actually wanted.  We will generate it into
2373    a dummy pseudo-reg and discard it.  They may not both be zero.
2374
2375    Returns true if this operation can be performed; false if not.  */
2376
2377 bool
2378 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2379                     int unsignedp)
2380 {
2381   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2382   enum mode_class mclass;
2383   machine_mode wider_mode;
2384   rtx_insn *entry_last = get_last_insn ();
2385   rtx_insn *last;
2386
2387   mclass = GET_MODE_CLASS (mode);
2388
2389   if (!targ0)
2390     targ0 = gen_reg_rtx (mode);
2391   if (!targ1)
2392     targ1 = gen_reg_rtx (mode);
2393
2394   /* Record where to go back to if we fail.  */
2395   last = get_last_insn ();
2396
2397   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2398     {
2399       class expand_operand ops[3];
2400       enum insn_code icode = optab_handler (unoptab, mode);
2401
2402       create_fixed_operand (&ops[0], targ0);
2403       create_fixed_operand (&ops[1], targ1);
2404       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2405       if (maybe_expand_insn (icode, 3, ops))
2406         return true;
2407     }
2408
2409   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2410
2411   if (CLASS_HAS_WIDER_MODES_P (mclass))
2412     {
2413       FOR_EACH_WIDER_MODE (wider_mode, mode)
2414         {
2415           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2416             {
2417               rtx t0 = gen_reg_rtx (wider_mode);
2418               rtx t1 = gen_reg_rtx (wider_mode);
2419               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2420
2421               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2422                 {
2423                   convert_move (targ0, t0, unsignedp);
2424                   convert_move (targ1, t1, unsignedp);
2425                   return true;
2426                 }
2427               else
2428                 delete_insns_since (last);
2429             }
2430         }
2431     }
2432
2433   delete_insns_since (entry_last);
2434   return false;
2435 }
2436 \f
2437 /* Generate code to perform an operation specified by BINOPTAB
2438    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2439    We assume that the order of the operands for the instruction
2440    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2441    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2442
2443    Either TARG0 or TARG1 may be zero, but what that means is that
2444    the result is not actually wanted.  We will generate it into
2445    a dummy pseudo-reg and discard it.  They may not both be zero.
2446
2447    Returns true if this operation can be performed; false if not.  */
2448
2449 bool
2450 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2451                      int unsignedp)
2452 {
2453   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2454   enum mode_class mclass;
2455   machine_mode wider_mode;
2456   rtx_insn *entry_last = get_last_insn ();
2457   rtx_insn *last;
2458
2459   mclass = GET_MODE_CLASS (mode);
2460
2461   if (!targ0)
2462     targ0 = gen_reg_rtx (mode);
2463   if (!targ1)
2464     targ1 = gen_reg_rtx (mode);
2465
2466   /* Record where to go back to if we fail.  */
2467   last = get_last_insn ();
2468
2469   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2470     {
2471       class expand_operand ops[4];
2472       enum insn_code icode = optab_handler (binoptab, mode);
2473       machine_mode mode0 = insn_data[icode].operand[1].mode;
2474       machine_mode mode1 = insn_data[icode].operand[2].mode;
2475       rtx xop0 = op0, xop1 = op1;
2476
2477       /* If we are optimizing, force expensive constants into a register.  */
2478       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2479       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2480
2481       create_fixed_operand (&ops[0], targ0);
2482       create_convert_operand_from (&ops[1], xop0, mode, unsignedp);
2483       create_convert_operand_from (&ops[2], xop1, mode, unsignedp);
2484       create_fixed_operand (&ops[3], targ1);
2485       if (maybe_expand_insn (icode, 4, ops))
2486         return true;
2487       delete_insns_since (last);
2488     }
2489
2490   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2491
2492   if (CLASS_HAS_WIDER_MODES_P (mclass))
2493     {
2494       FOR_EACH_WIDER_MODE (wider_mode, mode)
2495         {
2496           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2497             {
2498               rtx t0 = gen_reg_rtx (wider_mode);
2499               rtx t1 = gen_reg_rtx (wider_mode);
2500               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2501               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2502
2503               if (expand_twoval_binop (binoptab, cop0, cop1,
2504                                        t0, t1, unsignedp))
2505                 {
2506                   convert_move (targ0, t0, unsignedp);
2507                   convert_move (targ1, t1, unsignedp);
2508                   return true;
2509                 }
2510               else
2511                 delete_insns_since (last);
2512             }
2513         }
2514     }
2515
2516   delete_insns_since (entry_last);
2517   return false;
2518 }
2519
2520 /* Expand the two-valued library call indicated by BINOPTAB, but
2521    preserve only one of the values.  If TARG0 is non-NULL, the first
2522    value is placed into TARG0; otherwise the second value is placed
2523    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2524    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2525    This routine assumes that the value returned by the library call is
2526    as if the return value was of an integral mode twice as wide as the
2527    mode of OP0.  Returns 1 if the call was successful.  */
2528
2529 bool
2530 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2531                              rtx targ0, rtx targ1, enum rtx_code code)
2532 {
2533   machine_mode mode;
2534   machine_mode libval_mode;
2535   rtx libval;
2536   rtx_insn *insns;
2537   rtx libfunc;
2538
2539   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2540   gcc_assert (!targ0 != !targ1);
2541
2542   mode = GET_MODE (op0);
2543   libfunc = optab_libfunc (binoptab, mode);
2544   if (!libfunc)
2545     return false;
2546
2547   /* The value returned by the library function will have twice as
2548      many bits as the nominal MODE.  */
2549   libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2550   start_sequence ();
2551   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2552                                     libval_mode,
2553                                     op0, mode,
2554                                     op1, mode);
2555   /* Get the part of VAL containing the value that we want.  */
2556   libval = simplify_gen_subreg (mode, libval, libval_mode,
2557                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2558   insns = get_insns ();
2559   end_sequence ();
2560   /* Move the into the desired location.  */
2561   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2562                       gen_rtx_fmt_ee (code, mode, op0, op1));
2563
2564   return true;
2565 }
2566
2567 \f
2568 /* Wrapper around expand_unop which takes an rtx code to specify
2569    the operation to perform, not an optab pointer.  All other
2570    arguments are the same.  */
2571 rtx
2572 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2573                     rtx target, int unsignedp)
2574 {
2575   optab unop = code_to_optab (code);
2576   gcc_assert (unop);
2577
2578   return expand_unop (mode, unop, op0, target, unsignedp);
2579 }
2580
2581 /* Try calculating
2582         (clz:narrow x)
2583    as
2584         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2585
2586    A similar operation can be used for clrsb.  UNOPTAB says which operation
2587    we are trying to expand.  */
2588 static rtx
2589 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2590 {
2591   opt_scalar_int_mode wider_mode_iter;
2592   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2593     {
2594       scalar_int_mode wider_mode = wider_mode_iter.require ();
2595       if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2596         {
2597           rtx xop0, temp;
2598           rtx_insn *last;
2599
2600           last = get_last_insn ();
2601
2602           if (target == 0)
2603             target = gen_reg_rtx (mode);
2604           xop0 = widen_operand (op0, wider_mode, mode,
2605                                 unoptab != clrsb_optab, false);
2606           temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2607                               unoptab != clrsb_optab);
2608           if (temp != 0)
2609             temp = expand_binop
2610               (wider_mode, sub_optab, temp,
2611                gen_int_mode (GET_MODE_PRECISION (wider_mode)
2612                              - GET_MODE_PRECISION (mode),
2613                              wider_mode),
2614                target, true, OPTAB_DIRECT);
2615           if (temp == 0)
2616             delete_insns_since (last);
2617
2618           return temp;
2619         }
2620     }
2621   return 0;
2622 }
2623
2624 /* Attempt to emit (clrsb:mode op0) as
2625    (plus:mode (clz:mode (xor:mode op0 (ashr:mode op0 (const_int prec-1))))
2626               (const_int -1))
2627    if CLZ_DEFINED_VALUE_AT_ZERO (mode, val) is 2 and val is prec,
2628    or as
2629    (clz:mode (ior:mode (xor:mode (ashl:mode op0 (const_int 1))
2630                                  (ashr:mode op0 (const_int prec-1)))
2631                        (const_int 1)))
2632    otherwise.  */
2633
2634 static rtx
2635 expand_clrsb_using_clz (scalar_int_mode mode, rtx op0, rtx target)
2636 {
2637   if (optimize_insn_for_size_p ()
2638       || optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2639     return NULL_RTX;
2640
2641   start_sequence ();
2642   HOST_WIDE_INT val = 0;
2643   if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) != 2
2644       || val != GET_MODE_PRECISION (mode))
2645     val = 0;
2646   else
2647     val = 1;
2648
2649   rtx temp2 = op0;
2650   if (!val)
2651     {
2652       temp2 = expand_binop (mode, ashl_optab, op0, const1_rtx,
2653                             NULL_RTX, 0, OPTAB_DIRECT);
2654       if (!temp2)
2655         {
2656         fail:
2657           end_sequence ();
2658           return NULL_RTX;
2659         }
2660     }
2661
2662   rtx temp = expand_binop (mode, ashr_optab, op0,
2663                            GEN_INT (GET_MODE_PRECISION (mode) - 1),
2664                            NULL_RTX, 0, OPTAB_DIRECT);
2665   if (!temp)
2666     goto fail;
2667
2668   temp = expand_binop (mode, xor_optab, temp2, temp, NULL_RTX, 0,
2669                        OPTAB_DIRECT);
2670   if (!temp)
2671     goto fail;
2672
2673   if (!val)
2674     {
2675       temp = expand_binop (mode, ior_optab, temp, const1_rtx,
2676                            NULL_RTX, 0, OPTAB_DIRECT);
2677       if (!temp)
2678         goto fail;
2679     }
2680   temp = expand_unop_direct (mode, clz_optab, temp, val ? NULL_RTX : target,
2681                              true);
2682   if (!temp)
2683     goto fail;
2684   if (val)
2685     {
2686       temp = expand_binop (mode, add_optab, temp, constm1_rtx,
2687                            target, 0, OPTAB_DIRECT);
2688       if (!temp)
2689         goto fail;
2690     }
2691
2692   rtx_insn *seq = get_insns ();
2693   end_sequence ();
2694
2695   add_equal_note (seq, temp, CLRSB, op0, NULL_RTX, mode);
2696   emit_insn (seq);
2697   return temp;
2698 }
2699
2700 static rtx expand_ffs (scalar_int_mode, rtx, rtx);
2701
2702 /* Try calculating clz, ctz or ffs of a double-word quantity as two clz, ctz or
2703    ffs operations on word-sized quantities, choosing which based on whether the
2704    high (for clz) or low (for ctz and ffs) word is nonzero.  */
2705 static rtx
2706 expand_doubleword_clz_ctz_ffs (scalar_int_mode mode, rtx op0, rtx target,
2707                                optab unoptab)
2708 {
2709   rtx xop0 = force_reg (mode, op0);
2710   rtx subhi = gen_highpart (word_mode, xop0);
2711   rtx sublo = gen_lowpart (word_mode, xop0);
2712   rtx_code_label *hi0_label = gen_label_rtx ();
2713   rtx_code_label *after_label = gen_label_rtx ();
2714   rtx_insn *seq;
2715   rtx temp, result;
2716   int addend = 0;
2717
2718   /* If we were not given a target, use a word_mode register, not a
2719      'mode' register.  The result will fit, and nobody is expecting
2720      anything bigger (the return type of __builtin_clz* is int).  */
2721   if (!target)
2722     target = gen_reg_rtx (word_mode);
2723
2724   /* In any case, write to a word_mode scratch in both branches of the
2725      conditional, so we can ensure there is a single move insn setting
2726      'target' to tag a REG_EQUAL note on.  */
2727   result = gen_reg_rtx (word_mode);
2728
2729   if (unoptab != clz_optab)
2730     std::swap (subhi, sublo);
2731
2732   start_sequence ();
2733
2734   /* If the high word is not equal to zero,
2735      then clz of the full value is clz of the high word.  */
2736   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2737                            word_mode, true, hi0_label);
2738
2739   if (optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2740     temp = expand_unop_direct (word_mode, unoptab, subhi, result, true);
2741   else
2742     {
2743       gcc_assert (unoptab == ffs_optab);
2744       temp = expand_ffs (word_mode, subhi, result);
2745     }
2746   if (!temp)
2747     goto fail;
2748
2749   if (temp != result)
2750     convert_move (result, temp, true);
2751
2752   emit_jump_insn (targetm.gen_jump (after_label));
2753   emit_barrier ();
2754
2755   /* Else clz of the full value is clz of the low word plus the number
2756      of bits in the high word.  Similarly for ctz/ffs of the high word,
2757      except that ffs should be 0 when both words are zero.  */
2758   emit_label (hi0_label);
2759
2760   if (unoptab == ffs_optab)
2761     {
2762       convert_move (result, const0_rtx, true);
2763       emit_cmp_and_jump_insns (sublo, CONST0_RTX (word_mode), EQ, 0,
2764                                word_mode, true, after_label);
2765     }
2766
2767   if (optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2768     temp = expand_unop_direct (word_mode, unoptab, sublo, NULL_RTX, true);
2769   else
2770     {
2771       gcc_assert (unoptab == ffs_optab);
2772       temp = expand_unop_direct (word_mode, ctz_optab, sublo, NULL_RTX, true);
2773       addend = 1;
2774     }
2775
2776   if (!temp)
2777     goto fail;
2778
2779   temp = expand_binop (word_mode, add_optab, temp,
2780                        gen_int_mode (GET_MODE_BITSIZE (word_mode) + addend,
2781                                      word_mode),
2782                        result, true, OPTAB_DIRECT);
2783   if (!temp)
2784     goto fail;
2785   if (temp != result)
2786     convert_move (result, temp, true);
2787
2788   emit_label (after_label);
2789   convert_move (target, result, true);
2790
2791   seq = get_insns ();
2792   end_sequence ();
2793
2794   add_equal_note (seq, target, optab_to_code (unoptab), xop0, NULL_RTX, mode);
2795   emit_insn (seq);
2796   return target;
2797
2798  fail:
2799   end_sequence ();
2800   return 0;
2801 }
2802
2803 /* Try calculating popcount of a double-word quantity as two popcount's of
2804    word-sized quantities and summing up the results.  */
2805 static rtx
2806 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2807 {
2808   rtx t0, t1, t;
2809   rtx_insn *seq;
2810
2811   start_sequence ();
2812
2813   t0 = expand_unop_direct (word_mode, popcount_optab,
2814                            operand_subword_force (op0, 0, mode), NULL_RTX,
2815                            true);
2816   t1 = expand_unop_direct (word_mode, popcount_optab,
2817                            operand_subword_force (op0, 1, mode), NULL_RTX,
2818                            true);
2819   if (!t0 || !t1)
2820     {
2821       end_sequence ();
2822       return NULL_RTX;
2823     }
2824
2825   /* If we were not given a target, use a word_mode register, not a
2826      'mode' register.  The result will fit, and nobody is expecting
2827      anything bigger (the return type of __builtin_popcount* is int).  */
2828   if (!target)
2829     target = gen_reg_rtx (word_mode);
2830
2831   t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2832
2833   seq = get_insns ();
2834   end_sequence ();
2835
2836   add_equal_note (seq, t, POPCOUNT, op0, NULL_RTX, mode);
2837   emit_insn (seq);
2838   return t;
2839 }
2840
2841 /* Try calculating
2842         (parity:wide x)
2843    as
2844         (parity:narrow (low (x) ^ high (x))) */
2845 static rtx
2846 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2847 {
2848   rtx t = expand_binop (word_mode, xor_optab,
2849                         operand_subword_force (op0, 0, mode),
2850                         operand_subword_force (op0, 1, mode),
2851                         NULL_RTX, 0, OPTAB_DIRECT);
2852   return expand_unop (word_mode, parity_optab, t, target, true);
2853 }
2854
2855 /* Try calculating
2856         (bswap:narrow x)
2857    as
2858         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2859 static rtx
2860 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2861 {
2862   rtx x;
2863   rtx_insn *last;
2864   opt_scalar_int_mode wider_mode_iter;
2865
2866   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2867     if (optab_handler (bswap_optab, wider_mode_iter.require ())
2868         != CODE_FOR_nothing)
2869       break;
2870
2871   if (!wider_mode_iter.exists ())
2872     return NULL_RTX;
2873
2874   scalar_int_mode wider_mode = wider_mode_iter.require ();
2875   last = get_last_insn ();
2876
2877   x = widen_operand (op0, wider_mode, mode, true, true);
2878   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2879
2880   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2881               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2882   if (x != 0)
2883     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2884                       GET_MODE_BITSIZE (wider_mode)
2885                       - GET_MODE_BITSIZE (mode),
2886                       NULL_RTX, true);
2887
2888   if (x != 0)
2889     {
2890       if (target == 0)
2891         target = gen_reg_rtx (mode);
2892       emit_move_insn (target, gen_lowpart (mode, x));
2893     }
2894   else
2895     delete_insns_since (last);
2896
2897   return target;
2898 }
2899
2900 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2901
2902 static rtx
2903 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2904 {
2905   rtx t0, t1;
2906
2907   t1 = expand_unop (word_mode, bswap_optab,
2908                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2909   t0 = expand_unop (word_mode, bswap_optab,
2910                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2911
2912   if (target == 0 || !valid_multiword_target_p (target))
2913     target = gen_reg_rtx (mode);
2914   if (REG_P (target))
2915     emit_clobber (target);
2916   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2917   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2918
2919   return target;
2920 }
2921
2922 /* Try calculating (parity x) as (and (popcount x) 1), where
2923    popcount can also be done in a wider mode.  */
2924 static rtx
2925 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2926 {
2927   enum mode_class mclass = GET_MODE_CLASS (mode);
2928   opt_scalar_int_mode wider_mode_iter;
2929   FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2930     {
2931       scalar_int_mode wider_mode = wider_mode_iter.require ();
2932       if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2933         {
2934           rtx xop0, temp;
2935           rtx_insn *last;
2936
2937           last = get_last_insn ();
2938
2939           if (target == 0 || GET_MODE (target) != wider_mode)
2940             target = gen_reg_rtx (wider_mode);
2941
2942           xop0 = widen_operand (op0, wider_mode, mode, true, false);
2943           temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2944                               true);
2945           if (temp != 0)
2946             temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2947                                  target, true, OPTAB_DIRECT);
2948
2949           if (temp)
2950             {
2951               if (mclass != MODE_INT
2952                   || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2953                 return convert_to_mode (mode, temp, 0);
2954               else
2955                 return gen_lowpart (mode, temp);
2956             }
2957           else
2958             delete_insns_since (last);
2959         }
2960     }
2961   return 0;
2962 }
2963
2964 /* Try calculating ctz(x) as K - clz(x & -x) ,
2965    where K is GET_MODE_PRECISION(mode) - 1.
2966
2967    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2968    don't have to worry about what the hardware does in that case.  (If
2969    the clz instruction produces the usual value at 0, which is K, the
2970    result of this code sequence will be -1; expand_ffs, below, relies
2971    on this.  It might be nice to have it be K instead, for consistency
2972    with the (very few) processors that provide a ctz with a defined
2973    value, but that would take one more instruction, and it would be
2974    less convenient for expand_ffs anyway.  */
2975
2976 static rtx
2977 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2978 {
2979   rtx_insn *seq;
2980   rtx temp;
2981
2982   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2983     return 0;
2984
2985   start_sequence ();
2986
2987   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2988   if (temp)
2989     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2990                          true, OPTAB_DIRECT);
2991   if (temp)
2992     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2993   if (temp)
2994     temp = expand_binop (mode, sub_optab,
2995                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2996                          temp, target,
2997                          true, OPTAB_DIRECT);
2998   if (temp == 0)
2999     {
3000       end_sequence ();
3001       return 0;
3002     }
3003
3004   seq = get_insns ();
3005   end_sequence ();
3006
3007   add_equal_note (seq, temp, CTZ, op0, NULL_RTX, mode);
3008   emit_insn (seq);
3009   return temp;
3010 }
3011
3012
3013 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
3014    else with the sequence used by expand_clz.
3015
3016    The ffs builtin promises to return zero for a zero value and ctz/clz
3017    may have an undefined value in that case.  If they do not give us a
3018    convenient value, we have to generate a test and branch.  */
3019 static rtx
3020 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
3021 {
3022   HOST_WIDE_INT val = 0;
3023   bool defined_at_zero = false;
3024   rtx temp;
3025   rtx_insn *seq;
3026
3027   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
3028     {
3029       start_sequence ();
3030
3031       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
3032       if (!temp)
3033         goto fail;
3034
3035       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
3036     }
3037   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
3038     {
3039       start_sequence ();
3040       temp = expand_ctz (mode, op0, 0);
3041       if (!temp)
3042         goto fail;
3043
3044       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
3045         {
3046           defined_at_zero = true;
3047           val = (GET_MODE_PRECISION (mode) - 1) - val;
3048         }
3049     }
3050   else
3051     return 0;
3052
3053   if (defined_at_zero && val == -1)
3054     /* No correction needed at zero.  */;
3055   else
3056     {
3057       /* We don't try to do anything clever with the situation found
3058          on some processors (eg Alpha) where ctz(0:mode) ==
3059          bitsize(mode).  If someone can think of a way to send N to -1
3060          and leave alone all values in the range 0..N-1 (where N is a
3061          power of two), cheaper than this test-and-branch, please add it.
3062
3063          The test-and-branch is done after the operation itself, in case
3064          the operation sets condition codes that can be recycled for this.
3065          (This is true on i386, for instance.)  */
3066
3067       rtx_code_label *nonzero_label = gen_label_rtx ();
3068       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
3069                                mode, true, nonzero_label);
3070
3071       convert_move (temp, GEN_INT (-1), false);
3072       emit_label (nonzero_label);
3073     }
3074
3075   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
3076      to produce a value in the range 0..bitsize.  */
3077   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
3078                        target, false, OPTAB_DIRECT);
3079   if (!temp)
3080     goto fail;
3081
3082   seq = get_insns ();
3083   end_sequence ();
3084
3085   add_equal_note (seq, temp, FFS, op0, NULL_RTX, mode);
3086   emit_insn (seq);
3087   return temp;
3088
3089  fail:
3090   end_sequence ();
3091   return 0;
3092 }
3093
3094 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
3095    conditions, VAL may already be a SUBREG against which we cannot generate
3096    a further SUBREG.  In this case, we expect forcing the value into a
3097    register will work around the situation.  */
3098
3099 static rtx
3100 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
3101                            machine_mode imode)
3102 {
3103   rtx ret;
3104   ret = lowpart_subreg (omode, val, imode);
3105   if (ret == NULL)
3106     {
3107       val = force_reg (imode, val);
3108       ret = lowpart_subreg (omode, val, imode);
3109       gcc_assert (ret != NULL);
3110     }
3111   return ret;
3112 }
3113
3114 /* Expand a floating point absolute value or negation operation via a
3115    logical operation on the sign bit.  */
3116
3117 static rtx
3118 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
3119                    rtx op0, rtx target)
3120 {
3121   const struct real_format *fmt;
3122   int bitpos, word, nwords, i;
3123   scalar_int_mode imode;
3124   rtx temp;
3125   rtx_insn *insns;
3126
3127   /* The format has to have a simple sign bit.  */
3128   fmt = REAL_MODE_FORMAT (mode);
3129   if (fmt == NULL)
3130     return NULL_RTX;
3131
3132   bitpos = fmt->signbit_rw;
3133   if (bitpos < 0)
3134     return NULL_RTX;
3135
3136   /* Don't create negative zeros if the format doesn't support them.  */
3137   if (code == NEG && !fmt->has_signed_zero)
3138     return NULL_RTX;
3139
3140   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3141     {
3142       if (!int_mode_for_mode (mode).exists (&imode))
3143         return NULL_RTX;
3144       word = 0;
3145       nwords = 1;
3146     }
3147   else
3148     {
3149       imode = word_mode;
3150
3151       if (FLOAT_WORDS_BIG_ENDIAN)
3152         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3153       else
3154         word = bitpos / BITS_PER_WORD;
3155       bitpos = bitpos % BITS_PER_WORD;
3156       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3157     }
3158
3159   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3160   if (code == ABS)
3161     mask = ~mask;
3162
3163   if (target == 0
3164       || target == op0
3165       || reg_overlap_mentioned_p (target, op0)
3166       || (nwords > 1 && !valid_multiword_target_p (target)))
3167     target = gen_reg_rtx (mode);
3168
3169   if (nwords > 1)
3170     {
3171       start_sequence ();
3172
3173       for (i = 0; i < nwords; ++i)
3174         {
3175           rtx targ_piece = operand_subword (target, i, 1, mode);
3176           rtx op0_piece = operand_subword_force (op0, i, mode);
3177
3178           if (i == word)
3179             {
3180               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
3181                                    op0_piece,
3182                                    immed_wide_int_const (mask, imode),
3183                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3184               if (temp != targ_piece)
3185                 emit_move_insn (targ_piece, temp);
3186             }
3187           else
3188             emit_move_insn (targ_piece, op0_piece);
3189         }
3190
3191       insns = get_insns ();
3192       end_sequence ();
3193
3194       emit_insn (insns);
3195     }
3196   else
3197     {
3198       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
3199                            gen_lowpart (imode, op0),
3200                            immed_wide_int_const (mask, imode),
3201                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3202       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3203
3204       set_dst_reg_note (get_last_insn (), REG_EQUAL,
3205                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
3206                         target);
3207     }
3208
3209   return target;
3210 }
3211
3212 /* As expand_unop, but will fail rather than attempt the operation in a
3213    different mode or with a libcall.  */
3214 static rtx
3215 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
3216                     int unsignedp)
3217 {
3218   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
3219     {
3220       class expand_operand ops[2];
3221       enum insn_code icode = optab_handler (unoptab, mode);
3222       rtx_insn *last = get_last_insn ();
3223       rtx_insn *pat;
3224
3225       create_output_operand (&ops[0], target, mode);
3226       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3227       pat = maybe_gen_insn (icode, 2, ops);
3228       if (pat)
3229         {
3230           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3231               && ! add_equal_note (pat, ops[0].value,
3232                                    optab_to_code (unoptab),
3233                                    ops[1].value, NULL_RTX, mode))
3234             {
3235               delete_insns_since (last);
3236               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3237             }
3238
3239           emit_insn (pat);
3240
3241           return ops[0].value;
3242         }
3243     }
3244   return 0;
3245 }
3246
3247 /* Generate code to perform an operation specified by UNOPTAB
3248    on operand OP0, with result having machine-mode MODE.
3249
3250    UNSIGNEDP is for the case where we have to widen the operands
3251    to perform the operation.  It says to use zero-extension.
3252
3253    If TARGET is nonzero, the value
3254    is generated there, if it is convenient to do so.
3255    In all cases an rtx is returned for the locus of the value;
3256    this may or may not be TARGET.  */
3257
3258 rtx
3259 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
3260              int unsignedp)
3261 {
3262   enum mode_class mclass = GET_MODE_CLASS (mode);
3263   machine_mode wider_mode;
3264   scalar_int_mode int_mode;
3265   scalar_float_mode float_mode;
3266   rtx temp;
3267   rtx libfunc;
3268
3269   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3270   if (temp)
3271     return temp;
3272
3273   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3274
3275   /* Widening (or narrowing) clz needs special treatment.  */
3276   if (unoptab == clz_optab)
3277     {
3278       if (is_a <scalar_int_mode> (mode, &int_mode))
3279         {
3280           temp = widen_leading (int_mode, op0, target, unoptab);
3281           if (temp)
3282             return temp;
3283
3284           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
3285               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3286             {
3287               temp = expand_doubleword_clz_ctz_ffs (int_mode, op0, target,
3288                                                     unoptab);
3289               if (temp)
3290                 return temp;
3291             }
3292         }
3293
3294       goto try_libcall;
3295     }
3296
3297   if (unoptab == clrsb_optab)
3298     {
3299       if (is_a <scalar_int_mode> (mode, &int_mode))
3300         {
3301           temp = widen_leading (int_mode, op0, target, unoptab);
3302           if (temp)
3303             return temp;
3304           temp = expand_clrsb_using_clz (int_mode, op0, target);
3305           if (temp)
3306             return temp;
3307         }
3308       goto try_libcall;
3309     }
3310
3311   if (unoptab == popcount_optab
3312       && is_a <scalar_int_mode> (mode, &int_mode)
3313       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
3314       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
3315       && optimize_insn_for_speed_p ())
3316     {
3317       temp = expand_doubleword_popcount (int_mode, op0, target);
3318       if (temp)
3319         return temp;
3320     }
3321
3322   if (unoptab == parity_optab
3323       && is_a <scalar_int_mode> (mode, &int_mode)
3324       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
3325       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
3326           || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
3327       && optimize_insn_for_speed_p ())
3328     {
3329       temp = expand_doubleword_parity (int_mode, op0, target);
3330       if (temp)
3331         return temp;
3332     }
3333
3334   /* Widening (or narrowing) bswap needs special treatment.  */
3335   if (unoptab == bswap_optab)
3336     {
3337       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3338          or ROTATERT.  First try these directly; if this fails, then try the
3339          obvious pair of shifts with allowed widening, as this will probably
3340          be always more efficient than the other fallback methods.  */
3341       if (mode == HImode)
3342         {
3343           rtx_insn *last;
3344           rtx temp1, temp2;
3345
3346           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3347             {
3348               temp = expand_binop (mode, rotl_optab, op0,
3349                                    gen_int_shift_amount (mode, 8),
3350                                    target, unsignedp, OPTAB_DIRECT);
3351               if (temp)
3352                 return temp;
3353              }
3354
3355           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3356             {
3357               temp = expand_binop (mode, rotr_optab, op0,
3358                                    gen_int_shift_amount (mode, 8),
3359                                    target, unsignedp, OPTAB_DIRECT);
3360               if (temp)
3361                 return temp;
3362             }
3363
3364           last = get_last_insn ();
3365
3366           temp1 = expand_binop (mode, ashl_optab, op0,
3367                                 gen_int_shift_amount (mode, 8), NULL_RTX,
3368                                 unsignedp, OPTAB_WIDEN);
3369           temp2 = expand_binop (mode, lshr_optab, op0,
3370                                 gen_int_shift_amount (mode, 8), NULL_RTX,
3371                                 unsignedp, OPTAB_WIDEN);
3372           if (temp1 && temp2)
3373             {
3374               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3375                                    unsignedp, OPTAB_WIDEN);
3376               if (temp)
3377                 return temp;
3378             }
3379
3380           delete_insns_since (last);
3381         }
3382
3383       if (is_a <scalar_int_mode> (mode, &int_mode))
3384         {
3385           temp = widen_bswap (int_mode, op0, target);
3386           if (temp)
3387             return temp;
3388
3389           /* We do not provide a 128-bit bswap in libgcc so force the use of
3390              a double bswap for 64-bit targets.  */
3391           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
3392               && (UNITS_PER_WORD == 8
3393                   || optab_handler (unoptab, word_mode) != CODE_FOR_nothing))
3394             {
3395               temp = expand_doubleword_bswap (mode, op0, target);
3396               if (temp)
3397                 return temp;
3398             }
3399         }
3400
3401       goto try_libcall;
3402     }
3403
3404   if (CLASS_HAS_WIDER_MODES_P (mclass))
3405     FOR_EACH_WIDER_MODE (wider_mode, mode)
3406       {
3407         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3408           {
3409             rtx xop0 = op0;
3410             rtx_insn *last = get_last_insn ();
3411
3412             /* For certain operations, we need not actually extend
3413                the narrow operand, as long as we will truncate the
3414                results to the same narrowness.  */
3415
3416             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3417                                   (unoptab == neg_optab
3418                                    || unoptab == one_cmpl_optab)
3419                                   && mclass == MODE_INT);
3420
3421             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3422                                 unsignedp);
3423
3424             if (temp)
3425               {
3426                 if (mclass != MODE_INT
3427                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3428                   {
3429                     if (target == 0)
3430                       target = gen_reg_rtx (mode);
3431                     convert_move (target, temp, 0);
3432                     return target;
3433                   }
3434                 else
3435                   return gen_lowpart (mode, temp);
3436               }
3437             else
3438               delete_insns_since (last);
3439           }
3440       }
3441
3442   /* These can be done a word at a time.  */
3443   if (unoptab == one_cmpl_optab
3444       && is_int_mode (mode, &int_mode)
3445       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
3446       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3447     {
3448       int i;
3449       rtx_insn *insns;
3450
3451       if (target == 0
3452           || target == op0
3453           || reg_overlap_mentioned_p (target, op0)
3454           || !valid_multiword_target_p (target))
3455         target = gen_reg_rtx (int_mode);
3456
3457       start_sequence ();
3458
3459       /* Do the actual arithmetic.  */
3460       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
3461         {
3462           rtx target_piece = operand_subword (target, i, 1, int_mode);
3463           rtx x = expand_unop (word_mode, unoptab,
3464                                operand_subword_force (op0, i, int_mode),
3465                                target_piece, unsignedp);
3466
3467           if (target_piece != x)
3468             emit_move_insn (target_piece, x);
3469         }
3470
3471       insns = get_insns ();
3472       end_sequence ();
3473
3474       emit_insn (insns);
3475       return target;
3476     }
3477
3478   /* Emit ~op0 as op0 ^ -1.  */
3479   if (unoptab == one_cmpl_optab
3480       && (SCALAR_INT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_VECTOR_INT)
3481       && optab_handler (xor_optab, mode) != CODE_FOR_nothing)
3482     {
3483       temp = expand_binop (mode, xor_optab, op0, CONSTM1_RTX (mode),
3484                            target, unsignedp, OPTAB_DIRECT);
3485       if (temp)
3486         return temp;
3487     }
3488
3489   if (optab_to_code (unoptab) == NEG)
3490     {
3491       /* Try negating floating point values by flipping the sign bit.  */
3492       if (is_a <scalar_float_mode> (mode, &float_mode))
3493         {
3494           temp = expand_absneg_bit (NEG, float_mode, op0, target);
3495           if (temp)
3496             return temp;
3497         }
3498
3499       /* If there is no negation pattern, and we have no negative zero,
3500          try subtracting from zero.  */
3501       if (!HONOR_SIGNED_ZEROS (mode))
3502         {
3503           temp = expand_binop (mode, (unoptab == negv_optab
3504                                       ? subv_optab : sub_optab),
3505                                CONST0_RTX (mode), op0, target,
3506                                unsignedp, OPTAB_DIRECT);
3507           if (temp)
3508             return temp;
3509         }
3510     }
3511
3512   /* Try calculating parity (x) as popcount (x) % 2.  */
3513   if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
3514     {
3515       temp = expand_parity (int_mode, op0, target);
3516       if (temp)
3517         return temp;
3518     }
3519
3520   /* Try implementing ffs (x) in terms of clz (x).  */
3521   if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
3522     {
3523       temp = expand_ffs (int_mode, op0, target);
3524       if (temp)
3525         return temp;
3526     }
3527
3528   /* Try implementing ctz (x) in terms of clz (x).  */
3529   if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
3530     {
3531       temp = expand_ctz (int_mode, op0, target);
3532       if (temp)
3533         return temp;
3534     }
3535
3536   if ((unoptab == ctz_optab || unoptab == ffs_optab)
3537       && optimize_insn_for_speed_p ()
3538       && is_a <scalar_int_mode> (mode, &int_mode)
3539       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
3540       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
3541           || optab_handler (ctz_optab, word_mode) != CODE_FOR_nothing))
3542     {
3543       temp = expand_doubleword_clz_ctz_ffs (int_mode, op0, target, unoptab);
3544       if (temp)
3545         return temp;
3546     }
3547
3548  try_libcall:
3549   /* Now try a library call in this mode.  */
3550   libfunc = optab_libfunc (unoptab, mode);
3551   if (libfunc)
3552     {
3553       rtx_insn *insns;
3554       rtx value;
3555       rtx eq_value;
3556       machine_mode outmode = mode;
3557
3558       /* All of these functions return small values.  Thus we choose to
3559          have them return something that isn't a double-word.  */
3560       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3561           || unoptab == clrsb_optab || unoptab == popcount_optab
3562           || unoptab == parity_optab)
3563         outmode
3564           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3565                                           optab_libfunc (unoptab, mode)));
3566
3567       start_sequence ();
3568
3569       /* Pass 1 for NO_QUEUE so we don't lose any increments
3570          if the libcall is cse'd or moved.  */
3571       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3572                                        op0, mode);
3573       insns = get_insns ();
3574       end_sequence ();
3575
3576       target = gen_reg_rtx (outmode);
3577       bool trapv = trapv_unoptab_p (unoptab);
3578       if (trapv)
3579         eq_value = NULL_RTX;
3580       else
3581         {
3582           eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3583           if (GET_MODE_UNIT_SIZE (outmode) < GET_MODE_UNIT_SIZE (mode))
3584             eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3585           else if (GET_MODE_UNIT_SIZE (outmode) > GET_MODE_UNIT_SIZE (mode))
3586             eq_value = simplify_gen_unary (ZERO_EXTEND,
3587                                            outmode, eq_value, mode);
3588         }
3589       emit_libcall_block_1 (insns, target, value, eq_value, trapv);
3590
3591       return target;
3592     }
3593
3594   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3595
3596   if (CLASS_HAS_WIDER_MODES_P (mclass))
3597     {
3598       FOR_EACH_WIDER_MODE (wider_mode, mode)
3599         {
3600           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3601               || optab_libfunc (unoptab, wider_mode))
3602             {
3603               rtx xop0 = op0;
3604               rtx_insn *last = get_last_insn ();
3605
3606               /* For certain operations, we need not actually extend
3607                  the narrow operand, as long as we will truncate the
3608                  results to the same narrowness.  */
3609               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3610                                     (unoptab == neg_optab
3611                                      || unoptab == one_cmpl_optab
3612                                      || unoptab == bswap_optab)
3613                                     && mclass == MODE_INT);
3614
3615               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3616                                   unsignedp);
3617
3618               /* If we are generating clz using wider mode, adjust the
3619                  result.  Similarly for clrsb.  */
3620               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3621                   && temp != 0)
3622                 {
3623                   scalar_int_mode wider_int_mode
3624                     = as_a <scalar_int_mode> (wider_mode);
3625                   int_mode = as_a <scalar_int_mode> (mode);
3626                   temp = expand_binop
3627                     (wider_mode, sub_optab, temp,
3628                      gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3629                                    - GET_MODE_PRECISION (int_mode),
3630                                    wider_int_mode),
3631                      target, true, OPTAB_DIRECT);
3632                 }
3633
3634               /* Likewise for bswap.  */
3635               if (unoptab == bswap_optab && temp != 0)
3636                 {
3637                   scalar_int_mode wider_int_mode
3638                     = as_a <scalar_int_mode> (wider_mode);
3639                   int_mode = as_a <scalar_int_mode> (mode);
3640                   gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3641                               == GET_MODE_BITSIZE (wider_int_mode)
3642                               && GET_MODE_PRECISION (int_mode)
3643                                  == GET_MODE_BITSIZE (int_mode));
3644
3645                   temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3646                                        GET_MODE_BITSIZE (wider_int_mode)
3647                                        - GET_MODE_BITSIZE (int_mode),
3648                                        NULL_RTX, true);
3649                 }
3650
3651               if (temp)
3652                 {
3653                   if (mclass != MODE_INT)
3654                     {
3655                       if (target == 0)
3656                         target = gen_reg_rtx (mode);
3657                       convert_move (target, temp, 0);
3658                       return target;
3659                     }
3660                   else
3661                     return gen_lowpart (mode, temp);
3662                 }
3663               else
3664                 delete_insns_since (last);
3665             }
3666         }
3667     }
3668
3669   /* One final attempt at implementing negation via subtraction,
3670      this time allowing widening of the operand.  */
3671   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3672     {
3673       rtx temp;
3674       temp = expand_binop (mode,
3675                            unoptab == negv_optab ? subv_optab : sub_optab,
3676                            CONST0_RTX (mode), op0,
3677                            target, unsignedp, OPTAB_LIB_WIDEN);
3678       if (temp)
3679         return temp;
3680     }
3681
3682   return 0;
3683 }
3684 \f
3685 /* Emit code to compute the absolute value of OP0, with result to
3686    TARGET if convenient.  (TARGET may be 0.)  The return value says
3687    where the result actually is to be found.
3688
3689    MODE is the mode of the operand; the mode of the result is
3690    different but can be deduced from MODE.
3691
3692  */
3693
3694 rtx
3695 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3696                    int result_unsignedp)
3697 {
3698   rtx temp;
3699
3700   if (GET_MODE_CLASS (mode) != MODE_INT
3701       || ! flag_trapv)
3702     result_unsignedp = 1;
3703
3704   /* First try to do it with a special abs instruction.  */
3705   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3706                       op0, target, 0);
3707   if (temp != 0)
3708     return temp;
3709
3710   /* For floating point modes, try clearing the sign bit.  */
3711   scalar_float_mode float_mode;
3712   if (is_a <scalar_float_mode> (mode, &float_mode))
3713     {
3714       temp = expand_absneg_bit (ABS, float_mode, op0, target);
3715       if (temp)
3716         return temp;
3717     }
3718
3719   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3720   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3721       && !HONOR_SIGNED_ZEROS (mode))
3722     {
3723       rtx_insn *last = get_last_insn ();
3724
3725       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3726                           op0, NULL_RTX, 0);
3727       if (temp != 0)
3728         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3729                              OPTAB_WIDEN);
3730
3731       if (temp != 0)
3732         return temp;
3733
3734       delete_insns_since (last);
3735     }
3736
3737   /* If this machine has expensive jumps, we can do integer absolute
3738      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3739      where W is the width of MODE.  */
3740
3741   scalar_int_mode int_mode;
3742   if (is_int_mode (mode, &int_mode)
3743       && BRANCH_COST (optimize_insn_for_speed_p (),
3744                       false) >= 2)
3745     {
3746       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3747                                    GET_MODE_PRECISION (int_mode) - 1,
3748                                    NULL_RTX, 0);
3749
3750       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3751                            OPTAB_LIB_WIDEN);
3752       if (temp != 0)
3753         temp = expand_binop (int_mode,
3754                              result_unsignedp ? sub_optab : subv_optab,
3755                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3756
3757       if (temp != 0)
3758         return temp;
3759     }
3760
3761   return NULL_RTX;
3762 }
3763
3764 rtx
3765 expand_abs (machine_mode mode, rtx op0, rtx target,
3766             int result_unsignedp, int safe)
3767 {
3768   rtx temp;
3769   rtx_code_label *op1;
3770
3771   if (GET_MODE_CLASS (mode) != MODE_INT
3772       || ! flag_trapv)
3773     result_unsignedp = 1;
3774
3775   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3776   if (temp != 0)
3777     return temp;
3778
3779   /* If that does not win, use conditional jump and negate.  */
3780
3781   /* It is safe to use the target if it is the same
3782      as the source if this is also a pseudo register */
3783   if (op0 == target && REG_P (op0)
3784       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3785     safe = 1;
3786
3787   op1 = gen_label_rtx ();
3788   if (target == 0 || ! safe
3789       || GET_MODE (target) != mode
3790       || (MEM_P (target) && MEM_VOLATILE_P (target))
3791       || (REG_P (target)
3792           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3793     target = gen_reg_rtx (mode);
3794
3795   emit_move_insn (target, op0);
3796   NO_DEFER_POP;
3797
3798   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3799                            NULL_RTX, NULL, op1,
3800                            profile_probability::uninitialized ());
3801
3802   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3803                      target, target, 0);
3804   if (op0 != target)
3805     emit_move_insn (target, op0);
3806   emit_label (op1);
3807   OK_DEFER_POP;
3808   return target;
3809 }
3810
3811 /* Emit code to compute the one's complement absolute value of OP0
3812    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3813    (TARGET may be NULL_RTX.)  The return value says where the result
3814    actually is to be found.
3815
3816    MODE is the mode of the operand; the mode of the result is
3817    different but can be deduced from MODE.  */
3818
3819 rtx
3820 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3821 {
3822   rtx temp;
3823
3824   /* Not applicable for floating point modes.  */
3825   if (FLOAT_MODE_P (mode))
3826     return NULL_RTX;
3827
3828   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3829   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3830     {
3831       rtx_insn *last = get_last_insn ();
3832
3833       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3834       if (temp != 0)
3835         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3836                              OPTAB_WIDEN);
3837
3838       if (temp != 0)
3839         return temp;
3840
3841       delete_insns_since (last);
3842     }
3843
3844   /* If this machine has expensive jumps, we can do one's complement
3845      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3846
3847   scalar_int_mode int_mode;
3848   if (is_int_mode (mode, &int_mode)
3849       && BRANCH_COST (optimize_insn_for_speed_p (),
3850                      false) >= 2)
3851     {
3852       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3853                                    GET_MODE_PRECISION (int_mode) - 1,
3854                                    NULL_RTX, 0);
3855
3856       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3857                            OPTAB_LIB_WIDEN);
3858
3859       if (temp != 0)
3860         return temp;
3861     }
3862
3863   return NULL_RTX;
3864 }
3865
3866 /* A subroutine of expand_copysign, perform the copysign operation using the
3867    abs and neg primitives advertised to exist on the target.  The assumption
3868    is that we have a split register file, and leaving op0 in fp registers,
3869    and not playing with subregs so much, will help the register allocator.  */
3870
3871 static rtx
3872 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3873                         int bitpos, bool op0_is_abs)
3874 {
3875   scalar_int_mode imode;
3876   enum insn_code icode;
3877   rtx sign;
3878   rtx_code_label *label;
3879
3880   if (target == op1)
3881     target = NULL_RTX;
3882
3883   /* Check if the back end provides an insn that handles signbit for the
3884      argument's mode. */
3885   icode = optab_handler (signbit_optab, mode);
3886   if (icode != CODE_FOR_nothing)
3887     {
3888       imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3889       sign = gen_reg_rtx (imode);
3890       emit_unop_insn (icode, sign, op1, UNKNOWN);
3891     }
3892   else
3893     {
3894       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3895         {
3896           if (!int_mode_for_mode (mode).exists (&imode))
3897             return NULL_RTX;
3898           op1 = gen_lowpart (imode, op1);
3899         }
3900       else
3901         {
3902           int word;
3903
3904           imode = word_mode;
3905           if (FLOAT_WORDS_BIG_ENDIAN)
3906             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3907           else
3908             word = bitpos / BITS_PER_WORD;
3909           bitpos = bitpos % BITS_PER_WORD;
3910           op1 = operand_subword_force (op1, word, mode);
3911         }
3912
3913       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3914       sign = expand_binop (imode, and_optab, op1,
3915                            immed_wide_int_const (mask, imode),
3916                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3917     }
3918
3919   if (!op0_is_abs)
3920     {
3921       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3922       if (op0 == NULL)
3923         return NULL_RTX;
3924       target = op0;
3925     }
3926   else
3927     {
3928       if (target == NULL_RTX)
3929         target = copy_to_reg (op0);
3930       else
3931         emit_move_insn (target, op0);
3932     }
3933
3934   label = gen_label_rtx ();
3935   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3936
3937   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3938     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3939   else
3940     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3941   if (op0 != target)
3942     emit_move_insn (target, op0);
3943
3944   emit_label (label);
3945
3946   return target;
3947 }
3948
3949
3950 /* A subroutine of expand_copysign, perform the entire copysign operation
3951    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3952    is true if op0 is known to have its sign bit clear.  */
3953
3954 static rtx
3955 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3956                      int bitpos, bool op0_is_abs)
3957 {
3958   scalar_int_mode imode;
3959   int word, nwords, i;
3960   rtx temp;
3961   rtx_insn *insns;
3962
3963   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3964     {
3965       if (!int_mode_for_mode (mode).exists (&imode))
3966         return NULL_RTX;
3967       word = 0;
3968       nwords = 1;
3969     }
3970   else
3971     {
3972       imode = word_mode;
3973
3974       if (FLOAT_WORDS_BIG_ENDIAN)
3975         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3976       else
3977         word = bitpos / BITS_PER_WORD;
3978       bitpos = bitpos % BITS_PER_WORD;
3979       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3980     }
3981
3982   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3983
3984   if (target == 0
3985       || target == op0
3986       || target == op1
3987       || reg_overlap_mentioned_p (target, op0)
3988       || reg_overlap_mentioned_p (target, op1)
3989       || (nwords > 1 && !valid_multiword_target_p (target)))
3990     target = gen_reg_rtx (mode);
3991
3992   if (nwords > 1)
3993     {
3994       start_sequence ();
3995
3996       for (i = 0; i < nwords; ++i)
3997         {
3998           rtx targ_piece = operand_subword (target, i, 1, mode);
3999           rtx op0_piece = operand_subword_force (op0, i, mode);
4000
4001           if (i == word)
4002             {
4003               if (!op0_is_abs)
4004                 op0_piece
4005                   = expand_binop (imode, and_optab, op0_piece,
4006                                   immed_wide_int_const (~mask, imode),
4007                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
4008               op1 = expand_binop (imode, and_optab,
4009                                   operand_subword_force (op1, i, mode),
4010                                   immed_wide_int_const (mask, imode),
4011                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
4012
4013               temp = expand_binop (imode, ior_optab, op0_piece, op1,
4014                                    targ_piece, 1, OPTAB_LIB_WIDEN);
4015               if (temp != targ_piece)
4016                 emit_move_insn (targ_piece, temp);
4017             }
4018           else
4019             emit_move_insn (targ_piece, op0_piece);
4020         }
4021
4022       insns = get_insns ();
4023       end_sequence ();
4024
4025       emit_insn (insns);
4026     }
4027   else
4028     {
4029       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
4030                           immed_wide_int_const (mask, imode),
4031                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
4032
4033       op0 = gen_lowpart (imode, op0);
4034       if (!op0_is_abs)
4035         op0 = expand_binop (imode, and_optab, op0,
4036                             immed_wide_int_const (~mask, imode),
4037                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
4038
4039       temp = expand_binop (imode, ior_optab, op0, op1,
4040                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
4041       target = lowpart_subreg_maybe_copy (mode, temp, imode);
4042     }
4043
4044   return target;
4045 }
4046
4047 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
4048    scalar floating point mode.  Return NULL if we do not know how to
4049    expand the operation inline.  */
4050
4051 rtx
4052 expand_copysign (rtx op0, rtx op1, rtx target)
4053 {
4054   scalar_float_mode mode;
4055   const struct real_format *fmt;
4056   bool op0_is_abs;
4057   rtx temp;
4058
4059   mode = as_a <scalar_float_mode> (GET_MODE (op0));
4060   gcc_assert (GET_MODE (op1) == mode);
4061
4062   /* First try to do it with a special instruction.  */
4063   temp = expand_binop (mode, copysign_optab, op0, op1,
4064                        target, 0, OPTAB_DIRECT);
4065   if (temp)
4066     return temp;
4067
4068   fmt = REAL_MODE_FORMAT (mode);
4069   if (fmt == NULL || !fmt->has_signed_zero)
4070     return NULL_RTX;
4071
4072   op0_is_abs = false;
4073   if (CONST_DOUBLE_AS_FLOAT_P (op0))
4074     {
4075       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
4076         op0 = simplify_unary_operation (ABS, mode, op0, mode);
4077       op0_is_abs = true;
4078     }
4079
4080   if (fmt->signbit_ro >= 0
4081       && (CONST_DOUBLE_AS_FLOAT_P (op0)
4082           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
4083               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
4084     {
4085       temp = expand_copysign_absneg (mode, op0, op1, target,
4086                                      fmt->signbit_ro, op0_is_abs);
4087       if (temp)
4088         return temp;
4089     }
4090
4091   if (fmt->signbit_rw < 0)
4092     return NULL_RTX;
4093   return expand_copysign_bit (mode, op0, op1, target,
4094                               fmt->signbit_rw, op0_is_abs);
4095 }
4096 \f
4097 /* Generate an instruction whose insn-code is INSN_CODE,
4098    with two operands: an output TARGET and an input OP0.
4099    TARGET *must* be nonzero, and the output is always stored there.
4100    CODE is an rtx code such that (CODE OP0) is an rtx that describes
4101    the value that is stored into TARGET.
4102
4103    Return false if expansion failed.  */
4104
4105 bool
4106 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
4107                       enum rtx_code code)
4108 {
4109   class expand_operand ops[2];
4110   rtx_insn *pat;
4111
4112   create_output_operand (&ops[0], target, GET_MODE (target));
4113   create_input_operand (&ops[1], op0, GET_MODE (op0));
4114   pat = maybe_gen_insn (icode, 2, ops);
4115   if (!pat)
4116     return false;
4117
4118   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
4119       && code != UNKNOWN)
4120     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX,
4121                     GET_MODE (op0));
4122
4123   emit_insn (pat);
4124
4125   if (ops[0].value != target)
4126     emit_move_insn (target, ops[0].value);
4127   return true;
4128 }
4129 /* Generate an instruction whose insn-code is INSN_CODE,
4130    with two operands: an output TARGET and an input OP0.
4131    TARGET *must* be nonzero, and the output is always stored there.
4132    CODE is an rtx code such that (CODE OP0) is an rtx that describes
4133    the value that is stored into TARGET.  */
4134
4135 void
4136 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
4137 {
4138   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
4139   gcc_assert (ok);
4140 }
4141 \f
4142 struct no_conflict_data
4143 {
4144   rtx target;
4145   rtx_insn *first, *insn;
4146   bool must_stay;
4147 };
4148
4149 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
4150    the currently examined clobber / store has to stay in the list of
4151    insns that constitute the actual libcall block.  */
4152 static void
4153 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
4154 {
4155   struct no_conflict_data *p= (struct no_conflict_data *) p0;
4156
4157   /* If this inns directly contributes to setting the target, it must stay.  */
4158   if (reg_overlap_mentioned_p (p->target, dest))
4159     p->must_stay = true;
4160   /* If we haven't committed to keeping any other insns in the list yet,
4161      there is nothing more to check.  */
4162   else if (p->insn == p->first)
4163     return;
4164   /* If this insn sets / clobbers a register that feeds one of the insns
4165      already in the list, this insn has to stay too.  */
4166   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
4167            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
4168            || reg_used_between_p (dest, p->first, p->insn)
4169            /* Likewise if this insn depends on a register set by a previous
4170               insn in the list, or if it sets a result (presumably a hard
4171               register) that is set or clobbered by a previous insn.
4172               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
4173               SET_DEST perform the former check on the address, and the latter
4174               check on the MEM.  */
4175            || (GET_CODE (set) == SET
4176                && (modified_in_p (SET_SRC (set), p->first)
4177                    || modified_in_p (SET_DEST (set), p->first)
4178                    || modified_between_p (SET_SRC (set), p->first, p->insn)
4179                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
4180     p->must_stay = true;
4181 }
4182
4183 \f
4184 /* Emit code to make a call to a constant function or a library call.
4185
4186    INSNS is a list containing all insns emitted in the call.
4187    These insns leave the result in RESULT.  Our block is to copy RESULT
4188    to TARGET, which is logically equivalent to EQUIV.
4189
4190    We first emit any insns that set a pseudo on the assumption that these are
4191    loading constants into registers; doing so allows them to be safely cse'ed
4192    between blocks.  Then we emit all the other insns in the block, followed by
4193    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
4194    note with an operand of EQUIV.  */
4195
4196 static void
4197 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
4198                       bool equiv_may_trap)
4199 {
4200   rtx final_dest = target;
4201   rtx_insn *next, *last, *insn;
4202
4203   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
4204      into a MEM later.  Protect the libcall block from this change.  */
4205   if (! REG_P (target) || REG_USERVAR_P (target))
4206     target = gen_reg_rtx (GET_MODE (target));
4207
4208   /* If we're using non-call exceptions, a libcall corresponding to an
4209      operation that may trap may also trap.  */
4210   /* ??? See the comment in front of make_reg_eh_region_note.  */
4211   if (cfun->can_throw_non_call_exceptions
4212       && (equiv_may_trap || may_trap_p (equiv)))
4213     {
4214       for (insn = insns; insn; insn = NEXT_INSN (insn))
4215         if (CALL_P (insn))
4216           {
4217             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
4218             if (note)
4219               {
4220                 int lp_nr = INTVAL (XEXP (note, 0));
4221                 if (lp_nr == 0 || lp_nr == INT_MIN)
4222                   remove_note (insn, note);
4223               }
4224           }
4225     }
4226   else
4227     {
4228       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
4229          reg note to indicate that this call cannot throw or execute a nonlocal
4230          goto (unless there is already a REG_EH_REGION note, in which case
4231          we update it).  */
4232       for (insn = insns; insn; insn = NEXT_INSN (insn))
4233         if (CALL_P (insn))
4234           make_reg_eh_region_note_nothrow_nononlocal (insn);
4235     }
4236
4237   /* First emit all insns that set pseudos.  Remove them from the list as
4238      we go.  Avoid insns that set pseudos which were referenced in previous
4239      insns.  These can be generated by move_by_pieces, for example,
4240      to update an address.  Similarly, avoid insns that reference things
4241      set in previous insns.  */
4242
4243   for (insn = insns; insn; insn = next)
4244     {
4245       rtx set = single_set (insn);
4246
4247       next = NEXT_INSN (insn);
4248
4249       if (set != 0 && REG_P (SET_DEST (set))
4250           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
4251         {
4252           struct no_conflict_data data;
4253
4254           data.target = const0_rtx;
4255           data.first = insns;
4256           data.insn = insn;
4257           data.must_stay = 0;
4258           note_stores (insn, no_conflict_move_test, &data);
4259           if (! data.must_stay)
4260             {
4261               if (PREV_INSN (insn))
4262                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
4263               else
4264                 insns = next;
4265
4266               if (next)
4267                 SET_PREV_INSN (next) = PREV_INSN (insn);
4268
4269               add_insn (insn);
4270             }
4271         }
4272
4273       /* Some ports use a loop to copy large arguments onto the stack.
4274          Don't move anything outside such a loop.  */
4275       if (LABEL_P (insn))
4276         break;
4277     }
4278
4279   /* Write the remaining insns followed by the final copy.  */
4280   for (insn = insns; insn; insn = next)
4281     {
4282       next = NEXT_INSN (insn);
4283
4284       add_insn (insn);
4285     }
4286
4287   last = emit_move_insn (target, result);
4288   if (equiv)
4289     set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
4290
4291   if (final_dest != target)
4292     emit_move_insn (final_dest, target);
4293 }
4294
4295 void
4296 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
4297 {
4298   emit_libcall_block_1 (insns, target, result, equiv, false);
4299 }
4300 \f
4301 /* True if we can perform a comparison of mode MODE straightforwardly.
4302    PURPOSE describes how this comparison will be used.  CODE is the rtx
4303    comparison code we will be using.
4304
4305    ??? Actually, CODE is slightly weaker than that.  A target is still
4306    required to implement all of the normal bcc operations, but not
4307    required to implement all (or any) of the unordered bcc operations.  */
4308
4309 bool
4310 can_compare_p (enum rtx_code code, machine_mode mode,
4311                enum can_compare_purpose purpose)
4312 {
4313   rtx test;
4314   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4315   do
4316     {
4317       enum insn_code icode;
4318
4319       if (purpose == ccp_jump
4320           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4321           && insn_operand_matches (icode, 0, test))
4322         return true;
4323       if (purpose == ccp_store_flag
4324           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4325           && insn_operand_matches (icode, 1, test))
4326         return true;
4327       if (purpose == ccp_cmov
4328           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4329         return true;
4330
4331       mode = GET_MODE_WIDER_MODE (mode).else_void ();
4332       PUT_MODE (test, mode);
4333     }
4334   while (mode != VOIDmode);
4335
4336   return false;
4337 }
4338
4339 /* Return whether RTL code CODE corresponds to an unsigned optab.  */
4340
4341 static bool
4342 unsigned_optab_p (enum rtx_code code)
4343 {
4344   return code == LTU || code == LEU || code == GTU || code == GEU;
4345 }
4346
4347 /* Return whether the backend-emitted comparison for code CODE, comparing
4348    operands of mode VALUE_MODE and producing a result with MASK_MODE, matches
4349    operand OPNO of pattern ICODE.  */
4350
4351 static bool
4352 insn_predicate_matches_p (enum insn_code icode, unsigned int opno,
4353                           enum rtx_code code, machine_mode mask_mode,
4354                           machine_mode value_mode)
4355 {
4356   rtx reg1 = alloca_raw_REG (value_mode, LAST_VIRTUAL_REGISTER + 1);
4357   rtx reg2 = alloca_raw_REG (value_mode, LAST_VIRTUAL_REGISTER + 2);
4358   rtx test = alloca_rtx_fmt_ee (code, mask_mode, reg1, reg2);
4359   return insn_operand_matches (icode, opno, test);
4360 }
4361
4362 /* Return whether the backend can emit a vector comparison (vec_cmp/vec_cmpu)
4363    for code CODE, comparing operands of mode VALUE_MODE and producing a result
4364    with MASK_MODE.  */
4365
4366 bool
4367 can_vec_cmp_compare_p (enum rtx_code code, machine_mode value_mode,
4368                        machine_mode mask_mode)
4369 {
4370   enum insn_code icode
4371       = get_vec_cmp_icode (value_mode, mask_mode, unsigned_optab_p (code));
4372   if (icode == CODE_FOR_nothing)
4373     return false;
4374
4375   return insn_predicate_matches_p (icode, 1, code, mask_mode, value_mode);
4376 }
4377
4378 /* Return whether the backend can emit a vector comparison (vcond/vcondu) for
4379    code CODE, comparing operands of mode CMP_OP_MODE and producing a result
4380    with VALUE_MODE.  */
4381
4382 bool
4383 can_vcond_compare_p (enum rtx_code code, machine_mode value_mode,
4384                      machine_mode cmp_op_mode)
4385 {
4386   enum insn_code icode
4387       = get_vcond_icode (value_mode, cmp_op_mode, unsigned_optab_p (code));
4388   if (icode == CODE_FOR_nothing)
4389     return false;
4390
4391   return insn_predicate_matches_p (icode, 3, code, value_mode, cmp_op_mode);
4392 }
4393
4394 /* Return whether the backend can emit vector set instructions for inserting
4395    element into vector at variable index position.  */
4396
4397 bool
4398 can_vec_set_var_idx_p (machine_mode vec_mode)
4399 {
4400   if (!VECTOR_MODE_P (vec_mode))
4401     return false;
4402
4403   machine_mode inner_mode = GET_MODE_INNER (vec_mode);
4404
4405   rtx reg1 = alloca_raw_REG (vec_mode, LAST_VIRTUAL_REGISTER + 1);
4406   rtx reg2 = alloca_raw_REG (inner_mode, LAST_VIRTUAL_REGISTER + 2);
4407
4408   enum insn_code icode = optab_handler (vec_set_optab, vec_mode);
4409
4410   const struct insn_data_d *data = &insn_data[icode];
4411   machine_mode idx_mode = data->operand[2].mode;
4412
4413   rtx reg3 = alloca_raw_REG (idx_mode, LAST_VIRTUAL_REGISTER + 3);
4414
4415   return icode != CODE_FOR_nothing && insn_operand_matches (icode, 0, reg1)
4416          && insn_operand_matches (icode, 1, reg2)
4417          && insn_operand_matches (icode, 2, reg3);
4418 }
4419
4420 /* Return whether the backend can emit a vec_extract instruction with
4421    a non-constant index.  */
4422 bool
4423 can_vec_extract_var_idx_p (machine_mode vec_mode, machine_mode extr_mode)
4424 {
4425   if (!VECTOR_MODE_P (vec_mode))
4426     return false;
4427
4428   rtx reg1 = alloca_raw_REG (extr_mode, LAST_VIRTUAL_REGISTER + 1);
4429   rtx reg2 = alloca_raw_REG (vec_mode, LAST_VIRTUAL_REGISTER + 2);
4430
4431   enum insn_code icode = convert_optab_handler (vec_extract_optab,
4432                                                 vec_mode, extr_mode);
4433
4434   const struct insn_data_d *data = &insn_data[icode];
4435   machine_mode idx_mode = data->operand[2].mode;
4436
4437   rtx reg3 = alloca_raw_REG (idx_mode, LAST_VIRTUAL_REGISTER + 3);
4438
4439   return icode != CODE_FOR_nothing && insn_operand_matches (icode, 0, reg1)
4440          && insn_operand_matches (icode, 1, reg2)
4441          && insn_operand_matches (icode, 2, reg3);
4442 }
4443
4444 /* This function is called when we are going to emit a compare instruction that
4445    compares the values found in X and Y, using the rtl operator COMPARISON.
4446
4447    If they have mode BLKmode, then SIZE specifies the size of both operands.
4448
4449    UNSIGNEDP nonzero says that the operands are unsigned;
4450    this matters if they need to be widened (as given by METHODS).
4451
4452    *PTEST is where the resulting comparison RTX is returned or NULL_RTX
4453    if we failed to produce one.
4454
4455    *PMODE is the mode of the inputs (in case they are const_int).
4456
4457    This function performs all the setup necessary so that the caller only has
4458    to emit a single comparison insn.  This setup can involve doing a BLKmode
4459    comparison or emitting a library call to perform the comparison if no insn
4460    is available to handle it.
4461    The values which are passed in through pointers can be modified; the caller
4462    should perform the comparison on the modified values.  Constant
4463    comparisons must have already been folded.  */
4464
4465 static void
4466 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4467                   int unsignedp, enum optab_methods methods,
4468                   rtx *ptest, machine_mode *pmode)
4469 {
4470   machine_mode mode = *pmode;
4471   rtx libfunc, test;
4472   machine_mode cmp_mode;
4473
4474   /* The other methods are not needed.  */
4475   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4476               || methods == OPTAB_LIB_WIDEN);
4477
4478   if (CONST_SCALAR_INT_P (y))
4479     canonicalize_comparison (mode, &comparison, &y);
4480
4481   /* If we are optimizing, force expensive constants into a register.  */
4482   if (CONSTANT_P (x) && optimize
4483       && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
4484           > COSTS_N_INSNS (1))
4485       && can_create_pseudo_p ())
4486     x = force_reg (mode, x);
4487
4488   if (CONSTANT_P (y) && optimize
4489       && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
4490           > COSTS_N_INSNS (1))
4491       && can_create_pseudo_p ())
4492     y = force_reg (mode, y);
4493
4494   /* Don't let both operands fail to indicate the mode.  */
4495   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4496     x = force_reg (mode, x);
4497   if (mode == VOIDmode)
4498     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4499
4500   /* Handle all BLKmode compares.  */
4501
4502   if (mode == BLKmode)
4503     {
4504       machine_mode result_mode;
4505       enum insn_code cmp_code;
4506       rtx result;
4507       rtx opalign
4508         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4509
4510       gcc_assert (size);
4511
4512       /* Try to use a memory block compare insn - either cmpstr
4513          or cmpmem will do.  */
4514       opt_scalar_int_mode cmp_mode_iter;
4515       FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
4516         {
4517           scalar_int_mode cmp_mode = cmp_mode_iter.require ();
4518           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4519           if (cmp_code == CODE_FOR_nothing)
4520             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4521           if (cmp_code == CODE_FOR_nothing)
4522             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4523           if (cmp_code == CODE_FOR_nothing)
4524             continue;
4525
4526           /* Must make sure the size fits the insn's mode.  */
4527           if (CONST_INT_P (size)
4528               ? UINTVAL (size) > GET_MODE_MASK (cmp_mode)
4529               : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
4530                  > GET_MODE_BITSIZE (cmp_mode)))
4531             continue;
4532
4533           result_mode = insn_data[cmp_code].operand[0].mode;
4534           result = gen_reg_rtx (result_mode);
4535           size = convert_to_mode (cmp_mode, size, 1);
4536           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4537
4538           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4539           *pmode = result_mode;
4540           return;
4541         }
4542
4543       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4544         goto fail;
4545
4546       /* Otherwise call a library function.  */
4547       result = emit_block_comp_via_libcall (x, y, size);
4548
4549       x = result;
4550       y = const0_rtx;
4551       mode = TYPE_MODE (integer_type_node);
4552       methods = OPTAB_LIB_WIDEN;
4553       unsignedp = false;
4554     }
4555
4556   /* Don't allow operands to the compare to trap, as that can put the
4557      compare and branch in different basic blocks.  */
4558   if (cfun->can_throw_non_call_exceptions)
4559     {
4560       if (!can_create_pseudo_p () && (may_trap_p (x) || may_trap_p (y)))
4561         goto fail;
4562       if (may_trap_p (x))
4563         x = copy_to_reg (x);
4564       if (may_trap_p (y))
4565         y = copy_to_reg (y);
4566     }
4567
4568   if (GET_MODE_CLASS (mode) == MODE_CC)
4569     {
4570       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
4571       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4572       if (icode != CODE_FOR_nothing
4573           && insn_operand_matches (icode, 0, test))
4574         {
4575           *ptest = test;
4576           return;
4577         }
4578       else
4579         goto fail;
4580     }
4581
4582   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4583   FOR_EACH_WIDER_MODE_FROM (cmp_mode, mode)
4584     {
4585       enum insn_code icode;
4586       icode = optab_handler (cbranch_optab, cmp_mode);
4587       if (icode != CODE_FOR_nothing
4588           && insn_operand_matches (icode, 0, test))
4589         {
4590           rtx_insn *last = get_last_insn ();
4591           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4592           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4593           if (op0 && op1
4594               && insn_operand_matches (icode, 1, op0)
4595               && insn_operand_matches (icode, 2, op1))
4596             {
4597               XEXP (test, 0) = op0;
4598               XEXP (test, 1) = op1;
4599               *ptest = test;
4600               *pmode = cmp_mode;
4601               return;
4602             }
4603           delete_insns_since (last);
4604         }
4605
4606       if (methods == OPTAB_DIRECT)
4607         break;
4608     }
4609
4610   if (methods != OPTAB_LIB_WIDEN)
4611     goto fail;
4612
4613   if (SCALAR_FLOAT_MODE_P (mode))
4614     {
4615       /* Small trick if UNORDERED isn't implemented by the hardware.  */
4616       if (comparison == UNORDERED && rtx_equal_p (x, y))
4617         {
4618           prepare_cmp_insn (x, y, UNLT, NULL_RTX, unsignedp, OPTAB_WIDEN,
4619                             ptest, pmode);
4620           if (*ptest)
4621             return;
4622         }
4623
4624       prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4625     }
4626   else
4627     {
4628       rtx result;
4629       machine_mode ret_mode;
4630
4631       /* Handle a libcall just for the mode we are using.  */
4632       libfunc = optab_libfunc (cmp_optab, mode);
4633       gcc_assert (libfunc);
4634
4635       /* If we want unsigned, and this mode has a distinct unsigned
4636          comparison routine, use that.  */
4637       if (unsignedp)
4638         {
4639           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4640           if (ulibfunc)
4641             libfunc = ulibfunc;
4642         }
4643
4644       ret_mode = targetm.libgcc_cmp_return_mode ();
4645       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4646                                         ret_mode, x, mode, y, mode);
4647
4648       /* There are two kinds of comparison routines. Biased routines
4649          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4650          of gcc expect that the comparison operation is equivalent
4651          to the modified comparison. For signed comparisons compare the
4652          result against 1 in the biased case, and zero in the unbiased
4653          case. For unsigned comparisons always compare against 1 after
4654          biasing the unbiased result by adding 1. This gives us a way to
4655          represent LTU.
4656          The comparisons in the fixed-point helper library are always
4657          biased.  */
4658       x = result;
4659       y = const1_rtx;
4660
4661       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4662         {
4663           if (unsignedp)
4664             x = plus_constant (ret_mode, result, 1);
4665           else
4666             y = const0_rtx;
4667         }
4668
4669       *pmode = ret_mode;
4670       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4671                         ptest, pmode);
4672     }
4673
4674   return;
4675
4676  fail:
4677   *ptest = NULL_RTX;
4678 }
4679
4680 /* Before emitting an insn with code ICODE, make sure that X, which is going
4681    to be used for operand OPNUM of the insn, is converted from mode MODE to
4682    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4683    that it is accepted by the operand predicate.  Return the new value.  */
4684
4685 rtx
4686 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4687                  machine_mode wider_mode, int unsignedp)
4688 {
4689   if (mode != wider_mode)
4690     x = convert_modes (wider_mode, mode, x, unsignedp);
4691
4692   if (!insn_operand_matches (icode, opnum, x))
4693     {
4694       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4695       if (reload_completed)
4696         return NULL_RTX;
4697       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4698         return NULL_RTX;
4699       x = copy_to_mode_reg (op_mode, x);
4700     }
4701
4702   return x;
4703 }
4704
4705 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4706    we can do the branch.  */
4707
4708 static void
4709 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
4710                           direct_optab cmp_optab, profile_probability prob,
4711                           bool test_branch)
4712 {
4713   machine_mode optab_mode;
4714   enum mode_class mclass;
4715   enum insn_code icode;
4716   rtx_insn *insn;
4717
4718   mclass = GET_MODE_CLASS (mode);
4719   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4720   icode = optab_handler (cmp_optab, optab_mode);
4721
4722   gcc_assert (icode != CODE_FOR_nothing);
4723   gcc_assert (test_branch || insn_operand_matches (icode, 0, test));
4724   if (test_branch)
4725     insn = emit_jump_insn (GEN_FCN (icode) (XEXP (test, 0),
4726                                             XEXP (test, 1), label));
4727   else
4728     insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4729                                             XEXP (test, 1), label));
4730
4731   if (prob.initialized_p ()
4732       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4733       && insn
4734       && JUMP_P (insn)
4735       && any_condjump_p (insn)
4736       && !find_reg_note (insn, REG_BR_PROB, 0))
4737     add_reg_br_prob_note (insn, prob);
4738 }
4739
4740 /* PTEST points to a comparison that compares its first operand with zero.
4741    Check to see if it can be performed as a bit-test-and-branch instead.
4742    On success, return the instruction that performs the bit-test-and-branch
4743    and replace the second operand of *PTEST with the bit number to test.
4744    On failure, return CODE_FOR_nothing and leave *PTEST unchanged.
4745
4746    Note that the comparison described by *PTEST should not be taken
4747    literally after a successful return.  *PTEST is just a convenient
4748    place to store the two operands of the bit-and-test.
4749
4750    VAL must contain the original tree expression for the first operand
4751    of *PTEST.  */
4752
4753 static enum insn_code
4754 validate_test_and_branch (tree val, rtx *ptest, machine_mode *pmode, optab *res)
4755 {
4756   if (!val || TREE_CODE (val) != SSA_NAME)
4757     return CODE_FOR_nothing;
4758
4759   machine_mode mode = TYPE_MODE (TREE_TYPE (val));
4760   rtx test = *ptest;
4761   direct_optab optab;
4762
4763   if (GET_CODE (test) == EQ)
4764     optab = tbranch_eq_optab;
4765   else if (GET_CODE (test) == NE)
4766     optab = tbranch_ne_optab;
4767   else
4768     return CODE_FOR_nothing;
4769
4770   *res = optab;
4771
4772   /* If the target supports the testbit comparison directly, great.  */
4773   auto icode = direct_optab_handler (optab, mode);
4774   if (icode == CODE_FOR_nothing)
4775     return icode;
4776
4777   if (tree_zero_one_valued_p (val))
4778     {
4779       auto pos = BITS_BIG_ENDIAN ? GET_MODE_BITSIZE (mode) - 1 : 0;
4780       XEXP (test, 1) = gen_int_mode (pos, mode);
4781       *ptest = test;
4782       *pmode = mode;
4783       return icode;
4784     }
4785
4786   wide_int wcst = get_nonzero_bits (val);
4787   if (wcst == -1)
4788     return CODE_FOR_nothing;
4789
4790   int bitpos;
4791
4792   if ((bitpos = wi::exact_log2 (wcst)) == -1)
4793     return CODE_FOR_nothing;
4794
4795   auto pos = BITS_BIG_ENDIAN ? GET_MODE_BITSIZE (mode) - 1 - bitpos : bitpos;
4796   XEXP (test, 1) = gen_int_mode (pos, mode);
4797   *ptest = test;
4798   *pmode = mode;
4799   return icode;
4800 }
4801
4802 /* Generate code to compare X with Y so that the condition codes are
4803    set and to jump to LABEL if the condition is true.  If X is a
4804    constant and Y is not a constant, then the comparison is swapped to
4805    ensure that the comparison RTL has the canonical form.
4806
4807    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4808    need to be widened.  UNSIGNEDP is also used to select the proper
4809    branch condition code.
4810
4811    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4812
4813    MODE is the mode of the inputs (in case they are const_int).
4814
4815    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4816    It will be potentially converted into an unsigned variant based on
4817    UNSIGNEDP to select a proper jump instruction.
4818
4819    PROB is the probability of jumping to LABEL.  If the comparison is against
4820    zero then VAL contains the expression from which the non-zero RTL is
4821    derived.  */
4822
4823 void
4824 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4825                          machine_mode mode, int unsignedp, tree val, rtx label,
4826                          profile_probability prob)
4827 {
4828   rtx op0 = x, op1 = y;
4829   rtx test;
4830
4831   /* Swap operands and condition to ensure canonical RTL.  */
4832   if (swap_commutative_operands_p (x, y)
4833       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4834     {
4835       op0 = y, op1 = x;
4836       comparison = swap_condition (comparison);
4837     }
4838
4839   /* If OP0 is still a constant, then both X and Y must be constants
4840      or the opposite comparison is not supported.  Force X into a register
4841      to create canonical RTL.  */
4842   if (CONSTANT_P (op0))
4843     op0 = force_reg (mode, op0);
4844
4845   if (unsignedp)
4846     comparison = unsigned_condition (comparison);
4847
4848   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4849                     &test, &mode);
4850
4851   /* Check if we're comparing a truth type with 0, and if so check if
4852      the target supports tbranch.  */
4853   machine_mode tmode = mode;
4854   direct_optab optab;
4855   if (op1 == CONST0_RTX (GET_MODE (op1))
4856       && validate_test_and_branch (val, &test, &tmode,
4857                                    &optab) != CODE_FOR_nothing)
4858     {
4859       emit_cmp_and_jump_insn_1 (test, tmode, label, optab, prob, true);
4860       return;
4861     }
4862
4863   emit_cmp_and_jump_insn_1 (test, mode, label, cbranch_optab, prob, false);
4864 }
4865
4866 /* Overloaded version of emit_cmp_and_jump_insns in which VAL is unknown.  */
4867
4868 void
4869 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4870                          machine_mode mode, int unsignedp, rtx label,
4871                          profile_probability prob)
4872 {
4873   emit_cmp_and_jump_insns (x, y, comparison, size, mode, unsignedp, NULL,
4874                            label, prob);
4875 }
4876
4877
4878 /* Emit a library call comparison between floating point X and Y.
4879    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4880
4881 static void
4882 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4883                        rtx *ptest, machine_mode *pmode)
4884 {
4885   enum rtx_code swapped = swap_condition (comparison);
4886   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4887   machine_mode orig_mode = GET_MODE (x);
4888   machine_mode mode;
4889   rtx true_rtx, false_rtx;
4890   rtx value, target, equiv;
4891   rtx_insn *insns;
4892   rtx libfunc = 0;
4893   bool reversed_p = false;
4894   scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4895
4896   FOR_EACH_WIDER_MODE_FROM (mode, orig_mode)
4897     {
4898       if (code_to_optab (comparison)
4899           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4900         break;
4901
4902       if (code_to_optab (swapped)
4903           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4904         {
4905           std::swap (x, y);
4906           comparison = swapped;
4907           break;
4908         }
4909
4910       if (code_to_optab (reversed)
4911           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4912         {
4913           comparison = reversed;
4914           reversed_p = true;
4915           break;
4916         }
4917     }
4918
4919   gcc_assert (mode != VOIDmode);
4920
4921   if (mode != orig_mode)
4922     {
4923       x = convert_to_mode (mode, x, 0);
4924       y = convert_to_mode (mode, y, 0);
4925     }
4926
4927   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4928      the RTL.  The allows the RTL optimizers to delete the libcall if the
4929      condition can be determined at compile-time.  */
4930   if (comparison == UNORDERED
4931       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4932     {
4933       true_rtx = const_true_rtx;
4934       false_rtx = const0_rtx;
4935     }
4936   else
4937     {
4938       switch (comparison)
4939         {
4940         case EQ:
4941           true_rtx = const0_rtx;
4942           false_rtx = const_true_rtx;
4943           break;
4944
4945         case NE:
4946           true_rtx = const_true_rtx;
4947           false_rtx = const0_rtx;
4948           break;
4949
4950         case GT:
4951           true_rtx = const1_rtx;
4952           false_rtx = const0_rtx;
4953           break;
4954
4955         case GE:
4956           true_rtx = const0_rtx;
4957           false_rtx = constm1_rtx;
4958           break;
4959
4960         case LT:
4961           true_rtx = constm1_rtx;
4962           false_rtx = const0_rtx;
4963           break;
4964
4965         case LE:
4966           true_rtx = const0_rtx;
4967           false_rtx = const1_rtx;
4968           break;
4969
4970         default:
4971           gcc_unreachable ();
4972         }
4973     }
4974
4975   if (comparison == UNORDERED)
4976     {
4977       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4978       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4979       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4980                                     temp, const_true_rtx, equiv);
4981     }
4982   else
4983     {
4984       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4985       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4986         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4987                                       equiv, true_rtx, false_rtx);
4988     }
4989
4990   start_sequence ();
4991   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4992                                    cmp_mode, x, mode, y, mode);
4993   insns = get_insns ();
4994   end_sequence ();
4995
4996   target = gen_reg_rtx (cmp_mode);
4997   emit_libcall_block (insns, target, value, equiv);
4998
4999   if (comparison == UNORDERED
5000       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
5001       || reversed_p)
5002     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
5003   else
5004     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
5005
5006   *pmode = cmp_mode;
5007 }
5008 \f
5009 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
5010
5011 void
5012 emit_indirect_jump (rtx loc)
5013 {
5014   if (!targetm.have_indirect_jump ())
5015     sorry ("indirect jumps are not available on this target");
5016   else
5017     {
5018       class expand_operand ops[1];
5019       create_address_operand (&ops[0], loc);
5020       expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
5021       emit_barrier ();
5022     }
5023 }
5024 \f
5025
5026 /* Emit a conditional move instruction if the machine supports one for that
5027    condition and machine mode.
5028
5029    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
5030    the mode to use should they be constants.  If it is VOIDmode, they cannot
5031    both be constants.
5032
5033    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
5034    should be stored there.  MODE is the mode to use should they be constants.
5035    If it is VOIDmode, they cannot both be constants.
5036
5037    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
5038    is not supported.  */
5039
5040 rtx
5041 emit_conditional_move (rtx target, struct rtx_comparison comp,
5042                        rtx op2, rtx op3,
5043                        machine_mode mode, int unsignedp)
5044 {
5045   rtx comparison;
5046   rtx_insn *last;
5047   enum insn_code icode;
5048   enum rtx_code reversed;
5049
5050   /* If the two source operands are identical, that's just a move.  */
5051
5052   if (rtx_equal_p (op2, op3))
5053     {
5054       if (!target)
5055         target = gen_reg_rtx (mode);
5056
5057       emit_move_insn (target, op3);
5058       return target;
5059     }
5060
5061   /* If one operand is constant, make it the second one.  Only do this
5062      if the other operand is not constant as well.  */
5063
5064   if (swap_commutative_operands_p (comp.op0, comp.op1))
5065     {
5066       std::swap (comp.op0, comp.op1);
5067       comp.code = swap_condition (comp.code);
5068     }
5069
5070   /* get_condition will prefer to generate LT and GT even if the old
5071      comparison was against zero, so undo that canonicalization here since
5072      comparisons against zero are cheaper.  */
5073
5074   if (comp.code == LT && comp.op1 == const1_rtx)
5075     comp.code = LE, comp.op1 = const0_rtx;
5076   else if (comp.code == GT && comp.op1 == constm1_rtx)
5077     comp.code = GE, comp.op1 = const0_rtx;
5078
5079   if (comp.mode == VOIDmode)
5080     comp.mode = GET_MODE (comp.op0);
5081
5082   enum rtx_code orig_code = comp.code;
5083   bool swapped = false;
5084   if (swap_commutative_operands_p (op2, op3)
5085       && ((reversed =
5086            reversed_comparison_code_parts (comp.code, comp.op0, comp.op1, NULL))
5087           != UNKNOWN))
5088     {
5089       std::swap (op2, op3);
5090       comp.code = reversed;
5091       swapped = true;
5092     }
5093
5094   if (mode == VOIDmode)
5095     mode = GET_MODE (op2);
5096
5097   icode = direct_optab_handler (movcc_optab, mode);
5098
5099   if (icode == CODE_FOR_nothing)
5100     return NULL_RTX;
5101
5102   if (!target)
5103     target = gen_reg_rtx (mode);
5104
5105   for (int pass = 0; ; pass++)
5106     {
5107       comp.code = unsignedp ? unsigned_condition (comp.code) : comp.code;
5108       comparison =
5109         simplify_gen_relational (comp.code, VOIDmode,
5110                                  comp.mode, comp.op0, comp.op1);
5111
5112       /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
5113          punt and let the caller figure out how best to deal with this
5114          situation.  */
5115       if (COMPARISON_P (comparison))
5116         {
5117           saved_pending_stack_adjust save;
5118           save_pending_stack_adjust (&save);
5119           last = get_last_insn ();
5120           do_pending_stack_adjust ();
5121           machine_mode cmpmode = comp.mode;
5122           rtx orig_op0 = XEXP (comparison, 0);
5123           rtx orig_op1 = XEXP (comparison, 1);
5124           rtx op2p = op2;
5125           rtx op3p = op3;
5126           /* If we are optimizing, force expensive constants into a register
5127              but preserve an eventual equality with op2/op3.  */
5128           if (CONSTANT_P (orig_op0) && optimize
5129               && (rtx_cost (orig_op0, mode, COMPARE, 0,
5130                             optimize_insn_for_speed_p ())
5131                   > COSTS_N_INSNS (1))
5132               && can_create_pseudo_p ())
5133             {
5134               if (rtx_equal_p (orig_op0, op2))
5135                 op2p = XEXP (comparison, 0) = force_reg (cmpmode, orig_op0);
5136               else if (rtx_equal_p (orig_op0, op3))
5137                 op3p = XEXP (comparison, 0) = force_reg (cmpmode, orig_op0);
5138             }
5139           if (CONSTANT_P (orig_op1) && optimize
5140               && (rtx_cost (orig_op1, mode, COMPARE, 0,
5141                             optimize_insn_for_speed_p ())
5142                   > COSTS_N_INSNS (1))
5143               && can_create_pseudo_p ())
5144             {
5145               if (rtx_equal_p (orig_op1, op2))
5146                 op2p = XEXP (comparison, 1) = force_reg (cmpmode, orig_op1);
5147               else if (rtx_equal_p (orig_op1, op3))
5148                 op3p = XEXP (comparison, 1) = force_reg (cmpmode, orig_op1);
5149             }
5150           prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
5151                             GET_CODE (comparison), NULL_RTX, unsignedp,
5152                             OPTAB_WIDEN, &comparison, &cmpmode);
5153           if (comparison)
5154             {
5155                rtx res = emit_conditional_move_1 (target, comparison,
5156                                                   op2p, op3p, mode);
5157                if (res != NULL_RTX)
5158                  return res;
5159             }
5160           delete_insns_since (last);
5161           restore_pending_stack_adjust (&save);
5162         }
5163
5164       if (pass == 1)
5165         return NULL_RTX;
5166
5167       /* If the preferred op2/op3 order is not usable, retry with other
5168          operand order, perhaps it will expand successfully.  */
5169       if (swapped)
5170         comp.code = orig_code;
5171       else if ((reversed =
5172                 reversed_comparison_code_parts (orig_code, comp.op0, comp.op1,
5173                                                            NULL))
5174                != UNKNOWN)
5175         comp.code = reversed;
5176       else
5177         return NULL_RTX;
5178       std::swap (op2, op3);
5179     }
5180 }
5181
5182 /* Helper function that, in addition to COMPARISON, also tries
5183    the reversed REV_COMPARISON with swapped OP2 and OP3.  As opposed
5184    to when we pass the specific constituents of a comparison, no
5185    additional insns are emitted for it.  It might still be necessary
5186    to emit more than one insn for the final conditional move, though.  */
5187
5188 rtx
5189 emit_conditional_move (rtx target, rtx comparison, rtx rev_comparison,
5190                        rtx op2, rtx op3, machine_mode mode)
5191 {
5192   rtx res = emit_conditional_move_1 (target, comparison, op2, op3, mode);
5193
5194   if (res != NULL_RTX)
5195     return res;
5196
5197   return emit_conditional_move_1 (target, rev_comparison, op3, op2, mode);
5198 }
5199
5200 /* Helper for emitting a conditional move.  */
5201
5202 static rtx
5203 emit_conditional_move_1 (rtx target, rtx comparison,
5204                          rtx op2, rtx op3, machine_mode mode)
5205 {
5206   enum insn_code icode;
5207
5208   if (comparison == NULL_RTX || !COMPARISON_P (comparison))
5209     return NULL_RTX;
5210
5211   /* If the two source operands are identical, that's just a move.
5212      As the comparison comes in non-canonicalized, we must make
5213      sure not to discard any possible side effects.  If there are
5214      side effects, just let the target handle it.  */
5215   if (!side_effects_p (comparison) && rtx_equal_p (op2, op3))
5216     {
5217       if (!target)
5218         target = gen_reg_rtx (mode);
5219
5220       emit_move_insn (target, op3);
5221       return target;
5222     }
5223
5224   if (mode == VOIDmode)
5225     mode = GET_MODE (op2);
5226
5227   icode = direct_optab_handler (movcc_optab, mode);
5228
5229   if (icode == CODE_FOR_nothing)
5230     return NULL_RTX;
5231
5232   if (!target)
5233     target = gen_reg_rtx (mode);
5234
5235   class expand_operand ops[4];
5236
5237   create_output_operand (&ops[0], target, mode);
5238   create_fixed_operand (&ops[1], comparison);
5239   create_input_operand (&ops[2], op2, mode);
5240   create_input_operand (&ops[3], op3, mode);
5241
5242   if (maybe_expand_insn (icode, 4, ops))
5243     {
5244       if (ops[0].value != target)
5245         convert_move (target, ops[0].value, false);
5246       return target;
5247     }
5248
5249   return NULL_RTX;
5250 }
5251
5252
5253 /* Emit a conditional negate or bitwise complement using the
5254    negcc or notcc optabs if available.  Return NULL_RTX if such operations
5255    are not available.  Otherwise return the RTX holding the result.
5256    TARGET is the desired destination of the result.  COMP is the comparison
5257    on which to negate.  If COND is true move into TARGET the negation
5258    or bitwise complement of OP1.  Otherwise move OP2 into TARGET.
5259    CODE is either NEG or NOT.  MODE is the machine mode in which the
5260    operation is performed.  */
5261
5262 rtx
5263 emit_conditional_neg_or_complement (rtx target, rtx_code code,
5264                                      machine_mode mode, rtx cond, rtx op1,
5265                                      rtx op2)
5266 {
5267   optab op = unknown_optab;
5268   if (code == NEG)
5269     op = negcc_optab;
5270   else if (code == NOT)
5271     op = notcc_optab;
5272   else
5273     gcc_unreachable ();
5274
5275   insn_code icode = direct_optab_handler (op, mode);
5276
5277   if (icode == CODE_FOR_nothing)
5278     return NULL_RTX;
5279
5280   if (!target)
5281     target = gen_reg_rtx (mode);
5282
5283   rtx_insn *last = get_last_insn ();
5284   class expand_operand ops[4];
5285
5286   create_output_operand (&ops[0], target, mode);
5287   create_fixed_operand (&ops[1], cond);
5288   create_input_operand (&ops[2], op1, mode);
5289   create_input_operand (&ops[3], op2, mode);
5290
5291   if (maybe_expand_insn (icode, 4, ops))
5292     {
5293       if (ops[0].value != target)
5294         convert_move (target, ops[0].value, false);
5295
5296       return target;
5297     }
5298   delete_insns_since (last);
5299   return NULL_RTX;
5300 }
5301
5302 /* Emit a conditional addition instruction if the machine supports one for that
5303    condition and machine mode.
5304
5305    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
5306    the mode to use should they be constants.  If it is VOIDmode, they cannot
5307    both be constants.
5308
5309    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
5310    should be stored there.  MODE is the mode to use should they be constants.
5311    If it is VOIDmode, they cannot both be constants.
5312
5313    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
5314    is not supported.  */
5315
5316 rtx
5317 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
5318                       machine_mode cmode, rtx op2, rtx op3,
5319                       machine_mode mode, int unsignedp)
5320 {
5321   rtx comparison;
5322   rtx_insn *last;
5323   enum insn_code icode;
5324
5325   /* If one operand is constant, make it the second one.  Only do this
5326      if the other operand is not constant as well.  */
5327
5328   if (swap_commutative_operands_p (op0, op1))
5329     {
5330       std::swap (op0, op1);
5331       code = swap_condition (code);
5332     }
5333
5334   /* get_condition will prefer to generate LT and GT even if the old
5335      comparison was against zero, so undo that canonicalization here since
5336      comparisons against zero are cheaper.  */
5337   if (code == LT && op1 == const1_rtx)
5338     code = LE, op1 = const0_rtx;
5339   else if (code == GT && op1 == constm1_rtx)
5340     code = GE, op1 = const0_rtx;
5341
5342   if (cmode == VOIDmode)
5343     cmode = GET_MODE (op0);
5344
5345   if (mode == VOIDmode)
5346     mode = GET_MODE (op2);
5347
5348   icode = optab_handler (addcc_optab, mode);
5349
5350   if (icode == CODE_FOR_nothing)
5351     return 0;
5352
5353   if (!target)
5354     target = gen_reg_rtx (mode);
5355
5356   code = unsignedp ? unsigned_condition (code) : code;
5357   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
5358
5359   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
5360      return NULL and let the caller figure out how best to deal with this
5361      situation.  */
5362   if (!COMPARISON_P (comparison))
5363     return NULL_RTX;
5364
5365   do_pending_stack_adjust ();
5366   last = get_last_insn ();
5367   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
5368                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
5369                     &comparison, &cmode);
5370   if (comparison)
5371     {
5372       class expand_operand ops[4];
5373
5374       create_output_operand (&ops[0], target, mode);
5375       create_fixed_operand (&ops[1], comparison);
5376       create_input_operand (&ops[2], op2, mode);
5377       create_input_operand (&ops[3], op3, mode);
5378       if (maybe_expand_insn (icode, 4, ops))
5379         {
5380           if (ops[0].value != target)
5381             convert_move (target, ops[0].value, false);
5382           return target;
5383         }
5384     }
5385   delete_insns_since (last);
5386   return NULL_RTX;
5387 }
5388 \f
5389 /* These functions attempt to generate an insn body, rather than
5390    emitting the insn, but if the gen function already emits them, we
5391    make no attempt to turn them back into naked patterns.  */
5392
5393 /* Generate and return an insn body to add Y to X.  */
5394
5395 rtx_insn *
5396 gen_add2_insn (rtx x, rtx y)
5397 {
5398   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
5399
5400   gcc_assert (insn_operand_matches (icode, 0, x));
5401   gcc_assert (insn_operand_matches (icode, 1, x));
5402   gcc_assert (insn_operand_matches (icode, 2, y));
5403
5404   return GEN_FCN (icode) (x, x, y);
5405 }
5406
5407 /* Generate and return an insn body to add r1 and c,
5408    storing the result in r0.  */
5409
5410 rtx_insn *
5411 gen_add3_insn (rtx r0, rtx r1, rtx c)
5412 {
5413   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
5414
5415   if (icode == CODE_FOR_nothing
5416       || !insn_operand_matches (icode, 0, r0)
5417       || !insn_operand_matches (icode, 1, r1)
5418       || !insn_operand_matches (icode, 2, c))
5419     return NULL;
5420
5421   return GEN_FCN (icode) (r0, r1, c);
5422 }
5423
5424 bool
5425 have_add2_insn (rtx x, rtx y)
5426 {
5427   enum insn_code icode;
5428
5429   gcc_assert (GET_MODE (x) != VOIDmode);
5430
5431   icode = optab_handler (add_optab, GET_MODE (x));
5432
5433   if (icode == CODE_FOR_nothing)
5434     return false;
5435
5436   if (!insn_operand_matches (icode, 0, x)
5437       || !insn_operand_matches (icode, 1, x)
5438       || !insn_operand_matches (icode, 2, y))
5439     return false;
5440
5441   return true;
5442 }
5443
5444 /* Generate and return an insn body to add Y to X.  */
5445
5446 rtx_insn *
5447 gen_addptr3_insn (rtx x, rtx y, rtx z)
5448 {
5449   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
5450
5451   gcc_assert (insn_operand_matches (icode, 0, x));
5452   gcc_assert (insn_operand_matches (icode, 1, y));
5453   gcc_assert (insn_operand_matches (icode, 2, z));
5454
5455   return GEN_FCN (icode) (x, y, z);
5456 }
5457
5458 /* Return true if the target implements an addptr pattern and X, Y,
5459    and Z are valid for the pattern predicates.  */
5460
5461 bool
5462 have_addptr3_insn (rtx x, rtx y, rtx z)
5463 {
5464   enum insn_code icode;
5465
5466   gcc_assert (GET_MODE (x) != VOIDmode);
5467
5468   icode = optab_handler (addptr3_optab, GET_MODE (x));
5469
5470   if (icode == CODE_FOR_nothing)
5471     return false;
5472
5473   if (!insn_operand_matches (icode, 0, x)
5474       || !insn_operand_matches (icode, 1, y)
5475       || !insn_operand_matches (icode, 2, z))
5476     return false;
5477
5478   return true;
5479 }
5480
5481 /* Generate and return an insn body to subtract Y from X.  */
5482
5483 rtx_insn *
5484 gen_sub2_insn (rtx x, rtx y)
5485 {
5486   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
5487
5488   gcc_assert (insn_operand_matches (icode, 0, x));
5489   gcc_assert (insn_operand_matches (icode, 1, x));
5490   gcc_assert (insn_operand_matches (icode, 2, y));
5491
5492   return GEN_FCN (icode) (x, x, y);
5493 }
5494
5495 /* Generate and return an insn body to subtract r1 and c,
5496    storing the result in r0.  */
5497
5498 rtx_insn *
5499 gen_sub3_insn (rtx r0, rtx r1, rtx c)
5500 {
5501   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
5502
5503   if (icode == CODE_FOR_nothing
5504       || !insn_operand_matches (icode, 0, r0)
5505       || !insn_operand_matches (icode, 1, r1)
5506       || !insn_operand_matches (icode, 2, c))
5507     return NULL;
5508
5509   return GEN_FCN (icode) (r0, r1, c);
5510 }
5511
5512 bool
5513 have_sub2_insn (rtx x, rtx y)
5514 {
5515   enum insn_code icode;
5516
5517   gcc_assert (GET_MODE (x) != VOIDmode);
5518
5519   icode = optab_handler (sub_optab, GET_MODE (x));
5520
5521   if (icode == CODE_FOR_nothing)
5522     return false;
5523
5524   if (!insn_operand_matches (icode, 0, x)
5525       || !insn_operand_matches (icode, 1, x)
5526       || !insn_operand_matches (icode, 2, y))
5527     return false;
5528
5529   return true;
5530 }
5531 \f
5532 /* Generate the body of an insn to extend Y (with mode MFROM)
5533    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
5534
5535 rtx_insn *
5536 gen_extend_insn (rtx x, rtx y, machine_mode mto,
5537                  machine_mode mfrom, int unsignedp)
5538 {
5539   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
5540   return GEN_FCN (icode) (x, y);
5541 }
5542 \f
5543 /* Generate code to convert FROM to floating point
5544    and store in TO.  FROM must be fixed point and not VOIDmode.
5545    UNSIGNEDP nonzero means regard FROM as unsigned.
5546    Normally this is done by correcting the final value
5547    if it is negative.  */
5548
5549 void
5550 expand_float (rtx to, rtx from, int unsignedp)
5551 {
5552   enum insn_code icode;
5553   rtx target = to;
5554   scalar_mode from_mode, to_mode;
5555   machine_mode fmode, imode;
5556   bool can_do_signed = false;
5557
5558   /* Crash now, because we won't be able to decide which mode to use.  */
5559   gcc_assert (GET_MODE (from) != VOIDmode);
5560
5561   /* Look for an insn to do the conversion.  Do it in the specified
5562      modes if possible; otherwise convert either input, output or both to
5563      wider mode.  If the integer mode is wider than the mode of FROM,
5564      we can do the conversion signed even if the input is unsigned.  */
5565
5566   FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
5567     FOR_EACH_MODE_FROM (imode, GET_MODE (from))
5568       {
5569         int doing_unsigned = unsignedp;
5570
5571         if (fmode != GET_MODE (to)
5572             && (significand_size (fmode)
5573                 < GET_MODE_UNIT_PRECISION (GET_MODE (from))))
5574           continue;
5575
5576         icode = can_float_p (fmode, imode, unsignedp);
5577         if (icode == CODE_FOR_nothing && unsignedp)
5578           {
5579             enum insn_code scode = can_float_p (fmode, imode, 0);
5580             if (scode != CODE_FOR_nothing)
5581               can_do_signed = true;
5582             if (imode != GET_MODE (from))
5583               icode = scode, doing_unsigned = 0;
5584           }
5585
5586         if (icode != CODE_FOR_nothing)
5587           {
5588             if (imode != GET_MODE (from))
5589               from = convert_to_mode (imode, from, unsignedp);
5590
5591             if (fmode != GET_MODE (to))
5592               target = gen_reg_rtx (fmode);
5593
5594             emit_unop_insn (icode, target, from,
5595                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
5596
5597             if (target != to)
5598               convert_move (to, target, 0);
5599             return;
5600           }
5601       }
5602
5603   /* Unsigned integer, and no way to convert directly.  Convert as signed,
5604      then unconditionally adjust the result.  */
5605   if (unsignedp
5606       && can_do_signed
5607       && is_a <scalar_mode> (GET_MODE (to), &to_mode)
5608       && is_a <scalar_mode> (GET_MODE (from), &from_mode))
5609     {
5610       opt_scalar_mode fmode_iter;
5611       rtx_code_label *label = gen_label_rtx ();
5612       rtx temp;
5613       REAL_VALUE_TYPE offset;
5614
5615       /* Look for a usable floating mode FMODE wider than the source and at
5616          least as wide as the target.  Using FMODE will avoid rounding woes
5617          with unsigned values greater than the signed maximum value.  */
5618
5619       FOR_EACH_MODE_FROM (fmode_iter, to_mode)
5620         {
5621           scalar_mode fmode = fmode_iter.require ();
5622           if (GET_MODE_PRECISION (from_mode) < GET_MODE_BITSIZE (fmode)
5623               && can_float_p (fmode, from_mode, 0) != CODE_FOR_nothing)
5624             break;
5625         }
5626
5627       if (!fmode_iter.exists (&fmode))
5628         {
5629           /* There is no such mode.  Pretend the target is wide enough.  */
5630           fmode = to_mode;
5631
5632           /* Avoid double-rounding when TO is narrower than FROM.  */
5633           if ((significand_size (fmode) + 1)
5634               < GET_MODE_PRECISION (from_mode))
5635             {
5636               rtx temp1;
5637               rtx_code_label *neglabel = gen_label_rtx ();
5638
5639               /* Don't use TARGET if it isn't a register, is a hard register,
5640                  or is the wrong mode.  */
5641               if (!REG_P (target)
5642                   || REGNO (target) < FIRST_PSEUDO_REGISTER
5643                   || GET_MODE (target) != fmode)
5644                 target = gen_reg_rtx (fmode);
5645
5646               imode = from_mode;
5647               do_pending_stack_adjust ();
5648
5649               /* Test whether the sign bit is set.  */
5650               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
5651                                        0, neglabel);
5652
5653               /* The sign bit is not set.  Convert as signed.  */
5654               expand_float (target, from, 0);
5655               emit_jump_insn (targetm.gen_jump (label));
5656               emit_barrier ();
5657
5658               /* The sign bit is set.
5659                  Convert to a usable (positive signed) value by shifting right
5660                  one bit, while remembering if a nonzero bit was shifted
5661                  out; i.e., compute  (from & 1) | (from >> 1).  */
5662
5663               emit_label (neglabel);
5664               temp = expand_binop (imode, and_optab, from, const1_rtx,
5665                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
5666               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
5667               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
5668                                    OPTAB_LIB_WIDEN);
5669               expand_float (target, temp, 0);
5670
5671               /* Multiply by 2 to undo the shift above.  */
5672               temp = expand_binop (fmode, add_optab, target, target,
5673                                    target, 0, OPTAB_LIB_WIDEN);
5674               if (temp != target)
5675                 emit_move_insn (target, temp);
5676
5677               do_pending_stack_adjust ();
5678               emit_label (label);
5679               goto done;
5680             }
5681         }
5682
5683       /* If we are about to do some arithmetic to correct for an
5684          unsigned operand, do it in a pseudo-register.  */
5685
5686       if (to_mode != fmode
5687           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
5688         target = gen_reg_rtx (fmode);
5689
5690       /* Convert as signed integer to floating.  */
5691       expand_float (target, from, 0);
5692
5693       /* If FROM is negative (and therefore TO is negative),
5694          correct its value by 2**bitwidth.  */
5695
5696       do_pending_stack_adjust ();
5697       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, from_mode,
5698                                0, label);
5699
5700
5701       real_2expN (&offset, GET_MODE_PRECISION (from_mode), fmode);
5702       temp = expand_binop (fmode, add_optab, target,
5703                            const_double_from_real_value (offset, fmode),
5704                            target, 0, OPTAB_LIB_WIDEN);
5705       if (temp != target)
5706         emit_move_insn (target, temp);
5707
5708       do_pending_stack_adjust ();
5709       emit_label (label);
5710       goto done;
5711     }
5712
5713   /* No hardware instruction available; call a library routine.  */
5714     {
5715       rtx libfunc;
5716       rtx_insn *insns;
5717       rtx value;
5718       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
5719
5720       if (is_narrower_int_mode (GET_MODE (from), SImode))
5721         from = convert_to_mode (SImode, from, unsignedp);
5722
5723       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5724       gcc_assert (libfunc);
5725
5726       start_sequence ();
5727
5728       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5729                                        GET_MODE (to), from, GET_MODE (from));
5730       insns = get_insns ();
5731       end_sequence ();
5732
5733       emit_libcall_block (insns, target, value,
5734                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
5735                                          GET_MODE (to), from));
5736     }
5737
5738  done:
5739
5740   /* Copy result to requested destination
5741      if we have been computing in a temp location.  */
5742
5743   if (target != to)
5744     {
5745       if (GET_MODE (target) == GET_MODE (to))
5746         emit_move_insn (to, target);
5747       else
5748         convert_move (to, target, 0);
5749     }
5750 }
5751 \f
5752 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5753    must be floating point.  */
5754
5755 void
5756 expand_fix (rtx to, rtx from, int unsignedp)
5757 {
5758   enum insn_code icode;
5759   rtx target = to;
5760   machine_mode fmode, imode;
5761   opt_scalar_mode fmode_iter;
5762   bool must_trunc = false;
5763
5764   /* We first try to find a pair of modes, one real and one integer, at
5765      least as wide as FROM and TO, respectively, in which we can open-code
5766      this conversion.  If the integer mode is wider than the mode of TO,
5767      we can do the conversion either signed or unsigned.  */
5768
5769   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5770     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5771       {
5772         int doing_unsigned = unsignedp;
5773
5774         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5775         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5776           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5777
5778         if (icode != CODE_FOR_nothing)
5779           {
5780             rtx_insn *last = get_last_insn ();
5781             rtx from1 = from;
5782             if (fmode != GET_MODE (from))
5783               {
5784                 if (REAL_MODE_FORMAT (GET_MODE (from))
5785                     == &arm_bfloat_half_format
5786                     && REAL_MODE_FORMAT (fmode) == &ieee_single_format)
5787                   /* The BF -> SF conversions can be just a shift, doesn't
5788                      need to handle sNANs.  */
5789                   {
5790                     int save_flag_finite_math_only = flag_finite_math_only;
5791                     flag_finite_math_only = true;
5792                     from1 = convert_to_mode (fmode, from, 0);
5793                     flag_finite_math_only = save_flag_finite_math_only;
5794                   }
5795                 else
5796                   from1 = convert_to_mode (fmode, from, 0);
5797               }
5798
5799             if (must_trunc)
5800               {
5801                 rtx temp = gen_reg_rtx (GET_MODE (from1));
5802                 from1 = expand_unop (GET_MODE (from1), ftrunc_optab, from1,
5803                                      temp, 0);
5804               }
5805
5806             if (imode != GET_MODE (to))
5807               target = gen_reg_rtx (imode);
5808
5809             if (maybe_emit_unop_insn (icode, target, from1,
5810                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5811               {
5812                 if (target != to)
5813                   convert_move (to, target, unsignedp);
5814                 return;
5815               }
5816             delete_insns_since (last);
5817           }
5818       }
5819
5820   /* For an unsigned conversion, there is one more way to do it.
5821      If we have a signed conversion, we generate code that compares
5822      the real value to the largest representable positive number.  If if
5823      is smaller, the conversion is done normally.  Otherwise, subtract
5824      one plus the highest signed number, convert, and add it back.
5825
5826      We only need to check all real modes, since we know we didn't find
5827      anything with a wider integer mode.
5828
5829      This code used to extend FP value into mode wider than the destination.
5830      This is needed for decimal float modes which cannot accurately
5831      represent one plus the highest signed number of the same size, but
5832      not for binary modes.  Consider, for instance conversion from SFmode
5833      into DImode.
5834
5835      The hot path through the code is dealing with inputs smaller than 2^63
5836      and doing just the conversion, so there is no bits to lose.
5837
5838      In the other path we know the value is positive in the range 2^63..2^64-1
5839      inclusive.  (as for other input overflow happens and result is undefined)
5840      So we know that the most important bit set in mantissa corresponds to
5841      2^63.  The subtraction of 2^63 should not generate any rounding as it
5842      simply clears out that bit.  The rest is trivial.  */
5843
5844   scalar_int_mode to_mode;
5845   if (unsignedp
5846       && is_a <scalar_int_mode> (GET_MODE (to), &to_mode)
5847       && HWI_COMPUTABLE_MODE_P (to_mode))
5848     FOR_EACH_MODE_FROM (fmode_iter, as_a <scalar_mode> (GET_MODE (from)))
5849       {
5850         scalar_mode fmode = fmode_iter.require ();
5851         if (CODE_FOR_nothing != can_fix_p (to_mode, fmode,
5852                                            0, &must_trunc)
5853             && (!DECIMAL_FLOAT_MODE_P (fmode)
5854                 || (GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (to_mode))))
5855           {
5856             int bitsize;
5857             REAL_VALUE_TYPE offset;
5858             rtx limit;
5859             rtx_code_label *lab1, *lab2;
5860             rtx_insn *insn;
5861
5862             bitsize = GET_MODE_PRECISION (to_mode);
5863             real_2expN (&offset, bitsize - 1, fmode);
5864             limit = const_double_from_real_value (offset, fmode);
5865             lab1 = gen_label_rtx ();
5866             lab2 = gen_label_rtx ();
5867
5868             if (fmode != GET_MODE (from))
5869               {
5870                 if (REAL_MODE_FORMAT (GET_MODE (from))
5871                     == &arm_bfloat_half_format
5872                     && REAL_MODE_FORMAT (fmode) == &ieee_single_format)
5873                   /* The BF -> SF conversions can be just a shift, doesn't
5874                      need to handle sNANs.  */
5875                   {
5876                     int save_flag_finite_math_only = flag_finite_math_only;
5877                     flag_finite_math_only = true;
5878                     from = convert_to_mode (fmode, from, 0);
5879                     flag_finite_math_only = save_flag_finite_math_only;
5880                   }
5881                 else
5882                   from = convert_to_mode (fmode, from, 0);
5883               }
5884
5885             /* See if we need to do the subtraction.  */
5886             do_pending_stack_adjust ();
5887             emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX,
5888                                      GET_MODE (from), 0, lab1);
5889
5890             /* If not, do the signed "fix" and branch around fixup code.  */
5891             expand_fix (to, from, 0);
5892             emit_jump_insn (targetm.gen_jump (lab2));
5893             emit_barrier ();
5894
5895             /* Otherwise, subtract 2**(N-1), convert to signed number,
5896                then add 2**(N-1).  Do the addition using XOR since this
5897                will often generate better code.  */
5898             emit_label (lab1);
5899             target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5900                                    NULL_RTX, 0, OPTAB_LIB_WIDEN);
5901             expand_fix (to, target, 0);
5902             target = expand_binop (to_mode, xor_optab, to,
5903                                    gen_int_mode
5904                                    (HOST_WIDE_INT_1 << (bitsize - 1),
5905                                     to_mode),
5906                                    to, 1, OPTAB_LIB_WIDEN);
5907
5908             if (target != to)
5909               emit_move_insn (to, target);
5910
5911             emit_label (lab2);
5912
5913             if (optab_handler (mov_optab, to_mode) != CODE_FOR_nothing)
5914               {
5915                 /* Make a place for a REG_NOTE and add it.  */
5916                 insn = emit_move_insn (to, to);
5917                 set_dst_reg_note (insn, REG_EQUAL,
5918                                   gen_rtx_fmt_e (UNSIGNED_FIX, to_mode,
5919                                                  copy_rtx (from)),
5920                                   to);
5921               }
5922
5923             return;
5924           }
5925       }
5926
5927 #ifdef HAVE_SFmode
5928   if (REAL_MODE_FORMAT (GET_MODE (from)) == &arm_bfloat_half_format
5929       && REAL_MODE_FORMAT (SFmode) == &ieee_single_format)
5930     /* We don't have BF -> TI library functions, use BF -> SF -> TI
5931        instead but the BF -> SF conversion can be just a shift, doesn't
5932        need to handle sNANs.  */
5933     {
5934       int save_flag_finite_math_only = flag_finite_math_only;
5935       flag_finite_math_only = true;
5936       from = convert_to_mode (SFmode, from, 0);
5937       flag_finite_math_only = save_flag_finite_math_only;
5938       expand_fix (to, from, unsignedp);
5939       return;
5940     }
5941 #endif
5942
5943   /* We can't do it with an insn, so use a library call.  But first ensure
5944      that the mode of TO is at least as wide as SImode, since those are the
5945      only library calls we know about.  */
5946
5947   if (is_narrower_int_mode (GET_MODE (to), SImode))
5948     {
5949       target = gen_reg_rtx (SImode);
5950
5951       expand_fix (target, from, unsignedp);
5952     }
5953   else
5954     {
5955       rtx_insn *insns;
5956       rtx value;
5957       rtx libfunc;
5958
5959       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5960       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5961       gcc_assert (libfunc);
5962
5963       start_sequence ();
5964
5965       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5966                                        GET_MODE (to), from, GET_MODE (from));
5967       insns = get_insns ();
5968       end_sequence ();
5969
5970       emit_libcall_block (insns, target, value,
5971                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5972                                          GET_MODE (to), from));
5973     }
5974
5975   if (target != to)
5976     {
5977       if (GET_MODE (to) == GET_MODE (target))
5978         emit_move_insn (to, target);
5979       else
5980         convert_move (to, target, 0);
5981     }
5982 }
5983
5984
5985 /* Promote integer arguments for a libcall if necessary.
5986    emit_library_call_value cannot do the promotion because it does not
5987    know if it should do a signed or unsigned promotion.  This is because
5988    there are no tree types defined for libcalls.  */
5989
5990 static rtx
5991 prepare_libcall_arg (rtx arg, int uintp)
5992 {
5993   scalar_int_mode mode;
5994   machine_mode arg_mode;
5995   if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5996     {
5997       /*  If we need to promote the integer function argument we need to do
5998           it here instead of inside emit_library_call_value because in
5999           emit_library_call_value we don't know if we should do a signed or
6000           unsigned promotion.  */
6001
6002       int unsigned_p = 0;
6003       arg_mode = promote_function_mode (NULL_TREE, mode,
6004                                         &unsigned_p, NULL_TREE, 0);
6005       if (arg_mode != mode)
6006         return convert_to_mode (arg_mode, arg, uintp);
6007     }
6008     return arg;
6009 }
6010
6011 /* Generate code to convert FROM or TO a fixed-point.
6012    If UINTP is true, either TO or FROM is an unsigned integer.
6013    If SATP is true, we need to saturate the result.  */
6014
6015 void
6016 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
6017 {
6018   machine_mode to_mode = GET_MODE (to);
6019   machine_mode from_mode = GET_MODE (from);
6020   convert_optab tab;
6021   enum rtx_code this_code;
6022   enum insn_code code;
6023   rtx_insn *insns;
6024   rtx value;
6025   rtx libfunc;
6026
6027   if (to_mode == from_mode)
6028     {
6029       emit_move_insn (to, from);
6030       return;
6031     }
6032
6033   if (uintp)
6034     {
6035       tab = satp ? satfractuns_optab : fractuns_optab;
6036       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
6037     }
6038   else
6039     {
6040       tab = satp ? satfract_optab : fract_optab;
6041       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
6042     }
6043   code = convert_optab_handler (tab, to_mode, from_mode);
6044   if (code != CODE_FOR_nothing)
6045     {
6046       emit_unop_insn (code, to, from, this_code);
6047       return;
6048     }
6049
6050   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
6051   gcc_assert (libfunc);
6052
6053   from = prepare_libcall_arg (from, uintp);
6054   from_mode = GET_MODE (from);
6055
6056   start_sequence ();
6057   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
6058                                    from, from_mode);
6059   insns = get_insns ();
6060   end_sequence ();
6061
6062   emit_libcall_block (insns, to, value,
6063                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
6064 }
6065
6066 /* Generate code to convert FROM to fixed point and store in TO.  FROM
6067    must be floating point, TO must be signed.  Use the conversion optab
6068    TAB to do the conversion.  */
6069
6070 bool
6071 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
6072 {
6073   enum insn_code icode;
6074   rtx target = to;
6075   machine_mode fmode, imode;
6076
6077   /* We first try to find a pair of modes, one real and one integer, at
6078      least as wide as FROM and TO, respectively, in which we can open-code
6079      this conversion.  If the integer mode is wider than the mode of TO,
6080      we can do the conversion either signed or unsigned.  */
6081
6082   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
6083     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
6084       {
6085         icode = convert_optab_handler (tab, imode, fmode,
6086                                        insn_optimization_type ());
6087         if (icode != CODE_FOR_nothing)
6088           {
6089             rtx_insn *last = get_last_insn ();
6090             if (fmode != GET_MODE (from))
6091               from = convert_to_mode (fmode, from, 0);
6092
6093             if (imode != GET_MODE (to))
6094               target = gen_reg_rtx (imode);
6095
6096             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
6097               {
6098                 delete_insns_since (last);
6099                 continue;
6100               }
6101             if (target != to)
6102               convert_move (to, target, 0);
6103             return true;
6104           }
6105       }
6106
6107   return false;
6108 }
6109 \f
6110 /* Report whether we have an instruction to perform the operation
6111    specified by CODE on operands of mode MODE.  */
6112 bool
6113 have_insn_for (enum rtx_code code, machine_mode mode)
6114 {
6115   return (code_to_optab (code)
6116           && (optab_handler (code_to_optab (code), mode)
6117               != CODE_FOR_nothing));
6118 }
6119
6120 /* Print information about the current contents of the optabs on
6121    STDERR.  */
6122
6123 DEBUG_FUNCTION void
6124 debug_optab_libfuncs (void)
6125 {
6126   int i, j, k;
6127
6128   /* Dump the arithmetic optabs.  */
6129   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6130     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6131       {
6132         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
6133         if (l)
6134           {
6135             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6136             fprintf (stderr, "%s\t%s:\t%s\n",
6137                      GET_RTX_NAME (optab_to_code ((optab) i)),
6138                      GET_MODE_NAME (j),
6139                      XSTR (l, 0));
6140           }
6141       }
6142
6143   /* Dump the conversion optabs.  */
6144   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6145     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6146       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6147         {
6148           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
6149                                          (machine_mode) k);
6150           if (l)
6151             {
6152               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6153               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6154                        GET_RTX_NAME (optab_to_code ((optab) i)),
6155                        GET_MODE_NAME (j),
6156                        GET_MODE_NAME (k),
6157                        XSTR (l, 0));
6158             }
6159         }
6160 }
6161
6162 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6163    CODE.  Return 0 on failure.  */
6164
6165 rtx_insn *
6166 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6167 {
6168   machine_mode mode = GET_MODE (op1);
6169   enum insn_code icode;
6170   rtx_insn *insn;
6171   rtx trap_rtx;
6172
6173   if (mode == VOIDmode)
6174     return 0;
6175
6176   icode = optab_handler (ctrap_optab, mode);
6177   if (icode == CODE_FOR_nothing)
6178     return 0;
6179
6180   /* Some targets only accept a zero trap code.  */
6181   if (!insn_operand_matches (icode, 3, tcode))
6182     return 0;
6183
6184   do_pending_stack_adjust ();
6185   start_sequence ();
6186   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6187                     &trap_rtx, &mode);
6188   if (!trap_rtx)
6189     insn = NULL;
6190   else
6191     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6192                             tcode);
6193
6194   /* If that failed, then give up.  */
6195   if (insn == 0)
6196     {
6197       end_sequence ();
6198       return 0;
6199     }
6200
6201   emit_insn (insn);
6202   insn = get_insns ();
6203   end_sequence ();
6204   return insn;
6205 }
6206
6207 /* Return rtx code for TCODE or UNKNOWN.  Use UNSIGNEDP to select signed
6208    or unsigned operation code.  */
6209
6210 enum rtx_code
6211 get_rtx_code_1 (enum tree_code tcode, bool unsignedp)
6212 {
6213   enum rtx_code code;
6214   switch (tcode)
6215     {
6216     case EQ_EXPR:
6217       code = EQ;
6218       break;
6219     case NE_EXPR:
6220       code = NE;
6221       break;
6222     case LT_EXPR:
6223       code = unsignedp ? LTU : LT;
6224       break;
6225     case LE_EXPR:
6226       code = unsignedp ? LEU : LE;
6227       break;
6228     case GT_EXPR:
6229       code = unsignedp ? GTU : GT;
6230       break;
6231     case GE_EXPR:
6232       code = unsignedp ? GEU : GE;
6233       break;
6234
6235     case UNORDERED_EXPR:
6236       code = UNORDERED;
6237       break;
6238     case ORDERED_EXPR:
6239       code = ORDERED;
6240       break;
6241     case UNLT_EXPR:
6242       code = UNLT;
6243       break;
6244     case UNLE_EXPR:
6245       code = UNLE;
6246       break;
6247     case UNGT_EXPR:
6248       code = UNGT;
6249       break;
6250     case UNGE_EXPR:
6251       code = UNGE;
6252       break;
6253     case UNEQ_EXPR:
6254       code = UNEQ;
6255       break;
6256     case LTGT_EXPR:
6257       code = LTGT;
6258       break;
6259
6260     case BIT_AND_EXPR:
6261       code = AND;
6262       break;
6263
6264     case BIT_IOR_EXPR:
6265       code = IOR;
6266       break;
6267
6268     default:
6269       code = UNKNOWN;
6270       break;
6271     }
6272   return code;
6273 }
6274
6275 /* Return rtx code for TCODE.  Use UNSIGNEDP to select signed
6276    or unsigned operation code.  */
6277
6278 enum rtx_code
6279 get_rtx_code (enum tree_code tcode, bool unsignedp)
6280 {
6281   enum rtx_code code = get_rtx_code_1 (tcode, unsignedp);
6282   gcc_assert (code != UNKNOWN);
6283   return code;
6284 }
6285
6286 /* Return a comparison rtx of mode CMP_MODE for COND.  Use UNSIGNEDP to
6287    select signed or unsigned operators.  OPNO holds the index of the
6288    first comparison operand for insn ICODE.  Do not generate the
6289    compare instruction itself.  */
6290
6291 rtx
6292 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
6293                     tree t_op0, tree t_op1, bool unsignedp,
6294                     enum insn_code icode, unsigned int opno)
6295 {
6296   class expand_operand ops[2];
6297   rtx rtx_op0, rtx_op1;
6298   machine_mode m0, m1;
6299   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6300
6301   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6302
6303   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
6304      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
6305      cases, use the original mode.  */
6306   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6307                          EXPAND_STACK_PARM);
6308   m0 = GET_MODE (rtx_op0);
6309   if (m0 == VOIDmode)
6310     m0 = TYPE_MODE (TREE_TYPE (t_op0));
6311
6312   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6313                          EXPAND_STACK_PARM);
6314   m1 = GET_MODE (rtx_op1);
6315   if (m1 == VOIDmode)
6316     m1 = TYPE_MODE (TREE_TYPE (t_op1));
6317
6318   create_input_operand (&ops[0], rtx_op0, m0);
6319   create_input_operand (&ops[1], rtx_op1, m1);
6320   if (!maybe_legitimize_operands (icode, opno, 2, ops))
6321     gcc_unreachable ();
6322   return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
6323 }
6324
6325 /* Check if vec_perm mask SEL is a constant equivalent to a shift of
6326    the first vec_perm operand, assuming the second operand (for left shift
6327    first operand) is a constant vector of zeros.  Return the shift distance
6328    in bits if so, or NULL_RTX if the vec_perm is not a shift.  MODE is the
6329    mode of the value being shifted.  SHIFT_OPTAB is vec_shr_optab for right
6330    shift or vec_shl_optab for left shift.  */
6331 static rtx
6332 shift_amt_for_vec_perm_mask (machine_mode mode, const vec_perm_indices &sel,
6333                              optab shift_optab)
6334 {
6335   unsigned int bitsize = GET_MODE_UNIT_BITSIZE (mode);
6336   poly_int64 first = sel[0];
6337   if (maybe_ge (sel[0], GET_MODE_NUNITS (mode)))
6338     return NULL_RTX;
6339
6340   if (shift_optab == vec_shl_optab)
6341     {
6342       unsigned int nelt;
6343       if (!GET_MODE_NUNITS (mode).is_constant (&nelt))
6344         return NULL_RTX;
6345       unsigned firstidx = 0;
6346       for (unsigned int i = 0; i < nelt; i++)
6347         {
6348           if (known_eq (sel[i], nelt))
6349             {
6350               if (i == 0 || firstidx)
6351                 return NULL_RTX;
6352               firstidx = i;
6353             }
6354           else if (firstidx
6355                    ? maybe_ne (sel[i], nelt + i - firstidx)
6356                    : maybe_ge (sel[i], nelt))
6357             return NULL_RTX;
6358         }
6359
6360       if (firstidx == 0)
6361         return NULL_RTX;
6362       first = firstidx;
6363     }
6364   else if (!sel.series_p (0, 1, first, 1))
6365     {
6366       unsigned int nelt;
6367       if (!GET_MODE_NUNITS (mode).is_constant (&nelt))
6368         return NULL_RTX;
6369       for (unsigned int i = 1; i < nelt; i++)
6370         {
6371           poly_int64 expected = i + first;
6372           /* Indices into the second vector are all equivalent.  */
6373           if (maybe_lt (sel[i], nelt)
6374               ? maybe_ne (sel[i], expected)
6375               : maybe_lt (expected, nelt))
6376             return NULL_RTX;
6377         }
6378     }
6379
6380   return gen_int_shift_amount (mode, first * bitsize);
6381 }
6382
6383 /* A subroutine of expand_vec_perm_var for expanding one vec_perm insn.  */
6384
6385 static rtx
6386 expand_vec_perm_1 (enum insn_code icode, rtx target,
6387                    rtx v0, rtx v1, rtx sel)
6388 {
6389   machine_mode tmode = GET_MODE (target);
6390   machine_mode smode = GET_MODE (sel);
6391   class expand_operand ops[4];
6392
6393   gcc_assert (GET_MODE_CLASS (smode) == MODE_VECTOR_INT
6394               || related_int_vector_mode (tmode).require () == smode);
6395   create_output_operand (&ops[0], target, tmode);
6396   create_input_operand (&ops[3], sel, smode);
6397
6398   /* Make an effort to preserve v0 == v1.  The target expander is able to
6399      rely on this to determine if we're permuting a single input operand.  */
6400   if (rtx_equal_p (v0, v1))
6401     {
6402       if (!insn_operand_matches (icode, 1, v0))
6403         v0 = force_reg (tmode, v0);
6404       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6405       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6406
6407       create_fixed_operand (&ops[1], v0);
6408       create_fixed_operand (&ops[2], v0);
6409     }
6410   else
6411     {
6412       create_input_operand (&ops[1], v0, tmode);
6413       create_input_operand (&ops[2], v1, tmode);
6414     }
6415
6416   if (maybe_expand_insn (icode, 4, ops))
6417     return ops[0].value;
6418   return NULL_RTX;
6419 }
6420
6421 /* Implement a permutation of vectors v0 and v1 using the permutation
6422    vector in SEL and return the result.  Use TARGET to hold the result
6423    if nonnull and convenient.
6424
6425    MODE is the mode of the vectors being permuted (V0 and V1).  SEL_MODE
6426    is the TYPE_MODE associated with SEL, or BLKmode if SEL isn't known
6427    to have a particular mode.  */
6428
6429 rtx
6430 expand_vec_perm_const (machine_mode mode, rtx v0, rtx v1,
6431                        const vec_perm_builder &sel, machine_mode sel_mode,
6432                        rtx target)
6433 {
6434   if (!target || !register_operand (target, mode))
6435     target = gen_reg_rtx (mode);
6436
6437   /* Set QIMODE to a different vector mode with byte elements.
6438      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6439   machine_mode qimode;
6440   if (!qimode_for_vec_perm (mode).exists (&qimode))
6441     qimode = VOIDmode;
6442
6443   rtx_insn *last = get_last_insn ();
6444
6445   bool single_arg_p = rtx_equal_p (v0, v1);
6446   /* Always specify two input vectors here and leave the target to handle
6447      cases in which the inputs are equal.  Not all backends can cope with
6448      the single-input representation when testing for a double-input
6449      target instruction.  */
6450   vec_perm_indices indices (sel, 2, GET_MODE_NUNITS (mode));
6451
6452   /* See if this can be handled with a vec_shr or vec_shl.  We only do this
6453      if the second (for vec_shr) or first (for vec_shl) vector is all
6454      zeroes.  */
6455   insn_code shift_code = CODE_FOR_nothing;
6456   insn_code shift_code_qi = CODE_FOR_nothing;
6457   optab shift_optab = unknown_optab;
6458   rtx v2 = v0;
6459   if (v1 == CONST0_RTX (GET_MODE (v1)))
6460     shift_optab = vec_shr_optab;
6461   else if (v0 == CONST0_RTX (GET_MODE (v0)))
6462     {
6463       shift_optab = vec_shl_optab;
6464       v2 = v1;
6465     }
6466   if (shift_optab != unknown_optab)
6467     {
6468       shift_code = optab_handler (shift_optab, mode);
6469       shift_code_qi = ((qimode != VOIDmode && qimode != mode)
6470                        ? optab_handler (shift_optab, qimode)
6471                        : CODE_FOR_nothing);
6472     }
6473   if (shift_code != CODE_FOR_nothing || shift_code_qi != CODE_FOR_nothing)
6474     {
6475       rtx shift_amt = shift_amt_for_vec_perm_mask (mode, indices, shift_optab);
6476       if (shift_amt)
6477         {
6478           class expand_operand ops[3];
6479           if (shift_amt == const0_rtx)
6480             return v2;
6481           if (shift_code != CODE_FOR_nothing)
6482             {
6483               create_output_operand (&ops[0], target, mode);
6484               create_input_operand (&ops[1], v2, mode);
6485               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
6486               if (maybe_expand_insn (shift_code, 3, ops))
6487                 return ops[0].value;
6488             }
6489           if (shift_code_qi != CODE_FOR_nothing)
6490             {
6491               rtx tmp = gen_reg_rtx (qimode);
6492               create_output_operand (&ops[0], tmp, qimode);
6493               create_input_operand (&ops[1], gen_lowpart (qimode, v2), qimode);
6494               create_convert_operand_from_type (&ops[2], shift_amt, sizetype);
6495               if (maybe_expand_insn (shift_code_qi, 3, ops))
6496                 return gen_lowpart (mode, ops[0].value);
6497             }
6498         }
6499     }
6500
6501   if (targetm.vectorize.vec_perm_const != NULL)
6502     {
6503       if (single_arg_p)
6504         v1 = v0;
6505
6506       gcc_checking_assert (GET_MODE (v0) == GET_MODE (v1));
6507       machine_mode op_mode = GET_MODE (v0);
6508       if (targetm.vectorize.vec_perm_const (mode, op_mode, target, v0, v1,
6509                                             indices))
6510         return target;
6511     }
6512
6513   /* Fall back to a constant byte-based permutation.  */
6514   vec_perm_indices qimode_indices;
6515   rtx target_qi = NULL_RTX, v0_qi = NULL_RTX, v1_qi = NULL_RTX;
6516   if (qimode != VOIDmode)
6517     {
6518       qimode_indices.new_expanded_vector (indices, GET_MODE_UNIT_SIZE (mode));
6519       target_qi = gen_reg_rtx (qimode);
6520       v0_qi = gen_lowpart (qimode, v0);
6521       v1_qi = gen_lowpart (qimode, v1);
6522       if (targetm.vectorize.vec_perm_const != NULL
6523           && targetm.vectorize.vec_perm_const (qimode, qimode, target_qi, v0_qi,
6524                                                v1_qi, qimode_indices))
6525         return gen_lowpart (mode, target_qi);
6526     }
6527
6528   v0 = force_reg (mode, v0);
6529   if (single_arg_p)
6530     v1 = v0;
6531   v1 = force_reg (mode, v1);
6532
6533   /* Otherwise expand as a fully variable permuation.  */
6534
6535   /* The optabs are only defined for selectors with the same width
6536      as the values being permuted.  */
6537   machine_mode required_sel_mode;
6538   if (!related_int_vector_mode (mode).exists (&required_sel_mode))
6539     {
6540       delete_insns_since (last);
6541       return NULL_RTX;
6542     }
6543
6544   /* We know that it is semantically valid to treat SEL as having SEL_MODE.
6545      If that isn't the mode we want then we need to prove that using
6546      REQUIRED_SEL_MODE is OK.  */
6547   if (sel_mode != required_sel_mode)
6548     {
6549       if (!selector_fits_mode_p (required_sel_mode, indices))
6550         {
6551           delete_insns_since (last);
6552           return NULL_RTX;
6553         }
6554       sel_mode = required_sel_mode;
6555     }
6556
6557   insn_code icode = direct_optab_handler (vec_perm_optab, mode);
6558   if (icode != CODE_FOR_nothing)
6559     {
6560       rtx sel_rtx = vec_perm_indices_to_rtx (sel_mode, indices);
6561       rtx tmp = expand_vec_perm_1 (icode, target, v0, v1, sel_rtx);
6562       if (tmp)
6563         return tmp;
6564     }
6565
6566   if (qimode != VOIDmode
6567       && selector_fits_mode_p (qimode, qimode_indices))
6568     {
6569       icode = direct_optab_handler (vec_perm_optab, qimode);
6570       if (icode != CODE_FOR_nothing)
6571         {
6572           rtx sel_qi = vec_perm_indices_to_rtx (qimode, qimode_indices);
6573           rtx tmp = expand_vec_perm_1 (icode, target_qi, v0_qi, v1_qi, sel_qi);
6574           if (tmp)
6575             return gen_lowpart (mode, tmp);
6576         }
6577     }
6578
6579   delete_insns_since (last);
6580   return NULL_RTX;
6581 }
6582
6583 /* Implement a permutation of vectors v0 and v1 using the permutation
6584    vector in SEL and return the result.  Use TARGET to hold the result
6585    if nonnull and convenient.
6586
6587    MODE is the mode of the vectors being permuted (V0 and V1).
6588    SEL must have the integer equivalent of MODE and is known to be
6589    unsuitable for permutes with a constant permutation vector.  */
6590
6591 rtx
6592 expand_vec_perm_var (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6593 {
6594   enum insn_code icode;
6595   unsigned int i, u;
6596   rtx tmp, sel_qi;
6597
6598   u = GET_MODE_UNIT_SIZE (mode);
6599
6600   if (!target || GET_MODE (target) != mode)
6601     target = gen_reg_rtx (mode);
6602
6603   icode = direct_optab_handler (vec_perm_optab, mode);
6604   if (icode != CODE_FOR_nothing)
6605     {
6606       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6607       if (tmp)
6608         return tmp;
6609     }
6610
6611   /* As a special case to aid several targets, lower the element-based
6612      permutation to a byte-based permutation and try again.  */
6613   machine_mode qimode;
6614   if (!qimode_for_vec_perm (mode).exists (&qimode)
6615       || maybe_gt (GET_MODE_NUNITS (qimode), GET_MODE_MASK (QImode) + 1))
6616     return NULL_RTX;
6617   icode = direct_optab_handler (vec_perm_optab, qimode);
6618   if (icode == CODE_FOR_nothing)
6619     return NULL_RTX;
6620
6621   /* Multiply each element by its byte size.  */
6622   machine_mode selmode = GET_MODE (sel);
6623   if (u == 2)
6624     sel = expand_simple_binop (selmode, PLUS, sel, sel,
6625                                NULL, 0, OPTAB_DIRECT);
6626   else
6627     sel = expand_simple_binop (selmode, ASHIFT, sel,
6628                                gen_int_shift_amount (selmode, exact_log2 (u)),
6629                                NULL, 0, OPTAB_DIRECT);
6630   gcc_assert (sel != NULL);
6631
6632   /* Broadcast the low byte each element into each of its bytes.
6633      The encoding has U interleaved stepped patterns, one for each
6634      byte of an element.  */
6635   vec_perm_builder const_sel (GET_MODE_SIZE (mode), u, 3);
6636   unsigned int low_byte_in_u = BYTES_BIG_ENDIAN ? u - 1 : 0;
6637   for (i = 0; i < 3; ++i)
6638     for (unsigned int j = 0; j < u; ++j)
6639       const_sel.quick_push (i * u + low_byte_in_u);
6640   sel = gen_lowpart (qimode, sel);
6641   sel = expand_vec_perm_const (qimode, sel, sel, const_sel, qimode, NULL);
6642   gcc_assert (sel != NULL);
6643
6644   /* Add the byte offset to each byte element.  */
6645   /* Note that the definition of the indicies here is memory ordering,
6646      so there should be no difference between big and little endian.  */
6647   rtx_vector_builder byte_indices (qimode, u, 1);
6648   for (i = 0; i < u; ++i)
6649     byte_indices.quick_push (GEN_INT (i));
6650   tmp = byte_indices.build ();
6651   sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6652                                 sel, 0, OPTAB_DIRECT);
6653   gcc_assert (sel_qi != NULL);
6654
6655   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6656   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6657                            gen_lowpart (qimode, v1), sel_qi);
6658   if (tmp)
6659     tmp = gen_lowpart (mode, tmp);
6660   return tmp;
6661 }
6662
6663 /* Generate VEC_SERIES_EXPR <OP0, OP1>, returning a value of mode VMODE.
6664    Use TARGET for the result if nonnull and convenient.  */
6665
6666 rtx
6667 expand_vec_series_expr (machine_mode vmode, rtx op0, rtx op1, rtx target)
6668 {
6669   class expand_operand ops[3];
6670   enum insn_code icode;
6671   machine_mode emode = GET_MODE_INNER (vmode);
6672
6673   icode = direct_optab_handler (vec_series_optab, vmode);
6674   gcc_assert (icode != CODE_FOR_nothing);
6675
6676   create_output_operand (&ops[0], target, vmode);
6677   create_input_operand (&ops[1], op0, emode);
6678   create_input_operand (&ops[2], op1, emode);
6679
6680   expand_insn (icode, 3, ops);
6681   return ops[0].value;
6682 }
6683
6684 /* Generate insns for a vector comparison into a mask.  */
6685
6686 rtx
6687 expand_vec_cmp_expr (tree type, tree exp, rtx target)
6688 {
6689   class expand_operand ops[4];
6690   enum insn_code icode;
6691   rtx comparison;
6692   machine_mode mask_mode = TYPE_MODE (type);
6693   machine_mode vmode;
6694   bool unsignedp;
6695   tree op0a, op0b;
6696   enum tree_code tcode;
6697
6698   op0a = TREE_OPERAND (exp, 0);
6699   op0b = TREE_OPERAND (exp, 1);
6700   tcode = TREE_CODE (exp);
6701
6702   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6703   vmode = TYPE_MODE (TREE_TYPE (op0a));
6704
6705   icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
6706   if (icode == CODE_FOR_nothing)
6707     {
6708       if (tcode == EQ_EXPR || tcode == NE_EXPR)
6709         icode = get_vec_cmp_eq_icode (vmode, mask_mode);
6710       if (icode == CODE_FOR_nothing)
6711         return 0;
6712     }
6713
6714   comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
6715                                    unsignedp, icode, 2);
6716   create_output_operand (&ops[0], target, mask_mode);
6717   create_fixed_operand (&ops[1], comparison);
6718   create_fixed_operand (&ops[2], XEXP (comparison, 0));
6719   create_fixed_operand (&ops[3], XEXP (comparison, 1));
6720   expand_insn (icode, 4, ops);
6721   return ops[0].value;
6722 }
6723
6724 /* Expand a highpart multiply.  */
6725
6726 rtx
6727 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
6728                       rtx target, bool uns_p)
6729 {
6730   class expand_operand eops[3];
6731   enum insn_code icode;
6732   int method, i;
6733   machine_mode wmode;
6734   rtx m1, m2;
6735   optab tab1, tab2;
6736
6737   method = can_mult_highpart_p (mode, uns_p);
6738   switch (method)
6739     {
6740     case 0:
6741       return NULL_RTX;
6742     case 1:
6743       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6744       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6745                            OPTAB_LIB_WIDEN);
6746     case 2:
6747       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6748       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6749       break;
6750     case 3:
6751       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6752       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6753       if (BYTES_BIG_ENDIAN)
6754         std::swap (tab1, tab2);
6755       break;
6756     default:
6757       gcc_unreachable ();
6758     }
6759
6760   icode = optab_handler (tab1, mode);
6761   wmode = insn_data[icode].operand[0].mode;
6762   gcc_checking_assert (known_eq (2 * GET_MODE_NUNITS (wmode),
6763                                  GET_MODE_NUNITS (mode)));
6764   gcc_checking_assert (known_eq (GET_MODE_SIZE (wmode), GET_MODE_SIZE (mode)));
6765
6766   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6767   create_input_operand (&eops[1], op0, mode);
6768   create_input_operand (&eops[2], op1, mode);
6769   expand_insn (icode, 3, eops);
6770   m1 = gen_lowpart (mode, eops[0].value);
6771
6772   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6773   create_input_operand (&eops[1], op0, mode);
6774   create_input_operand (&eops[2], op1, mode);
6775   expand_insn (optab_handler (tab2, mode), 3, eops);
6776   m2 = gen_lowpart (mode, eops[0].value);
6777
6778   vec_perm_builder sel;
6779   if (method == 2)
6780     {
6781       /* The encoding has 2 interleaved stepped patterns.  */
6782       sel.new_vector (GET_MODE_NUNITS (mode), 2, 3);
6783       for (i = 0; i < 6; ++i)
6784         sel.quick_push (!BYTES_BIG_ENDIAN + (i & ~1)
6785                         + ((i & 1) ? GET_MODE_NUNITS (mode) : 0));
6786     }
6787   else
6788     {
6789       /* The encoding has a single interleaved stepped pattern.  */
6790       sel.new_vector (GET_MODE_NUNITS (mode), 1, 3);
6791       for (i = 0; i < 3; ++i)
6792         sel.quick_push (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
6793     }
6794
6795   return expand_vec_perm_const (mode, m1, m2, sel, BLKmode, target);
6796 }
6797 \f
6798 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
6799    pattern.  */
6800
6801 static void
6802 find_cc_set (rtx x, const_rtx pat, void *data)
6803 {
6804   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
6805       && GET_CODE (pat) == SET)
6806     {
6807       rtx *p_cc_reg = (rtx *) data;
6808       gcc_assert (!*p_cc_reg);
6809       *p_cc_reg = x;
6810     }
6811 }
6812
6813 /* This is a helper function for the other atomic operations.  This function
6814    emits a loop that contains SEQ that iterates until a compare-and-swap
6815    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
6816    a set of instructions that takes a value from OLD_REG as an input and
6817    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
6818    set to the current contents of MEM.  After SEQ, a compare-and-swap will
6819    attempt to update MEM with NEW_REG.  The function returns true when the
6820    loop was generated successfully.  */
6821
6822 static bool
6823 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
6824 {
6825   machine_mode mode = GET_MODE (mem);
6826   rtx_code_label *label;
6827   rtx cmp_reg, success, oldval;
6828
6829   /* The loop we want to generate looks like
6830
6831         cmp_reg = mem;
6832       label:
6833         old_reg = cmp_reg;
6834         seq;
6835         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
6836         if (success)
6837           goto label;
6838
6839      Note that we only do the plain load from memory once.  Subsequent
6840      iterations use the value loaded by the compare-and-swap pattern.  */
6841
6842   label = gen_label_rtx ();
6843   cmp_reg = gen_reg_rtx (mode);
6844
6845   emit_move_insn (cmp_reg, mem);
6846   emit_label (label);
6847   emit_move_insn (old_reg, cmp_reg);
6848   if (seq)
6849     emit_insn (seq);
6850
6851   success = NULL_RTX;
6852   oldval = cmp_reg;
6853   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
6854                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
6855                                        MEMMODEL_RELAXED))
6856     return false;
6857
6858   if (oldval != cmp_reg)
6859     emit_move_insn (cmp_reg, oldval);
6860
6861   /* Mark this jump predicted not taken.  */
6862   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
6863                            GET_MODE (success), 1, label,
6864                            profile_probability::guessed_never ());
6865   return true;
6866 }
6867
6868
6869 /* This function tries to emit an atomic_exchange intruction.  VAL is written
6870    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
6871    using TARGET if possible.  */
6872
6873 static rtx
6874 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6875 {
6876   machine_mode mode = GET_MODE (mem);
6877   enum insn_code icode;
6878
6879   /* If the target supports the exchange directly, great.  */
6880   icode = direct_optab_handler (atomic_exchange_optab, mode);
6881   if (icode != CODE_FOR_nothing)
6882     {
6883       class expand_operand ops[4];
6884
6885       create_output_operand (&ops[0], target, mode);
6886       create_fixed_operand (&ops[1], mem);
6887       create_input_operand (&ops[2], val, mode);
6888       create_integer_operand (&ops[3], model);
6889       if (maybe_expand_insn (icode, 4, ops))
6890         return ops[0].value;
6891     }
6892
6893   return NULL_RTX;
6894 }
6895
6896 /* This function tries to implement an atomic exchange operation using
6897    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
6898    The previous contents of *MEM are returned, using TARGET if possible.
6899    Since this instructionn is an acquire barrier only, stronger memory
6900    models may require additional barriers to be emitted.  */
6901
6902 static rtx
6903 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
6904                                    enum memmodel model)
6905 {
6906   machine_mode mode = GET_MODE (mem);
6907   enum insn_code icode;
6908   rtx_insn *last_insn = get_last_insn ();
6909
6910   icode = optab_handler (sync_lock_test_and_set_optab, mode);
6911
6912   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
6913      exists, and the memory model is stronger than acquire, add a release
6914      barrier before the instruction.  */
6915
6916   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
6917     expand_mem_thread_fence (model);
6918
6919   if (icode != CODE_FOR_nothing)
6920     {
6921       class expand_operand ops[3];
6922       create_output_operand (&ops[0], target, mode);
6923       create_fixed_operand (&ops[1], mem);
6924       create_input_operand (&ops[2], val, mode);
6925       if (maybe_expand_insn (icode, 3, ops))
6926         return ops[0].value;
6927     }
6928
6929   /* If an external test-and-set libcall is provided, use that instead of
6930      any external compare-and-swap that we might get from the compare-and-
6931      swap-loop expansion later.  */
6932   if (!can_compare_and_swap_p (mode, false))
6933     {
6934       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
6935       if (libfunc != NULL)
6936         {
6937           rtx addr;
6938
6939           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6940           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6941                                           mode, addr, ptr_mode,
6942                                           val, mode);
6943         }
6944     }
6945
6946   /* If the test_and_set can't be emitted, eliminate any barrier that might
6947      have been emitted.  */
6948   delete_insns_since (last_insn);
6949   return NULL_RTX;
6950 }
6951
6952 /* This function tries to implement an atomic exchange operation using a
6953    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
6954    *MEM are returned, using TARGET if possible.  No memory model is required
6955    since a compare_and_swap loop is seq-cst.  */
6956
6957 static rtx
6958 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
6959 {
6960   machine_mode mode = GET_MODE (mem);
6961
6962   if (can_compare_and_swap_p (mode, true))
6963     {
6964       if (!target || !register_operand (target, mode))
6965         target = gen_reg_rtx (mode);
6966       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
6967         return target;
6968     }
6969
6970   return NULL_RTX;
6971 }
6972
6973 /* This function tries to implement an atomic test-and-set operation
6974    using the atomic_test_and_set instruction pattern.  A boolean value
6975    is returned from the operation, using TARGET if possible.  */
6976
6977 static rtx
6978 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6979 {
6980   machine_mode pat_bool_mode;
6981   class expand_operand ops[3];
6982
6983   if (!targetm.have_atomic_test_and_set ())
6984     return NULL_RTX;
6985
6986   /* While we always get QImode from __atomic_test_and_set, we get
6987      other memory modes from __sync_lock_test_and_set.  Note that we
6988      use no endian adjustment here.  This matches the 4.6 behavior
6989      in the Sparc backend.  */
6990   enum insn_code icode = targetm.code_for_atomic_test_and_set;
6991   gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
6992   if (GET_MODE (mem) != QImode)
6993     mem = adjust_address_nv (mem, QImode, 0);
6994
6995   pat_bool_mode = insn_data[icode].operand[0].mode;
6996   create_output_operand (&ops[0], target, pat_bool_mode);
6997   create_fixed_operand (&ops[1], mem);
6998   create_integer_operand (&ops[2], model);
6999
7000   if (maybe_expand_insn (icode, 3, ops))
7001     return ops[0].value;
7002   return NULL_RTX;
7003 }
7004
7005 /* This function expands the legacy _sync_lock test_and_set operation which is
7006    generally an atomic exchange.  Some limited targets only allow the
7007    constant 1 to be stored.  This is an ACQUIRE operation.
7008
7009    TARGET is an optional place to stick the return value.
7010    MEM is where VAL is stored.  */
7011
7012 rtx
7013 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7014 {
7015   rtx ret;
7016
7017   /* Try an atomic_exchange first.  */
7018   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
7019   if (ret)
7020     return ret;
7021
7022   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
7023                                            MEMMODEL_SYNC_ACQUIRE);
7024   if (ret)
7025     return ret;
7026
7027   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7028   if (ret)
7029     return ret;
7030
7031   /* If there are no other options, try atomic_test_and_set if the value
7032      being stored is 1.  */
7033   if (val == const1_rtx)
7034     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
7035
7036   return ret;
7037 }
7038
7039 /* This function expands the atomic test_and_set operation:
7040    atomically store a boolean TRUE into MEM and return the previous value.
7041
7042    MEMMODEL is the memory model variant to use.
7043    TARGET is an optional place to stick the return value.  */
7044
7045 rtx
7046 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7047 {
7048   machine_mode mode = GET_MODE (mem);
7049   rtx ret, trueval, subtarget;
7050
7051   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7052   if (ret)
7053     return ret;
7054
7055   /* Be binary compatible with non-default settings of trueval, and different
7056      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7057      another only has atomic-exchange.  */
7058   if (targetm.atomic_test_and_set_trueval == 1)
7059     {
7060       trueval = const1_rtx;
7061       subtarget = target ? target : gen_reg_rtx (mode);
7062     }
7063   else
7064     {
7065       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7066       subtarget = gen_reg_rtx (mode);
7067     }
7068
7069   /* Try the atomic-exchange optab...  */
7070   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7071
7072   /* ... then an atomic-compare-and-swap loop ... */
7073   if (!ret)
7074     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7075
7076   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7077   if (!ret)
7078     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7079
7080   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7081      things with the value 1.  Thus we try again without trueval.  */
7082   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7083     {
7084       ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7085
7086       if (ret)
7087         {
7088           /* Rectify the not-one trueval.  */
7089           ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7090           gcc_assert (ret);
7091         }
7092     }
7093
7094   return ret;
7095 }
7096
7097 /* This function expands the atomic exchange operation:
7098    atomically store VAL in MEM and return the previous value in MEM.
7099
7100    MEMMODEL is the memory model variant to use.
7101    TARGET is an optional place to stick the return value.  */
7102
7103 rtx
7104 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7105 {
7106   machine_mode mode = GET_MODE (mem);
7107   rtx ret;
7108
7109   /* If loads are not atomic for the required size and we are not called to
7110      provide a __sync builtin, do not do anything so that we stay consistent
7111      with atomic loads of the same size.  */
7112   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
7113     return NULL_RTX;
7114
7115   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7116
7117   /* Next try a compare-and-swap loop for the exchange.  */
7118   if (!ret)
7119     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7120
7121   return ret;
7122 }
7123
7124 /* This function expands the atomic compare exchange operation:
7125
7126    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7127    *PTARGET_OVAL is an optional place to store the old value from memory.
7128    Both target parameters may be NULL or const0_rtx to indicate that we do
7129    not care about that return value.  Both target parameters are updated on
7130    success to the actual location of the corresponding result.
7131
7132    MEMMODEL is the memory model variant to use.
7133
7134    The return value of the function is true for success.  */
7135
7136 bool
7137 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7138                                 rtx mem, rtx expected, rtx desired,
7139                                 bool is_weak, enum memmodel succ_model,
7140                                 enum memmodel fail_model)
7141 {
7142   machine_mode mode = GET_MODE (mem);
7143   class expand_operand ops[8];
7144   enum insn_code icode;
7145   rtx target_oval, target_bool = NULL_RTX;
7146   rtx libfunc;
7147
7148   /* If loads are not atomic for the required size and we are not called to
7149      provide a __sync builtin, do not do anything so that we stay consistent
7150      with atomic loads of the same size.  */
7151   if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
7152     return false;
7153
7154   /* Load expected into a register for the compare and swap.  */
7155   if (MEM_P (expected))
7156     expected = copy_to_reg (expected);
7157
7158   /* Make sure we always have some place to put the return oldval.
7159      Further, make sure that place is distinct from the input expected,
7160      just in case we need that path down below.  */
7161   if (ptarget_oval && *ptarget_oval == const0_rtx)
7162     ptarget_oval = NULL;
7163
7164   if (ptarget_oval == NULL
7165       || (target_oval = *ptarget_oval) == NULL
7166       || reg_overlap_mentioned_p (expected, target_oval))
7167     target_oval = gen_reg_rtx (mode);
7168
7169   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7170   if (icode != CODE_FOR_nothing)
7171     {
7172       machine_mode bool_mode = insn_data[icode].operand[0].mode;
7173
7174       if (ptarget_bool && *ptarget_bool == const0_rtx)
7175         ptarget_bool = NULL;
7176
7177       /* Make sure we always have a place for the bool operand.  */
7178       if (ptarget_bool == NULL
7179           || (target_bool = *ptarget_bool) == NULL
7180           || GET_MODE (target_bool) != bool_mode)
7181         target_bool = gen_reg_rtx (bool_mode);
7182
7183       /* Emit the compare_and_swap.  */
7184       create_output_operand (&ops[0], target_bool, bool_mode);
7185       create_output_operand (&ops[1], target_oval, mode);
7186       create_fixed_operand (&ops[2], mem);
7187       create_input_operand (&ops[3], expected, mode);
7188       create_input_operand (&ops[4], desired, mode);
7189       create_integer_operand (&ops[5], is_weak);
7190       create_integer_operand (&ops[6], succ_model);
7191       create_integer_operand (&ops[7], fail_model);
7192       if (maybe_expand_insn (icode, 8, ops))
7193         {
7194           /* Return success/failure.  */
7195           target_bool = ops[0].value;
7196           target_oval = ops[1].value;
7197           goto success;
7198         }
7199     }
7200
7201   /* Otherwise fall back to the original __sync_val_compare_and_swap
7202      which is always seq-cst.  */
7203   icode = optab_handler (sync_compare_and_swap_optab, mode);
7204   if (icode != CODE_FOR_nothing)
7205     {
7206       rtx cc_reg;
7207
7208       create_output_operand (&ops[0], target_oval, mode);
7209       create_fixed_operand (&ops[1], mem);
7210       create_input_operand (&ops[2], expected, mode);
7211       create_input_operand (&ops[3], desired, mode);
7212       if (!maybe_expand_insn (icode, 4, ops))
7213         return false;
7214
7215       target_oval = ops[0].value;
7216
7217       /* If the caller isn't interested in the boolean return value,
7218          skip the computation of it.  */
7219       if (ptarget_bool == NULL)
7220         goto success;
7221
7222       /* Otherwise, work out if the compare-and-swap succeeded.  */
7223       cc_reg = NULL_RTX;
7224       if (have_insn_for (COMPARE, CCmode))
7225         note_stores (get_last_insn (), find_cc_set, &cc_reg);
7226       if (cc_reg)
7227         {
7228           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7229                                                const0_rtx, VOIDmode, 0, 1);
7230           goto success;
7231         }
7232       goto success_bool_from_val;
7233     }
7234
7235   /* Also check for library support for __sync_val_compare_and_swap.  */
7236   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7237   if (libfunc != NULL)
7238     {
7239       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7240       rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7241                                             mode, addr, ptr_mode,
7242                                             expected, mode, desired, mode);
7243       emit_move_insn (target_oval, target);
7244
7245       /* Compute the boolean return value only if requested.  */
7246       if (ptarget_bool)
7247         goto success_bool_from_val;
7248       else
7249         goto success;
7250     }
7251
7252   /* Failure.  */
7253   return false;
7254
7255  success_bool_from_val:
7256    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7257                                         expected, VOIDmode, 1, 1);
7258  success:
7259   /* Make sure that the oval output winds up where the caller asked.  */
7260   if (ptarget_oval)
7261     *ptarget_oval = target_oval;
7262   if (ptarget_bool)
7263     *ptarget_bool = target_bool;
7264   return true;
7265 }
7266
7267 /* Generate asm volatile("" : : : "memory") as the memory blockage.  */
7268
7269 static void
7270 expand_asm_memory_blockage (void)
7271 {
7272   rtx asm_op, clob;
7273
7274   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
7275                                  rtvec_alloc (0), rtvec_alloc (0),
7276                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7277   MEM_VOLATILE_P (asm_op) = 1;
7278
7279   clob = gen_rtx_SCRATCH (VOIDmode);
7280   clob = gen_rtx_MEM (BLKmode, clob);
7281   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7282
7283   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7284 }
7285
7286 /* Do not propagate memory accesses across this point.  */
7287
7288 static void
7289 expand_memory_blockage (void)
7290 {
7291   if (targetm.have_memory_blockage ())
7292     emit_insn (targetm.gen_memory_blockage ());
7293   else
7294     expand_asm_memory_blockage ();
7295 }
7296
7297 /* Generate asm volatile("" : : : "memory") as a memory blockage, at the
7298    same time clobbering the register set specified by REGS.  */
7299
7300 void
7301 expand_asm_reg_clobber_mem_blockage (HARD_REG_SET regs)
7302 {
7303   rtx asm_op, clob_mem;
7304
7305   unsigned int num_of_regs = 0;
7306   for (unsigned int i = 0; i < FIRST_PSEUDO_REGISTER; i++)
7307     if (TEST_HARD_REG_BIT (regs, i))
7308       num_of_regs++;
7309
7310   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
7311                                  rtvec_alloc (0), rtvec_alloc (0),
7312                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7313   MEM_VOLATILE_P (asm_op) = 1;
7314
7315   rtvec v = rtvec_alloc (num_of_regs + 2);
7316
7317   clob_mem = gen_rtx_SCRATCH (VOIDmode);
7318   clob_mem = gen_rtx_MEM (BLKmode, clob_mem);
7319   clob_mem = gen_rtx_CLOBBER (VOIDmode, clob_mem);
7320
7321   RTVEC_ELT (v, 0) = asm_op;
7322   RTVEC_ELT (v, 1) = clob_mem;
7323
7324   if (num_of_regs > 0)
7325     {
7326       unsigned int j = 2;
7327       for (unsigned int i = 0; i < FIRST_PSEUDO_REGISTER; i++)
7328         if (TEST_HARD_REG_BIT (regs, i))
7329           {
7330             RTVEC_ELT (v, j) = gen_rtx_CLOBBER (VOIDmode, regno_reg_rtx[i]);
7331             j++;
7332           }
7333       gcc_assert (j == (num_of_regs + 2));
7334     }
7335
7336   emit_insn (gen_rtx_PARALLEL (VOIDmode, v));
7337 }
7338
7339 /* This routine will either emit the mem_thread_fence pattern or issue a
7340    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7341
7342 void
7343 expand_mem_thread_fence (enum memmodel model)
7344 {
7345   if (is_mm_relaxed (model))
7346     return;
7347   if (targetm.have_mem_thread_fence ())
7348     {
7349       emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
7350       expand_memory_blockage ();
7351     }
7352   else if (targetm.have_memory_barrier ())
7353     emit_insn (targetm.gen_memory_barrier ());
7354   else if (synchronize_libfunc != NULL_RTX)
7355     emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode);
7356   else
7357     expand_memory_blockage ();
7358 }
7359
7360 /* Emit a signal fence with given memory model.  */
7361
7362 void
7363 expand_mem_signal_fence (enum memmodel model)
7364 {
7365   /* No machine barrier is required to implement a signal fence, but
7366      a compiler memory barrier must be issued, except for relaxed MM.  */
7367   if (!is_mm_relaxed (model))
7368     expand_memory_blockage ();
7369 }
7370
7371 /* This function expands the atomic load operation:
7372    return the atomically loaded value in MEM.
7373
7374    MEMMODEL is the memory model variant to use.
7375    TARGET is an option place to stick the return value.  */
7376
7377 rtx
7378 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7379 {
7380   machine_mode mode = GET_MODE (mem);
7381   enum insn_code icode;
7382
7383   /* If the target supports the load directly, great.  */
7384   icode = direct_optab_handler (atomic_load_optab, mode);
7385   if (icode != CODE_FOR_nothing)
7386     {
7387       class expand_operand ops[3];
7388       rtx_insn *last = get_last_insn ();
7389       if (is_mm_seq_cst (model))
7390         expand_memory_blockage ();
7391
7392       create_output_operand (&ops[0], target, mode);
7393       create_fixed_operand (&ops[1], mem);
7394       create_integer_operand (&ops[2], model);
7395       if (maybe_expand_insn (icode, 3, ops))
7396         {
7397           if (!is_mm_relaxed (model))
7398             expand_memory_blockage ();
7399           return ops[0].value;
7400         }
7401       delete_insns_since (last);
7402     }
7403
7404   /* If the size of the object is greater than word size on this target,
7405      then we assume that a load will not be atomic.  We could try to
7406      emulate a load with a compare-and-swap operation, but the store that
7407      doing this could result in would be incorrect if this is a volatile
7408      atomic load or targetting read-only-mapped memory.  */
7409   if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
7410     /* If there is no atomic load, leave the library call.  */
7411     return NULL_RTX;
7412
7413   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7414   if (!target || target == const0_rtx)
7415     target = gen_reg_rtx (mode);
7416
7417   /* For SEQ_CST, emit a barrier before the load.  */
7418   if (is_mm_seq_cst (model))
7419     expand_mem_thread_fence (model);
7420
7421   emit_move_insn (target, mem);
7422
7423   /* Emit the appropriate barrier after the load.  */
7424   expand_mem_thread_fence (model);
7425
7426   return target;
7427 }
7428
7429 /* This function expands the atomic store operation:
7430    Atomically store VAL in MEM.
7431    MEMMODEL is the memory model variant to use.
7432    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7433    function returns const0_rtx if a pattern was emitted.  */
7434
7435 rtx
7436 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7437 {
7438   machine_mode mode = GET_MODE (mem);
7439   enum insn_code icode;
7440   class expand_operand ops[3];
7441
7442   /* If the target supports the store directly, great.  */
7443   icode = direct_optab_handler (atomic_store_optab, mode);
7444   if (icode != CODE_FOR_nothing)
7445     {
7446       rtx_insn *last = get_last_insn ();
7447       if (!is_mm_relaxed (model))
7448         expand_memory_blockage ();
7449       create_fixed_operand (&ops[0], mem);
7450       create_input_operand (&ops[1], val, mode);
7451       create_integer_operand (&ops[2], model);
7452       if (maybe_expand_insn (icode, 3, ops))
7453         {
7454           if (is_mm_seq_cst (model))
7455             expand_memory_blockage ();
7456           return const0_rtx;
7457         }
7458       delete_insns_since (last);
7459     }
7460
7461   /* If using __sync_lock_release is a viable alternative, try it.
7462      Note that this will not be set to true if we are expanding a generic
7463      __atomic_store_n.  */
7464   if (use_release)
7465     {
7466       icode = direct_optab_handler (sync_lock_release_optab, mode);
7467       if (icode != CODE_FOR_nothing)
7468         {
7469           create_fixed_operand (&ops[0], mem);
7470           create_input_operand (&ops[1], const0_rtx, mode);
7471           if (maybe_expand_insn (icode, 2, ops))
7472             {
7473               /* lock_release is only a release barrier.  */
7474               if (is_mm_seq_cst (model))
7475                 expand_mem_thread_fence (model);
7476               return const0_rtx;
7477             }
7478         }
7479     }
7480
7481   /* If the size of the object is greater than word size on this target,
7482      a default store will not be atomic.  */
7483   if (maybe_gt (GET_MODE_PRECISION (mode), BITS_PER_WORD))
7484     {
7485       /* If loads are atomic or we are called to provide a __sync builtin,
7486          we can try a atomic_exchange and throw away the result.  Otherwise,
7487          don't do anything so that we do not create an inconsistency between
7488          loads and stores.  */
7489       if (can_atomic_load_p (mode) || is_mm_sync (model))
7490         {
7491           rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7492           if (!target)
7493             target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
7494                                                                 val);
7495           if (target)
7496             return const0_rtx;
7497         }
7498         return NULL_RTX;
7499     }
7500
7501   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7502   expand_mem_thread_fence (model);
7503
7504   emit_move_insn (mem, val);
7505
7506   /* For SEQ_CST, also emit a barrier after the store.  */
7507   if (is_mm_seq_cst (model))
7508     expand_mem_thread_fence (model);
7509
7510   return const0_rtx;
7511 }
7512
7513
7514 /* Structure containing the pointers and values required to process the
7515    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7516
7517 struct atomic_op_functions
7518 {
7519   direct_optab mem_fetch_before;
7520   direct_optab mem_fetch_after;
7521   direct_optab mem_no_result;
7522   optab fetch_before;
7523   optab fetch_after;
7524   direct_optab no_result;
7525   enum rtx_code reverse_code;
7526 };
7527
7528
7529 /* Fill in structure pointed to by OP with the various optab entries for an
7530    operation of type CODE.  */
7531
7532 static void
7533 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7534 {
7535   gcc_assert (op!= NULL);
7536
7537   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7538      in the source code during compilation, and the optab entries are not
7539      computable until runtime.  Fill in the values at runtime.  */
7540   switch (code)
7541     {
7542     case PLUS:
7543       op->mem_fetch_before = atomic_fetch_add_optab;
7544       op->mem_fetch_after = atomic_add_fetch_optab;
7545       op->mem_no_result = atomic_add_optab;
7546       op->fetch_before = sync_old_add_optab;
7547       op->fetch_after = sync_new_add_optab;
7548       op->no_result = sync_add_optab;
7549       op->reverse_code = MINUS;
7550       break;
7551     case MINUS:
7552       op->mem_fetch_before = atomic_fetch_sub_optab;
7553       op->mem_fetch_after = atomic_sub_fetch_optab;
7554       op->mem_no_result = atomic_sub_optab;
7555       op->fetch_before = sync_old_sub_optab;
7556       op->fetch_after = sync_new_sub_optab;
7557       op->no_result = sync_sub_optab;
7558       op->reverse_code = PLUS;
7559       break;
7560     case XOR:
7561       op->mem_fetch_before = atomic_fetch_xor_optab;
7562       op->mem_fetch_after = atomic_xor_fetch_optab;
7563       op->mem_no_result = atomic_xor_optab;
7564       op->fetch_before = sync_old_xor_optab;
7565       op->fetch_after = sync_new_xor_optab;
7566       op->no_result = sync_xor_optab;
7567       op->reverse_code = XOR;
7568       break;
7569     case AND:
7570       op->mem_fetch_before = atomic_fetch_and_optab;
7571       op->mem_fetch_after = atomic_and_fetch_optab;
7572       op->mem_no_result = atomic_and_optab;
7573       op->fetch_before = sync_old_and_optab;
7574       op->fetch_after = sync_new_and_optab;
7575       op->no_result = sync_and_optab;
7576       op->reverse_code = UNKNOWN;
7577       break;
7578     case IOR:
7579       op->mem_fetch_before = atomic_fetch_or_optab;
7580       op->mem_fetch_after = atomic_or_fetch_optab;
7581       op->mem_no_result = atomic_or_optab;
7582       op->fetch_before = sync_old_ior_optab;
7583       op->fetch_after = sync_new_ior_optab;
7584       op->no_result = sync_ior_optab;
7585       op->reverse_code = UNKNOWN;
7586       break;
7587     case NOT:
7588       op->mem_fetch_before = atomic_fetch_nand_optab;
7589       op->mem_fetch_after = atomic_nand_fetch_optab;
7590       op->mem_no_result = atomic_nand_optab;
7591       op->fetch_before = sync_old_nand_optab;
7592       op->fetch_after = sync_new_nand_optab;
7593       op->no_result = sync_nand_optab;
7594       op->reverse_code = UNKNOWN;
7595       break;
7596     default:
7597       gcc_unreachable ();
7598     }
7599 }
7600
7601 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7602    using memory order MODEL.  If AFTER is true the operation needs to return
7603    the value of *MEM after the operation, otherwise the previous value.
7604    TARGET is an optional place to place the result.  The result is unused if
7605    it is const0_rtx.
7606    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7607
7608 static rtx
7609 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7610                          enum memmodel model, bool after)
7611 {
7612   /* If the value is prefetched, or not used, it may be possible to replace
7613      the sequence with a native exchange operation.  */
7614   if (!after || target == const0_rtx)
7615     {
7616       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7617       if (code == AND && val == const0_rtx)
7618         {
7619           if (target == const0_rtx)
7620             target = gen_reg_rtx (GET_MODE (mem));
7621           return maybe_emit_atomic_exchange (target, mem, val, model);
7622         }
7623
7624       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7625       if (code == IOR && val == constm1_rtx)
7626         {
7627           if (target == const0_rtx)
7628             target = gen_reg_rtx (GET_MODE (mem));
7629           return maybe_emit_atomic_exchange (target, mem, val, model);
7630         }
7631     }
7632
7633   return NULL_RTX;
7634 }
7635
7636 /* Try to emit an instruction for a specific operation varaition.
7637    OPTAB contains the OP functions.
7638    TARGET is an optional place to return the result. const0_rtx means unused.
7639    MEM is the memory location to operate on.
7640    VAL is the value to use in the operation.
7641    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7642    MODEL is the memory model, if used.
7643    AFTER is true if the returned result is the value after the operation.  */
7644
7645 static rtx
7646 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7647                rtx val, bool use_memmodel, enum memmodel model, bool after)
7648 {
7649   machine_mode mode = GET_MODE (mem);
7650   class expand_operand ops[4];
7651   enum insn_code icode;
7652   int op_counter = 0;
7653   int num_ops;
7654
7655   /* Check to see if there is a result returned.  */
7656   if (target == const0_rtx)
7657     {
7658       if (use_memmodel)
7659         {
7660           icode = direct_optab_handler (optab->mem_no_result, mode);
7661           create_integer_operand (&ops[2], model);
7662           num_ops = 3;
7663         }
7664       else
7665         {
7666           icode = direct_optab_handler (optab->no_result, mode);
7667           num_ops = 2;
7668         }
7669     }
7670   /* Otherwise, we need to generate a result.  */
7671   else
7672     {
7673       if (use_memmodel)
7674         {
7675           icode = direct_optab_handler (after ? optab->mem_fetch_after
7676                                         : optab->mem_fetch_before, mode);
7677           create_integer_operand (&ops[3], model);
7678           num_ops = 4;
7679         }
7680       else
7681         {
7682           icode = optab_handler (after ? optab->fetch_after
7683                                  : optab->fetch_before, mode);
7684           num_ops = 3;
7685         }
7686       create_output_operand (&ops[op_counter++], target, mode);
7687     }
7688   if (icode == CODE_FOR_nothing)
7689     return NULL_RTX;
7690
7691   create_fixed_operand (&ops[op_counter++], mem);
7692   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7693   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7694
7695   if (maybe_expand_insn (icode, num_ops, ops))
7696     return (target == const0_rtx ? const0_rtx : ops[0].value);
7697
7698   return NULL_RTX;
7699 }
7700
7701
7702 /* This function expands an atomic fetch_OP or OP_fetch operation:
7703    TARGET is an option place to stick the return value.  const0_rtx indicates
7704    the result is unused.
7705    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7706    CODE is the operation being performed (OP)
7707    MEMMODEL is the memory model variant to use.
7708    AFTER is true to return the result of the operation (OP_fetch).
7709    AFTER is false to return the value before the operation (fetch_OP).
7710
7711    This function will *only* generate instructions if there is a direct
7712    optab. No compare and swap loops or libcalls will be generated. */
7713
7714 static rtx
7715 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7716                                     enum rtx_code code, enum memmodel model,
7717                                     bool after)
7718 {
7719   machine_mode mode = GET_MODE (mem);
7720   struct atomic_op_functions optab;
7721   rtx result;
7722   bool unused_result = (target == const0_rtx);
7723
7724   get_atomic_op_for_code (&optab, code);
7725
7726   /* Check to see if there are any better instructions.  */
7727   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7728   if (result)
7729     return result;
7730
7731   /* Check for the case where the result isn't used and try those patterns.  */
7732   if (unused_result)
7733     {
7734       /* Try the memory model variant first.  */
7735       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7736       if (result)
7737         return result;
7738
7739       /* Next try the old style withuot a memory model.  */
7740       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7741       if (result)
7742         return result;
7743
7744       /* There is no no-result pattern, so try patterns with a result.  */
7745       target = NULL_RTX;
7746     }
7747
7748   /* Try the __atomic version.  */
7749   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7750   if (result)
7751     return result;
7752
7753   /* Try the older __sync version.  */
7754   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7755   if (result)
7756     return result;
7757
7758   /* If the fetch value can be calculated from the other variation of fetch,
7759      try that operation.  */
7760   if (after || unused_result || optab.reverse_code != UNKNOWN)
7761     {
7762       /* Try the __atomic version, then the older __sync version.  */
7763       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7764       if (!result)
7765         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7766
7767       if (result)
7768         {
7769           /* If the result isn't used, no need to do compensation code.  */
7770           if (unused_result)
7771             return result;
7772
7773           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
7774              Fetch_before == after REVERSE_OP val.  */
7775           if (!after)
7776             code = optab.reverse_code;
7777           if (code == NOT)
7778             {
7779               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
7780                                             true, OPTAB_LIB_WIDEN);
7781               result = expand_simple_unop (mode, NOT, result, target, true);
7782             }
7783           else
7784             result = expand_simple_binop (mode, code, result, val, target,
7785                                           true, OPTAB_LIB_WIDEN);
7786           return result;
7787         }
7788     }
7789
7790   /* No direct opcode can be generated.  */
7791   return NULL_RTX;
7792 }
7793
7794
7795
7796 /* This function expands an atomic fetch_OP or OP_fetch operation:
7797    TARGET is an option place to stick the return value.  const0_rtx indicates
7798    the result is unused.
7799    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7800    CODE is the operation being performed (OP)
7801    MEMMODEL is the memory model variant to use.
7802    AFTER is true to return the result of the operation (OP_fetch).
7803    AFTER is false to return the value before the operation (fetch_OP).  */
7804 rtx
7805 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7806                         enum memmodel model, bool after)
7807 {
7808   machine_mode mode = GET_MODE (mem);
7809   rtx result;
7810   bool unused_result = (target == const0_rtx);
7811
7812   /* If loads are not atomic for the required size and we are not called to
7813      provide a __sync builtin, do not do anything so that we stay consistent
7814      with atomic loads of the same size.  */
7815   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
7816     return NULL_RTX;
7817
7818   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
7819                                                after);
7820
7821   if (result)
7822     return result;
7823
7824   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
7825   if (code == PLUS || code == MINUS)
7826     {
7827       rtx tmp;
7828       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
7829
7830       start_sequence ();
7831       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
7832       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
7833                                                    model, after);
7834       if (result)
7835         {
7836           /* PLUS worked so emit the insns and return.  */
7837           tmp = get_insns ();
7838           end_sequence ();
7839           emit_insn (tmp);
7840           return result;
7841         }
7842
7843       /* PLUS did not work, so throw away the negation code and continue.  */
7844       end_sequence ();
7845     }
7846
7847   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
7848   if (!can_compare_and_swap_p (mode, false))
7849     {
7850       rtx libfunc;
7851       bool fixup = false;
7852       enum rtx_code orig_code = code;
7853       struct atomic_op_functions optab;
7854
7855       get_atomic_op_for_code (&optab, code);
7856       libfunc = optab_libfunc (after ? optab.fetch_after
7857                                : optab.fetch_before, mode);
7858       if (libfunc == NULL
7859           && (after || unused_result || optab.reverse_code != UNKNOWN))
7860         {
7861           fixup = true;
7862           if (!after)
7863             code = optab.reverse_code;
7864           libfunc = optab_libfunc (after ? optab.fetch_before
7865                                    : optab.fetch_after, mode);
7866         }
7867       if (libfunc != NULL)
7868         {
7869           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7870           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
7871                                             addr, ptr_mode, val, mode);
7872
7873           if (!unused_result && fixup)
7874             result = expand_simple_binop (mode, code, result, val, target,
7875                                           true, OPTAB_LIB_WIDEN);
7876           return result;
7877         }
7878
7879       /* We need the original code for any further attempts.  */
7880       code = orig_code;
7881     }
7882
7883   /* If nothing else has succeeded, default to a compare and swap loop.  */
7884   if (can_compare_and_swap_p (mode, true))
7885     {
7886       rtx_insn *insn;
7887       rtx t0 = gen_reg_rtx (mode), t1;
7888
7889       start_sequence ();
7890
7891       /* If the result is used, get a register for it.  */
7892       if (!unused_result)
7893         {
7894           if (!target || !register_operand (target, mode))
7895             target = gen_reg_rtx (mode);
7896           /* If fetch_before, copy the value now.  */
7897           if (!after)
7898             emit_move_insn (target, t0);
7899         }
7900       else
7901         target = const0_rtx;
7902
7903       t1 = t0;
7904       if (code == NOT)
7905         {
7906           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
7907                                     true, OPTAB_LIB_WIDEN);
7908           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
7909         }
7910       else
7911         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
7912                                   OPTAB_LIB_WIDEN);
7913
7914       /* For after, copy the value now.  */
7915       if (!unused_result && after)
7916         emit_move_insn (target, t1);
7917       insn = get_insns ();
7918       end_sequence ();
7919
7920       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
7921         return target;
7922     }
7923
7924   return NULL_RTX;
7925 }
7926 \f
7927 /* Return true if OPERAND is suitable for operand number OPNO of
7928    instruction ICODE.  */
7929
7930 bool
7931 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
7932 {
7933   return (!insn_data[(int) icode].operand[opno].predicate
7934           || (insn_data[(int) icode].operand[opno].predicate
7935               (operand, insn_data[(int) icode].operand[opno].mode)));
7936 }
7937 \f
7938 /* TARGET is a target of a multiword operation that we are going to
7939    implement as a series of word-mode operations.  Return true if
7940    TARGET is suitable for this purpose.  */
7941
7942 bool
7943 valid_multiword_target_p (rtx target)
7944 {
7945   machine_mode mode;
7946   int i, size;
7947
7948   mode = GET_MODE (target);
7949   if (!GET_MODE_SIZE (mode).is_constant (&size))
7950     return false;
7951   for (i = 0; i < size; i += UNITS_PER_WORD)
7952     if (!validate_subreg (word_mode, mode, target, i))
7953       return false;
7954   return true;
7955 }
7956
7957 /* Make OP describe an input operand that has value INTVAL and that has
7958    no inherent mode.  This function should only be used for operands that
7959    are always expand-time constants.  The backend may request that INTVAL
7960    be copied into a different kind of rtx, but it must specify the mode
7961    of that rtx if so.  */
7962
7963 void
7964 create_integer_operand (class expand_operand *op, poly_int64 intval)
7965 {
7966   create_expand_operand (op, EXPAND_INTEGER,
7967                          gen_int_mode (intval, MAX_MODE_INT),
7968                          VOIDmode, false, intval);
7969 }
7970
7971 /* Like maybe_legitimize_operand, but do not change the code of the
7972    current rtx value.  */
7973
7974 static bool
7975 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
7976                                     class expand_operand *op)
7977 {
7978   /* See if the operand matches in its current form.  */
7979   if (insn_operand_matches (icode, opno, op->value))
7980     return true;
7981
7982   /* If the operand is a memory whose address has no side effects,
7983      try forcing the address into a non-virtual pseudo register.
7984      The check for side effects is important because copy_to_mode_reg
7985      cannot handle things like auto-modified addresses.  */
7986   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
7987     {
7988       rtx addr, mem;
7989
7990       mem = op->value;
7991       addr = XEXP (mem, 0);
7992       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
7993           && !side_effects_p (addr))
7994         {
7995           rtx_insn *last;
7996           machine_mode mode;
7997
7998           last = get_last_insn ();
7999           mode = get_address_mode (mem);
8000           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8001           if (insn_operand_matches (icode, opno, mem))
8002             {
8003               op->value = mem;
8004               return true;
8005             }
8006           delete_insns_since (last);
8007         }
8008     }
8009
8010   return false;
8011 }
8012
8013 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8014    on success, storing the new operand value back in OP.  */
8015
8016 static bool
8017 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8018                           class expand_operand *op)
8019 {
8020   machine_mode mode, imode, tmode;
8021
8022   mode = op->mode;
8023   switch (op->type)
8024     {
8025     case EXPAND_FIXED:
8026       {
8027         temporary_volatile_ok v (true);
8028         return maybe_legitimize_operand_same_code (icode, opno, op);
8029       }
8030
8031     case EXPAND_OUTPUT:
8032       gcc_assert (mode != VOIDmode);
8033       if (op->value
8034           && op->value != const0_rtx
8035           && GET_MODE (op->value) == mode
8036           && maybe_legitimize_operand_same_code (icode, opno, op))
8037         return true;
8038
8039       op->value = gen_reg_rtx (mode);
8040       op->target = 0;
8041       break;
8042
8043     case EXPAND_INPUT:
8044     input:
8045       gcc_assert (mode != VOIDmode);
8046       gcc_assert (GET_MODE (op->value) == VOIDmode
8047                   || GET_MODE (op->value) == mode);
8048       if (maybe_legitimize_operand_same_code (icode, opno, op))
8049         return true;
8050
8051       op->value = copy_to_mode_reg (mode, op->value);
8052       break;
8053
8054     case EXPAND_CONVERT_TO:
8055       gcc_assert (mode != VOIDmode);
8056       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8057       goto input;
8058
8059     case EXPAND_CONVERT_FROM:
8060       if (GET_MODE (op->value) != VOIDmode)
8061         mode = GET_MODE (op->value);
8062       else
8063         /* The caller must tell us what mode this value has.  */
8064         gcc_assert (mode != VOIDmode);
8065
8066       imode = insn_data[(int) icode].operand[opno].mode;
8067       tmode = (VECTOR_MODE_P (imode) && !VECTOR_MODE_P (mode)
8068                ? GET_MODE_INNER (imode) : imode);
8069       if (tmode != VOIDmode && tmode != mode)
8070         {
8071           op->value = convert_modes (tmode, mode, op->value, op->unsigned_p);
8072           mode = tmode;
8073         }
8074       if (imode != VOIDmode && imode != mode)
8075         {
8076           gcc_assert (VECTOR_MODE_P (imode) && !VECTOR_MODE_P (mode));
8077           op->value = expand_vector_broadcast (imode, op->value);
8078           mode = imode;
8079         }
8080       goto input;
8081
8082     case EXPAND_ADDRESS:
8083       op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
8084                                           op->value);
8085       goto input;
8086
8087     case EXPAND_INTEGER:
8088       mode = insn_data[(int) icode].operand[opno].mode;
8089       if (mode != VOIDmode
8090           && known_eq (trunc_int_for_mode (op->int_value, mode),
8091                        op->int_value))
8092         {
8093           op->value = gen_int_mode (op->int_value, mode);
8094           goto input;
8095         }
8096       break;
8097
8098     case EXPAND_UNDEFINED_INPUT:
8099       /* See if the predicate accepts a SCRATCH rtx, which in this context
8100          indicates an undefined value.  Use an uninitialized register if not. */
8101       if (!insn_operand_matches (icode, opno, op->value))
8102         {
8103           op->value = gen_reg_rtx (op->mode);
8104           goto input;
8105         }
8106       return true;
8107     }
8108   return insn_operand_matches (icode, opno, op->value);
8109 }
8110
8111 /* Make OP describe an input operand that should have the same value
8112    as VALUE, after any mode conversion that the target might request.
8113    TYPE is the type of VALUE.  */
8114
8115 void
8116 create_convert_operand_from_type (class expand_operand *op,
8117                                   rtx value, tree type)
8118 {
8119   create_convert_operand_from (op, value, TYPE_MODE (type),
8120                                TYPE_UNSIGNED (type));
8121 }
8122
8123 /* Return true if the requirements on operands OP1 and OP2 of instruction
8124    ICODE are similar enough for the result of legitimizing OP1 to be
8125    reusable for OP2.  OPNO1 and OPNO2 are the operand numbers associated
8126    with OP1 and OP2 respectively.  */
8127
8128 static inline bool
8129 can_reuse_operands_p (enum insn_code icode,
8130                       unsigned int opno1, unsigned int opno2,
8131                       const class expand_operand *op1,
8132                       const class expand_operand *op2)
8133 {
8134   /* Check requirements that are common to all types.  */
8135   if (op1->type != op2->type
8136       || op1->mode != op2->mode
8137       || (insn_data[(int) icode].operand[opno1].mode
8138           != insn_data[(int) icode].operand[opno2].mode))
8139     return false;
8140
8141   /* Check the requirements for specific types.  */
8142   switch (op1->type)
8143     {
8144     case EXPAND_OUTPUT:
8145     case EXPAND_UNDEFINED_INPUT:
8146       /* Outputs and undefined intputs must remain distinct.  */
8147       return false;
8148
8149     case EXPAND_FIXED:
8150     case EXPAND_INPUT:
8151     case EXPAND_ADDRESS:
8152     case EXPAND_INTEGER:
8153       return true;
8154
8155     case EXPAND_CONVERT_TO:
8156     case EXPAND_CONVERT_FROM:
8157       return op1->unsigned_p == op2->unsigned_p;
8158     }
8159   gcc_unreachable ();
8160 }
8161
8162 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8163    of instruction ICODE.  Return true on success, leaving the new operand
8164    values in the OPS themselves.  Emit no code on failure.  */
8165
8166 bool
8167 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8168                            unsigned int nops, class expand_operand *ops)
8169 {
8170   rtx_insn *last = get_last_insn ();
8171   rtx *orig_values = XALLOCAVEC (rtx, nops);
8172   for (unsigned int i = 0; i < nops; i++)
8173     {
8174       orig_values[i] = ops[i].value;
8175
8176       /* First try reusing the result of an earlier legitimization.
8177          This avoids duplicate rtl and ensures that tied operands
8178          remain tied.
8179
8180          This search is linear, but NOPS is bounded at compile time
8181          to a small number (current a single digit).  */
8182       unsigned int j = 0;
8183       for (; j < i; ++j)
8184         if (can_reuse_operands_p (icode, opno + j, opno + i, &ops[j], &ops[i])
8185             && rtx_equal_p (orig_values[j], orig_values[i])
8186             && ops[j].value
8187             && insn_operand_matches (icode, opno + i, ops[j].value))
8188           {
8189             ops[i].value = copy_rtx (ops[j].value);
8190             break;
8191           }
8192
8193       /* Otherwise try legitimizing the operand on its own.  */
8194       if (j == i && !maybe_legitimize_operand (icode, opno + i, &ops[i]))
8195         {
8196           delete_insns_since (last);
8197           return false;
8198         }
8199     }
8200   return true;
8201 }
8202
8203 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8204    as its operands.  Return the instruction pattern on success,
8205    and emit any necessary set-up code.  Return null and emit no
8206    code on failure.  */
8207
8208 rtx_insn *
8209 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8210                 class expand_operand *ops)
8211 {
8212   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8213   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8214     return NULL;
8215
8216   switch (nops)
8217     {
8218     case 0:
8219       return GEN_FCN (icode) ();
8220     case 1:
8221       return GEN_FCN (icode) (ops[0].value);
8222     case 2:
8223       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8224     case 3:
8225       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8226     case 4:
8227       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8228                               ops[3].value);
8229     case 5:
8230       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8231                               ops[3].value, ops[4].value);
8232     case 6:
8233       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8234                               ops[3].value, ops[4].value, ops[5].value);
8235     case 7:
8236       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8237                               ops[3].value, ops[4].value, ops[5].value,
8238                               ops[6].value);
8239     case 8:
8240       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8241                               ops[3].value, ops[4].value, ops[5].value,
8242                               ops[6].value, ops[7].value);
8243     case 9:
8244       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8245                               ops[3].value, ops[4].value, ops[5].value,
8246                               ops[6].value, ops[7].value, ops[8].value);
8247     case 10:
8248       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8249                               ops[3].value, ops[4].value, ops[5].value,
8250                               ops[6].value, ops[7].value, ops[8].value,
8251                               ops[9].value);
8252     case 11:
8253       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8254                               ops[3].value, ops[4].value, ops[5].value,
8255                               ops[6].value, ops[7].value, ops[8].value,
8256                               ops[9].value, ops[10].value);
8257     }
8258   gcc_unreachable ();
8259 }
8260
8261 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8262    as its operands.  Return true on success and emit no code on failure.  */
8263
8264 bool
8265 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8266                    class expand_operand *ops)
8267 {
8268   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
8269   if (pat)
8270     {
8271       emit_insn (pat);
8272       return true;
8273     }
8274   return false;
8275 }
8276
8277 /* Like maybe_expand_insn, but for jumps.  */
8278
8279 bool
8280 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8281                         class expand_operand *ops)
8282 {
8283   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
8284   if (pat)
8285     {
8286       emit_jump_insn (pat);
8287       return true;
8288     }
8289   return false;
8290 }
8291
8292 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8293    as its operands.  */
8294
8295 void
8296 expand_insn (enum insn_code icode, unsigned int nops,
8297              class expand_operand *ops)
8298 {
8299   if (!maybe_expand_insn (icode, nops, ops))
8300     gcc_unreachable ();
8301 }
8302
8303 /* Like expand_insn, but for jumps.  */
8304
8305 void
8306 expand_jump_insn (enum insn_code icode, unsigned int nops,
8307                   class expand_operand *ops)
8308 {
8309   if (!maybe_expand_jump_insn (icode, nops, ops))
8310     gcc_unreachable ();
8311 }