gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2017 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "memmodel.h"
  29 #include "predict.h"
  30 #include "tm_p.h"
  31 #include "expmed.h"
  32 #include "optabs.h"
  33 #include "emit-rtl.h"
  34 #include "recog.h"
  35 #include "diagnostic-core.h"
  36
  37 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  38    is properly defined.  */
  39 #include "stor-layout.h"
  40 #include "except.h"
  41 #include "dojump.h"
  42 #include "explow.h"
  43 #include "expr.h"
  44 #include "optabs-tree.h"
  45 #include "libfuncs.h"
  46
  47 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  48                                    machine_mode *);
  49 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  50 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  51
  52 /* Debug facility for use in GDB.  */
  53 void debug_optab_libfuncs (void);
  54 \f
  55 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
  56    the result of operation CODE applied to OP0 (and OP1 if it is a binary
  57    operation).
  58
  59    If the last insn does not set TARGET, don't do anything, but return 1.
  60
  61    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
  62    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
  63    try again, ensuring that TARGET is not one of the operands.  */
  64
  65 static int
  66 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
  67 {
  68   rtx_insn *last_insn;
  69   rtx set;
  70   rtx note;
  71
  72   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
  73
  74   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
  75       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
  76       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
  77       && GET_RTX_CLASS (code) != RTX_COMPARE
  78       && GET_RTX_CLASS (code) != RTX_UNARY)
  79     return 1;
  80
  81   if (GET_CODE (target) == ZERO_EXTRACT)
  82     return 1;
  83
  84   for (last_insn = insns;
  85        NEXT_INSN (last_insn) != NULL_RTX;
  86        last_insn = NEXT_INSN (last_insn))
  87     ;
  88
  89   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
  90      a value changing in the insn, so the note would be invalid for CSE.  */
  91   if (reg_overlap_mentioned_p (target, op0)
  92       || (op1 && reg_overlap_mentioned_p (target, op1)))
  93     {
  94       if (MEM_P (target)
  95           && (rtx_equal_p (target, op0)
  96               || (op1 && rtx_equal_p (target, op1))))
  97         {
  98           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
  99              over expanding it as temp = MEM op X, MEM = temp.  If the target
 100              supports MEM = MEM op X instructions, it is sometimes too hard
 101              to reconstruct that form later, especially if X is also a memory,
 102              and due to multiple occurrences of addresses the address might
 103              be forced into register unnecessarily.
 104              Note that not emitting the REG_EQUIV note might inhibit
 105              CSE in some cases.  */
 106           set = single_set (last_insn);
 107           if (set
 108               && GET_CODE (SET_SRC (set)) == code
 109               && MEM_P (SET_DEST (set))
 110               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 111                   || (op1 && rtx_equal_p (SET_DEST (set),
 112                                           XEXP (SET_SRC (set), 1)))))
 113             return 1;
 114         }
 115       return 0;
 116     }
 117
 118   set = set_for_reg_notes (last_insn);
 119   if (set == NULL_RTX)
 120     return 1;
 121
 122   if (! rtx_equal_p (SET_DEST (set), target)
 123       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 124       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 125           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 126     return 1;
 127
 128   if (GET_RTX_CLASS (code) == RTX_UNARY)
 129     switch (code)
 130       {
 131       case FFS:
 132       case CLZ:
 133       case CTZ:
 134       case CLRSB:
 135       case POPCOUNT:
 136       case PARITY:
 137       case BSWAP:
 138         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 139           {
 140             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 141             if (GET_MODE_SIZE (GET_MODE (op0))
 142                 > GET_MODE_SIZE (GET_MODE (target)))
 143               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 144                                          note, GET_MODE (op0));
 145             else
 146               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 147                                          note, GET_MODE (op0));
 148             break;
 149           }
 150         /* FALLTHRU */
 151       default:
 152         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 153         break;
 154       }
 155   else
 156     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 157
 158   set_unique_reg_note (last_insn, REG_EQUAL, note);
 159
 160   return 1;
 161 }
 162 \f
 163 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 164    for a widening operation would be.  In most cases this would be OP0, but if
 165    that's a constant it'll be VOIDmode, which isn't useful.  */
 166
 167 static machine_mode
 168 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 169 {
 170   machine_mode m0 = GET_MODE (op0);
 171   machine_mode m1 = GET_MODE (op1);
 172   machine_mode result;
 173
 174   if (m0 == VOIDmode && m1 == VOIDmode)
 175     return to_mode;
 176   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 177     result = m1;
 178   else
 179     result = m0;
 180
 181   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 182     return to_mode;
 183
 184   return result;
 185 }
 186 \f
 187 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 188    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 189    not actually do a sign-extend or zero-extend, but can leave the
 190    higher-order bits of the result rtx undefined, for example, in the case
 191    of logical operations, but not right shifts.  */
 192
 193 static rtx
 194 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 195                int unsignedp, int no_extend)
 196 {
 197   rtx result;
 198
 199   /* If we don't have to extend and this is a constant, return it.  */
 200   if (no_extend && GET_MODE (op) == VOIDmode)
 201     return op;
 202
 203   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 204      extend since it will be more efficient to do so unless the signedness of
 205      a promoted object differs from our extension.  */
 206   if (! no_extend
 207       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 208           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 209     return convert_modes (mode, oldmode, op, unsignedp);
 210
 211   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 212      SUBREG.  */
 213   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 214     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 215
 216   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 217      part to OP.  */
 218
 219   result = gen_reg_rtx (mode);
 220   emit_clobber (result);
 221   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 222   return result;
 223 }
 224 \f
 225 /* Expand vector widening operations.
 226
 227    There are two different classes of operations handled here:
 228    1) Operations whose result is wider than all the arguments to the operation.
 229       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 230       In this case OP0 and optionally OP1 would be initialized,
 231       but WIDE_OP wouldn't (not relevant for this case).
 232    2) Operations whose result is of the same size as the last argument to the
 233       operation, but wider than all the other arguments to the operation.
 234       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 235       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 236
 237    E.g, when called to expand the following operations, this is how
 238    the arguments will be initialized:
 239                                 nops    OP0     OP1     WIDE_OP
 240    widening-sum                 2       oprnd0  -       oprnd1
 241    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 242    widening-mult                2       oprnd0  oprnd1  -
 243    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 244
 245 rtx
 246 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 247                            rtx target, int unsignedp)
 248 {
 249   struct expand_operand eops[4];
 250   tree oprnd0, oprnd1, oprnd2;
 251   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 252   optab widen_pattern_optab;
 253   enum insn_code icode;
 254   int nops = TREE_CODE_LENGTH (ops->code);
 255   int op;
 256
 257   oprnd0 = ops->op0;
 258   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 259   widen_pattern_optab =
 260     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 261   if (ops->code == WIDEN_MULT_PLUS_EXPR
 262       || ops->code == WIDEN_MULT_MINUS_EXPR)
 263     icode = find_widening_optab_handler (widen_pattern_optab,
 264                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 265                                          tmode0, 0);
 266   else
 267     icode = optab_handler (widen_pattern_optab, tmode0);
 268   gcc_assert (icode != CODE_FOR_nothing);
 269
 270   if (nops >= 2)
 271     {
 272       oprnd1 = ops->op1;
 273       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 274     }
 275
 276   /* The last operand is of a wider mode than the rest of the operands.  */
 277   if (nops == 2)
 278     wmode = tmode1;
 279   else if (nops == 3)
 280     {
 281       gcc_assert (tmode1 == tmode0);
 282       gcc_assert (op1);
 283       oprnd2 = ops->op2;
 284       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 285     }
 286
 287   op = 0;
 288   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 289   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 290   if (op1)
 291     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 292   if (wide_op)
 293     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 294   expand_insn (icode, op, eops);
 295   return eops[0].value;
 296 }
 297
 298 /* Generate code to perform an operation specified by TERNARY_OPTAB
 299    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 300
 301    UNSIGNEDP is for the case where we have to widen the operands
 302    to perform the operation.  It says to use zero-extension.
 303
 304    If TARGET is nonzero, the value
 305    is generated there, if it is convenient to do so.
 306    In all cases an rtx is returned for the locus of the value;
 307    this may or may not be TARGET.  */
 308
 309 rtx
 310 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 311                    rtx op1, rtx op2, rtx target, int unsignedp)
 312 {
 313   struct expand_operand ops[4];
 314   enum insn_code icode = optab_handler (ternary_optab, mode);
 315
 316   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 317
 318   create_output_operand (&ops[0], target, mode);
 319   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 320   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 321   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 322   expand_insn (icode, 4, ops);
 323   return ops[0].value;
 324 }
 325
 326
 327 /* Like expand_binop, but return a constant rtx if the result can be
 328    calculated at compile time.  The arguments and return value are
 329    otherwise the same as for expand_binop.  */
 330
 331 rtx
 332 simplify_expand_binop (machine_mode mode, optab binoptab,
 333                        rtx op0, rtx op1, rtx target, int unsignedp,
 334                        enum optab_methods methods)
 335 {
 336   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 337     {
 338       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 339                                          mode, op0, op1);
 340       if (x)
 341         return x;
 342     }
 343
 344   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 345 }
 346
 347 /* Like simplify_expand_binop, but always put the result in TARGET.
 348    Return true if the expansion succeeded.  */
 349
 350 bool
 351 force_expand_binop (machine_mode mode, optab binoptab,
 352                     rtx op0, rtx op1, rtx target, int unsignedp,
 353                     enum optab_methods methods)
 354 {
 355   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 356                                  target, unsignedp, methods);
 357   if (x == 0)
 358     return false;
 359   if (x != target)
 360     emit_move_insn (target, x);
 361   return true;
 362 }
 363
 364 /* Create a new vector value in VMODE with all elements set to OP.  The
 365    mode of OP must be the element mode of VMODE.  If OP is a constant,
 366    then the return value will be a constant.  */
 367
 368 static rtx
 369 expand_vector_broadcast (machine_mode vmode, rtx op)
 370 {
 371   enum insn_code icode;
 372   rtvec vec;
 373   rtx ret;
 374   int i, n;
 375
 376   gcc_checking_assert (VECTOR_MODE_P (vmode));
 377
 378   n = GET_MODE_NUNITS (vmode);
 379   vec = rtvec_alloc (n);
 380   for (i = 0; i < n; ++i)
 381     RTVEC_ELT (vec, i) = op;
 382
 383   if (CONSTANT_P (op))
 384     return gen_rtx_CONST_VECTOR (vmode, vec);
 385
 386   /* ??? If the target doesn't have a vec_init, then we have no easy way
 387      of performing this operation.  Most of this sort of generic support
 388      is hidden away in the vector lowering support in gimple.  */
 389   icode = convert_optab_handler (vec_init_optab, vmode,
 390                                  GET_MODE_INNER (vmode));
 391   if (icode == CODE_FOR_nothing)
 392     return NULL;
 393
 394   ret = gen_reg_rtx (vmode);
 395   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 396
 397   return ret;
 398 }
 399
 400 /* This subroutine of expand_doubleword_shift handles the cases in which
 401    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 402    value are the same as for the parent routine, except that SUPERWORD_OP1
 403    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 404    INTO_TARGET may be null if the caller has decided to calculate it.  */
 405
 406 static bool
 407 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 408                         rtx outof_target, rtx into_target,
 409                         int unsignedp, enum optab_methods methods)
 410 {
 411   if (into_target != 0)
 412     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 413                              into_target, unsignedp, methods))
 414       return false;
 415
 416   if (outof_target != 0)
 417     {
 418       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 419          of the sign bit, otherwise we must fill it with zeros.  */
 420       if (binoptab != ashr_optab)
 421         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 422       else
 423         if (!force_expand_binop (word_mode, binoptab,
 424                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 425                                  outof_target, unsignedp, methods))
 426           return false;
 427     }
 428   return true;
 429 }
 430
 431 /* This subroutine of expand_doubleword_shift handles the cases in which
 432    the effective shift value is < BITS_PER_WORD.  The arguments and return
 433    value are the same as for the parent routine.  */
 434
 435 static bool
 436 expand_subword_shift (machine_mode op1_mode, optab binoptab,
 437                       rtx outof_input, rtx into_input, rtx op1,
 438                       rtx outof_target, rtx into_target,
 439                       int unsignedp, enum optab_methods methods,
 440                       unsigned HOST_WIDE_INT shift_mask)
 441 {
 442   optab reverse_unsigned_shift, unsigned_shift;
 443   rtx tmp, carries;
 444
 445   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 446   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 447
 448   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 449      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 450      the opposite direction to BINOPTAB.  */
 451   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 452     {
 453       carries = outof_input;
 454       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 455                                             op1_mode), op1_mode);
 456       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 457                                    0, true, methods);
 458     }
 459   else
 460     {
 461       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 462          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 463          has unknown behavior.  Do a single shift first, then shift by the
 464          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 465          are truncated to the mode size.  */
 466       carries = expand_binop (word_mode, reverse_unsigned_shift,
 467                               outof_input, const1_rtx, 0, unsignedp, methods);
 468       if (shift_mask == BITS_PER_WORD - 1)
 469         {
 470           tmp = immed_wide_int_const
 471             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 472           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 473                                        0, true, methods);
 474         }
 475       else
 476         {
 477           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 478                                                 op1_mode), op1_mode);
 479           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 480                                        0, true, methods);
 481         }
 482     }
 483   if (tmp == 0 || carries == 0)
 484     return false;
 485   carries = expand_binop (word_mode, reverse_unsigned_shift,
 486                           carries, tmp, 0, unsignedp, methods);
 487   if (carries == 0)
 488     return false;
 489
 490   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 491      so the result can go directly into INTO_TARGET if convenient.  */
 492   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 493                       into_target, unsignedp, methods);
 494   if (tmp == 0)
 495     return false;
 496
 497   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 498   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 499                            into_target, unsignedp, methods))
 500     return false;
 501
 502   /* Use a standard word_mode shift for the out-of half.  */
 503   if (outof_target != 0)
 504     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 505                              outof_target, unsignedp, methods))
 506       return false;
 507
 508   return true;
 509 }
 510
 511
 512 /* Try implementing expand_doubleword_shift using conditional moves.
 513    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 514    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 515    are the shift counts to use in the former and latter case.  All other
 516    arguments are the same as the parent routine.  */
 517
 518 static bool
 519 expand_doubleword_shift_condmove (machine_mode op1_mode, optab binoptab,
 520                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 521                                   rtx outof_input, rtx into_input,
 522                                   rtx subword_op1, rtx superword_op1,
 523                                   rtx outof_target, rtx into_target,
 524                                   int unsignedp, enum optab_methods methods,
 525                                   unsigned HOST_WIDE_INT shift_mask)
 526 {
 527   rtx outof_superword, into_superword;
 528
 529   /* Put the superword version of the output into OUTOF_SUPERWORD and
 530      INTO_SUPERWORD.  */
 531   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 532   if (outof_target != 0 && subword_op1 == superword_op1)
 533     {
 534       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 535          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 536       into_superword = outof_target;
 537       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 538                                    outof_superword, 0, unsignedp, methods))
 539         return false;
 540     }
 541   else
 542     {
 543       into_superword = gen_reg_rtx (word_mode);
 544       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 545                                    outof_superword, into_superword,
 546                                    unsignedp, methods))
 547         return false;
 548     }
 549
 550   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 551   if (!expand_subword_shift (op1_mode, binoptab,
 552                              outof_input, into_input, subword_op1,
 553                              outof_target, into_target,
 554                              unsignedp, methods, shift_mask))
 555     return false;
 556
 557   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 558      might be the current value of OUTOF_TARGET.  */
 559   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 560                               into_target, into_superword, word_mode, false))
 561     return false;
 562
 563   if (outof_target != 0)
 564     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 565                                 outof_target, outof_superword,
 566                                 word_mode, false))
 567       return false;
 568
 569   return true;
 570 }
 571
 572 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 573    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 574    input operand; the shift moves bits in the direction OUTOF_INPUT->
 575    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 576    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 577    If OP1 is constant, it will have been truncated as appropriate
 578    and is known to be nonzero.
 579
 580    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 581    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 582    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 583
 584    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 585    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 586    fill with zeros or sign bits as appropriate.
 587
 588    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 589    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 590    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 591    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 592    are undefined.
 593
 594    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
 595    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
 596    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
 597    function wants to calculate it itself.
 598
 599    Return true if the shift could be successfully synthesized.  */
 600
 601 static bool
 602 expand_doubleword_shift (machine_mode op1_mode, optab binoptab,
 603                          rtx outof_input, rtx into_input, rtx op1,
 604                          rtx outof_target, rtx into_target,
 605                          int unsignedp, enum optab_methods methods,
 606                          unsigned HOST_WIDE_INT shift_mask)
 607 {
 608   rtx superword_op1, tmp, cmp1, cmp2;
 609   enum rtx_code cmp_code;
 610
 611   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
 612      fill the result with sign or zero bits as appropriate.  If so, the value
 613      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
 614      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
 615      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
 616
 617      This isn't worthwhile for constant shifts since the optimizers will
 618      cope better with in-range shift counts.  */
 619   if (shift_mask >= BITS_PER_WORD
 620       && outof_target != 0
 621       && !CONSTANT_P (op1))
 622     {
 623       if (!expand_doubleword_shift (op1_mode, binoptab,
 624                                     outof_input, into_input, op1,
 625                                     0, into_target,
 626                                     unsignedp, methods, shift_mask))
 627         return false;
 628       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 629                                outof_target, unsignedp, methods))
 630         return false;
 631       return true;
 632     }
 633
 634   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
 635      is true when the effective shift value is less than BITS_PER_WORD.
 636      Set SUPERWORD_OP1 to the shift count that should be used to shift
 637      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
 638   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
 639   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
 640     {
 641       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
 642          is a subword shift count.  */
 643       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
 644                                     0, true, methods);
 645       cmp2 = CONST0_RTX (op1_mode);
 646       cmp_code = EQ;
 647       superword_op1 = op1;
 648     }
 649   else
 650     {
 651       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
 652       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
 653                                     0, true, methods);
 654       cmp2 = CONST0_RTX (op1_mode);
 655       cmp_code = LT;
 656       superword_op1 = cmp1;
 657     }
 658   if (cmp1 == 0)
 659     return false;
 660
 661   /* If we can compute the condition at compile time, pick the
 662      appropriate subroutine.  */
 663   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
 664   if (tmp != 0 && CONST_INT_P (tmp))
 665     {
 666       if (tmp == const0_rtx)
 667         return expand_superword_shift (binoptab, outof_input, superword_op1,
 668                                        outof_target, into_target,
 669                                        unsignedp, methods);
 670       else
 671         return expand_subword_shift (op1_mode, binoptab,
 672                                      outof_input, into_input, op1,
 673                                      outof_target, into_target,
 674                                      unsignedp, methods, shift_mask);
 675     }
 676
 677   /* Try using conditional moves to generate straight-line code.  */
 678   if (HAVE_conditional_move)
 679     {
 680       rtx_insn *start = get_last_insn ();
 681       if (expand_doubleword_shift_condmove (op1_mode, binoptab,
 682                                             cmp_code, cmp1, cmp2,
 683                                             outof_input, into_input,
 684                                             op1, superword_op1,
 685                                             outof_target, into_target,
 686                                             unsignedp, methods, shift_mask))
 687         return true;
 688       delete_insns_since (start);
 689     }
 690
 691   /* As a last resort, use branches to select the correct alternative.  */
 692   rtx_code_label *subword_label = gen_label_rtx ();
 693   rtx_code_label *done_label = gen_label_rtx ();
 694
 695   NO_DEFER_POP;
 696   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
 697                            0, 0, subword_label,
 698                            profile_probability::uninitialized ());
 699   OK_DEFER_POP;
 700
 701   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 702                                outof_target, into_target,
 703                                unsignedp, methods))
 704     return false;
 705
 706   emit_jump_insn (targetm.gen_jump (done_label));
 707   emit_barrier ();
 708   emit_label (subword_label);
 709
 710   if (!expand_subword_shift (op1_mode, binoptab,
 711                              outof_input, into_input, op1,
 712                              outof_target, into_target,
 713                              unsignedp, methods, shift_mask))
 714     return false;
 715
 716   emit_label (done_label);
 717   return true;
 718 }
 719 \f
 720 /* Subroutine of expand_binop.  Perform a double word multiplication of
 721    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
 722    as the target's word_mode.  This function return NULL_RTX if anything
 723    goes wrong, in which case it may have already emitted instructions
 724    which need to be deleted.
 725
 726    If we want to multiply two two-word values and have normal and widening
 727    multiplies of single-word values, we can do this with three smaller
 728    multiplications.
 729
 730    The multiplication proceeds as follows:
 731                                  _______________________
 732                                 [__op0_high_|__op0_low__]
 733                                  _______________________
 734         *                       [__op1_high_|__op1_low__]
 735         _______________________________________________
 736                                  _______________________
 737     (1)                         [__op0_low__*__op1_low__]
 738                      _______________________
 739     (2a)            [__op0_low__*__op1_high_]
 740                      _______________________
 741     (2b)            [__op0_high_*__op1_low__]
 742          _______________________
 743     (3) [__op0_high_*__op1_high_]
 744
 745
 746   This gives a 4-word result.  Since we are only interested in the
 747   lower 2 words, partial result (3) and the upper words of (2a) and
 748   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
 749   calculated using non-widening multiplication.
 750
 751   (1), however, needs to be calculated with an unsigned widening
 752   multiplication.  If this operation is not directly supported we
 753   try using a signed widening multiplication and adjust the result.
 754   This adjustment works as follows:
 755
 756       If both operands are positive then no adjustment is needed.
 757
 758       If the operands have different signs, for example op0_low < 0 and
 759       op1_low >= 0, the instruction treats the most significant bit of
 760       op0_low as a sign bit instead of a bit with significance
 761       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
 762       with 2**BITS_PER_WORD - op0_low, and two's complements the
 763       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
 764       the result.
 765
 766       Similarly, if both operands are negative, we need to add
 767       (op0_low + op1_low) * 2**BITS_PER_WORD.
 768
 769       We use a trick to adjust quickly.  We logically shift op0_low right
 770       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
 771       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
 772       logical shift exists, we do an arithmetic right shift and subtract
 773       the 0 or -1.  */
 774
 775 static rtx
 776 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
 777                        bool umulp, enum optab_methods methods)
 778 {
 779   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
 780   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
 781   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
 782   rtx product, adjust, product_high, temp;
 783
 784   rtx op0_high = operand_subword_force (op0, high, mode);
 785   rtx op0_low = operand_subword_force (op0, low, mode);
 786   rtx op1_high = operand_subword_force (op1, high, mode);
 787   rtx op1_low = operand_subword_force (op1, low, mode);
 788
 789   /* If we're using an unsigned multiply to directly compute the product
 790      of the low-order words of the operands and perform any required
 791      adjustments of the operands, we begin by trying two more multiplications
 792      and then computing the appropriate sum.
 793
 794      We have checked above that the required addition is provided.
 795      Full-word addition will normally always succeed, especially if
 796      it is provided at all, so we don't worry about its failure.  The
 797      multiplication may well fail, however, so we do handle that.  */
 798
 799   if (!umulp)
 800     {
 801       /* ??? This could be done with emit_store_flag where available.  */
 802       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
 803                            NULL_RTX, 1, methods);
 804       if (temp)
 805         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
 806                                  NULL_RTX, 0, OPTAB_DIRECT);
 807       else
 808         {
 809           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
 810                                NULL_RTX, 0, methods);
 811           if (!temp)
 812             return NULL_RTX;
 813           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
 814                                    NULL_RTX, 0, OPTAB_DIRECT);
 815         }
 816
 817       if (!op0_high)
 818         return NULL_RTX;
 819     }
 820
 821   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
 822                          NULL_RTX, 0, OPTAB_DIRECT);
 823   if (!adjust)
 824     return NULL_RTX;
 825
 826   /* OP0_HIGH should now be dead.  */
 827
 828   if (!umulp)
 829     {
 830       /* ??? This could be done with emit_store_flag where available.  */
 831       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
 832                            NULL_RTX, 1, methods);
 833       if (temp)
 834         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
 835                                  NULL_RTX, 0, OPTAB_DIRECT);
 836       else
 837         {
 838           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
 839                                NULL_RTX, 0, methods);
 840           if (!temp)
 841             return NULL_RTX;
 842           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
 843                                    NULL_RTX, 0, OPTAB_DIRECT);
 844         }
 845
 846       if (!op1_high)
 847         return NULL_RTX;
 848     }
 849
 850   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
 851                        NULL_RTX, 0, OPTAB_DIRECT);
 852   if (!temp)
 853     return NULL_RTX;
 854
 855   /* OP1_HIGH should now be dead.  */
 856
 857   adjust = expand_binop (word_mode, add_optab, adjust, temp,
 858                          NULL_RTX, 0, OPTAB_DIRECT);
 859
 860   if (target && !REG_P (target))
 861     target = NULL_RTX;
 862
 863   if (umulp)
 864     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
 865                             target, 1, OPTAB_DIRECT);
 866   else
 867     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
 868                             target, 1, OPTAB_DIRECT);
 869
 870   if (!product)
 871     return NULL_RTX;
 872
 873   product_high = operand_subword (product, high, 1, mode);
 874   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
 875                          NULL_RTX, 0, OPTAB_DIRECT);
 876   emit_move_insn (product_high, adjust);
 877   return product;
 878 }
 879 \f
 880 /* Wrapper around expand_binop which takes an rtx code to specify
 881    the operation to perform, not an optab pointer.  All other
 882    arguments are the same.  */
 883 rtx
 884 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
 885                      rtx op1, rtx target, int unsignedp,
 886                      enum optab_methods methods)
 887 {
 888   optab binop = code_to_optab (code);
 889   gcc_assert (binop);
 890
 891   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
 892 }
 893
 894 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
 895    binop.  Order them according to commutative_operand_precedence and, if
 896    possible, try to put TARGET or a pseudo first.  */
 897 static bool
 898 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
 899 {
 900   int op0_prec = commutative_operand_precedence (op0);
 901   int op1_prec = commutative_operand_precedence (op1);
 902
 903   if (op0_prec < op1_prec)
 904     return true;
 905
 906   if (op0_prec > op1_prec)
 907     return false;
 908
 909   /* With equal precedence, both orders are ok, but it is better if the
 910      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
 911   if (target == 0 || REG_P (target))
 912     return (REG_P (op1) && !REG_P (op0)) || target == op1;
 913   else
 914     return rtx_equal_p (op1, target);
 915 }
 916
 917 /* Return true if BINOPTAB implements a shift operation.  */
 918
 919 static bool
 920 shift_optab_p (optab binoptab)
 921 {
 922   switch (optab_to_code (binoptab))
 923     {
 924     case ASHIFT:
 925     case SS_ASHIFT:
 926     case US_ASHIFT:
 927     case ASHIFTRT:
 928     case LSHIFTRT:
 929     case ROTATE:
 930     case ROTATERT:
 931       return true;
 932
 933     default:
 934       return false;
 935     }
 936 }
 937
 938 /* Return true if BINOPTAB implements a commutative binary operation.  */
 939
 940 static bool
 941 commutative_optab_p (optab binoptab)
 942 {
 943   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
 944           || binoptab == smul_widen_optab
 945           || binoptab == umul_widen_optab
 946           || binoptab == smul_highpart_optab
 947           || binoptab == umul_highpart_optab);
 948 }
 949
 950 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
 951    optimizing, and if the operand is a constant that costs more than
 952    1 instruction, force the constant into a register and return that
 953    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
 954
 955 static rtx
 956 avoid_expensive_constant (machine_mode mode, optab binoptab,
 957                           int opn, rtx x, bool unsignedp)
 958 {
 959   bool speed = optimize_insn_for_speed_p ();
 960
 961   if (mode != VOIDmode
 962       && optimize
 963       && CONSTANT_P (x)
 964       && (rtx_cost (x, mode, optab_to_code (binoptab), opn, speed)
 965           > set_src_cost (x, mode, speed)))
 966     {
 967       if (CONST_INT_P (x))
 968         {
 969           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
 970           if (intval != INTVAL (x))
 971             x = GEN_INT (intval);
 972         }
 973       else
 974         x = convert_modes (mode, VOIDmode, x, unsignedp);
 975       x = force_reg (mode, x);
 976     }
 977   return x;
 978 }
 979
 980 /* Helper function for expand_binop: handle the case where there
 981    is an insn that directly implements the indicated operation.
 982    Returns null if this is not possible.  */
 983 static rtx
 984 expand_binop_directly (machine_mode mode, optab binoptab,
 985                        rtx op0, rtx op1,
 986                        rtx target, int unsignedp, enum optab_methods methods,
 987                        rtx_insn *last)
 988 {
 989   machine_mode from_mode = widened_mode (mode, op0, op1);
 990   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
 991                                                       from_mode, 1);
 992   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
 993   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
 994   machine_mode mode0, mode1, tmp_mode;
 995   struct expand_operand ops[3];
 996   bool commutative_p;
 997   rtx_insn *pat;
 998   rtx xop0 = op0, xop1 = op1;
 999   bool canonicalize_op1 = false;
1000
1001   /* If it is a commutative operator and the modes would match
1002      if we would swap the operands, we can save the conversions.  */
1003   commutative_p = commutative_optab_p (binoptab);
1004   if (commutative_p
1005       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1006       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1007     std::swap (xop0, xop1);
1008
1009   /* If we are optimizing, force expensive constants into a register.  */
1010   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1011   if (!shift_optab_p (binoptab))
1012     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1013   else
1014     /* Shifts and rotates often use a different mode for op1 from op0;
1015        for VOIDmode constants we don't know the mode, so force it
1016        to be canonicalized using convert_modes.  */
1017     canonicalize_op1 = true;
1018
1019   /* In case the insn wants input operands in modes different from
1020      those of the actual operands, convert the operands.  It would
1021      seem that we don't need to convert CONST_INTs, but we do, so
1022      that they're properly zero-extended, sign-extended or truncated
1023      for their mode.  */
1024
1025   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1026   if (xmode0 != VOIDmode && xmode0 != mode0)
1027     {
1028       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1029       mode0 = xmode0;
1030     }
1031
1032   mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
1033            ? GET_MODE (xop1) : mode);
1034   if (xmode1 != VOIDmode && xmode1 != mode1)
1035     {
1036       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1037       mode1 = xmode1;
1038     }
1039
1040   /* If operation is commutative,
1041      try to make the first operand a register.
1042      Even better, try to make it the same as the target.
1043      Also try to make the last operand a constant.  */
1044   if (commutative_p
1045       && swap_commutative_operands_with_target (target, xop0, xop1))
1046     std::swap (xop0, xop1);
1047
1048   /* Now, if insn's predicates don't allow our operands, put them into
1049      pseudo regs.  */
1050
1051   if (binoptab == vec_pack_trunc_optab
1052       || binoptab == vec_pack_usat_optab
1053       || binoptab == vec_pack_ssat_optab
1054       || binoptab == vec_pack_ufix_trunc_optab
1055       || binoptab == vec_pack_sfix_trunc_optab)
1056     {
1057       /* The mode of the result is different then the mode of the
1058          arguments.  */
1059       tmp_mode = insn_data[(int) icode].operand[0].mode;
1060       if (VECTOR_MODE_P (mode)
1061           && GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1062         {
1063           delete_insns_since (last);
1064           return NULL_RTX;
1065         }
1066     }
1067   else
1068     tmp_mode = mode;
1069
1070   create_output_operand (&ops[0], target, tmp_mode);
1071   create_input_operand (&ops[1], xop0, mode0);
1072   create_input_operand (&ops[2], xop1, mode1);
1073   pat = maybe_gen_insn (icode, 3, ops);
1074   if (pat)
1075     {
1076       /* If PAT is composed of more than one insn, try to add an appropriate
1077          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1078          operand, call expand_binop again, this time without a target.  */
1079       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1080           && ! add_equal_note (pat, ops[0].value,
1081                                optab_to_code (binoptab),
1082                                ops[1].value, ops[2].value))
1083         {
1084           delete_insns_since (last);
1085           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1086                                unsignedp, methods);
1087         }
1088
1089       emit_insn (pat);
1090       return ops[0].value;
1091     }
1092   delete_insns_since (last);
1093   return NULL_RTX;
1094 }
1095
1096 /* Generate code to perform an operation specified by BINOPTAB
1097    on operands OP0 and OP1, with result having machine-mode MODE.
1098
1099    UNSIGNEDP is for the case where we have to widen the operands
1100    to perform the operation.  It says to use zero-extension.
1101
1102    If TARGET is nonzero, the value
1103    is generated there, if it is convenient to do so.
1104    In all cases an rtx is returned for the locus of the value;
1105    this may or may not be TARGET.  */
1106
1107 rtx
1108 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1109               rtx target, int unsignedp, enum optab_methods methods)
1110 {
1111   enum optab_methods next_methods
1112     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1113        ? OPTAB_WIDEN : methods);
1114   enum mode_class mclass;
1115   machine_mode wider_mode;
1116   rtx libfunc;
1117   rtx temp;
1118   rtx_insn *entry_last = get_last_insn ();
1119   rtx_insn *last;
1120
1121   mclass = GET_MODE_CLASS (mode);
1122
1123   /* If subtracting an integer constant, convert this into an addition of
1124      the negated constant.  */
1125
1126   if (binoptab == sub_optab && CONST_INT_P (op1))
1127     {
1128       op1 = negate_rtx (mode, op1);
1129       binoptab = add_optab;
1130     }
1131   /* For shifts, constant invalid op1 might be expanded from different
1132      mode than MODE.  As those are invalid, force them to a register
1133      to avoid further problems during expansion.  */
1134   else if (CONST_INT_P (op1)
1135            && shift_optab_p (binoptab)
1136            && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
1137     {
1138       op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
1139       op1 = force_reg (GET_MODE_INNER (mode), op1);
1140     }
1141
1142   /* Record where to delete back to if we backtrack.  */
1143   last = get_last_insn ();
1144
1145   /* If we can do it with a three-operand insn, do so.  */
1146
1147   if (methods != OPTAB_MUST_WIDEN
1148       && find_widening_optab_handler (binoptab, mode,
1149                                       widened_mode (mode, op0, op1), 1)
1150             != CODE_FOR_nothing)
1151     {
1152       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1153                                     unsignedp, methods, last);
1154       if (temp)
1155         return temp;
1156     }
1157
1158   /* If we were trying to rotate, and that didn't work, try rotating
1159      the other direction before falling back to shifts and bitwise-or.  */
1160   if (((binoptab == rotl_optab
1161         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1162        || (binoptab == rotr_optab
1163            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1164       && mclass == MODE_INT)
1165     {
1166       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1167       rtx newop1;
1168       unsigned int bits = GET_MODE_PRECISION (mode);
1169
1170       if (CONST_INT_P (op1))
1171         newop1 = GEN_INT (bits - INTVAL (op1));
1172       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1173         newop1 = negate_rtx (GET_MODE (op1), op1);
1174       else
1175         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1176                                gen_int_mode (bits, GET_MODE (op1)), op1,
1177                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1178
1179       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1180                                     target, unsignedp, methods, last);
1181       if (temp)
1182         return temp;
1183     }
1184
1185   /* If this is a multiply, see if we can do a widening operation that
1186      takes operands of this mode and makes a wider mode.  */
1187
1188   if (binoptab == smul_optab
1189       && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
1190       && (convert_optab_handler ((unsignedp
1191                                   ? umul_widen_optab
1192                                   : smul_widen_optab),
1193                                  wider_mode, mode) != CODE_FOR_nothing))
1194     {
1195       temp = expand_binop (wider_mode,
1196                            unsignedp ? umul_widen_optab : smul_widen_optab,
1197                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1198
1199       if (temp != 0)
1200         {
1201           if (GET_MODE_CLASS (mode) == MODE_INT
1202               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1203             return gen_lowpart (mode, temp);
1204           else
1205             return convert_to_mode (mode, temp, unsignedp);
1206         }
1207     }
1208
1209   /* If this is a vector shift by a scalar, see if we can do a vector
1210      shift by a vector.  If so, broadcast the scalar into a vector.  */
1211   if (mclass == MODE_VECTOR_INT)
1212     {
1213       optab otheroptab = unknown_optab;
1214
1215       if (binoptab == ashl_optab)
1216         otheroptab = vashl_optab;
1217       else if (binoptab == ashr_optab)
1218         otheroptab = vashr_optab;
1219       else if (binoptab == lshr_optab)
1220         otheroptab = vlshr_optab;
1221       else if (binoptab == rotl_optab)
1222         otheroptab = vrotl_optab;
1223       else if (binoptab == rotr_optab)
1224         otheroptab = vrotr_optab;
1225
1226       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1227         {
1228           /* The scalar may have been extended to be too wide.  Truncate
1229              it back to the proper size to fit in the broadcast vector.  */
1230           machine_mode inner_mode = GET_MODE_INNER (mode);
1231           if (!CONST_INT_P (op1)
1232               && (GET_MODE_BITSIZE (inner_mode)
1233                   < GET_MODE_BITSIZE (GET_MODE (op1))))
1234             op1 = force_reg (inner_mode,
1235                              simplify_gen_unary (TRUNCATE, inner_mode, op1,
1236                                                  GET_MODE (op1)));
1237           rtx vop1 = expand_vector_broadcast (mode, op1);
1238           if (vop1)
1239             {
1240               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1241                                             target, unsignedp, methods, last);
1242               if (temp)
1243                 return temp;
1244             }
1245         }
1246     }
1247
1248   /* Look for a wider mode of the same class for which we think we
1249      can open-code the operation.  Check for a widening multiply at the
1250      wider mode as well.  */
1251
1252   if (CLASS_HAS_WIDER_MODES_P (mclass)
1253       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1254     FOR_EACH_WIDER_MODE (wider_mode, mode)
1255       {
1256         machine_mode next_mode;
1257         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1258             || (binoptab == smul_optab
1259                 && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
1260                 && (find_widening_optab_handler ((unsignedp
1261                                                   ? umul_widen_optab
1262                                                   : smul_widen_optab),
1263                                                  next_mode, mode, 0)
1264                     != CODE_FOR_nothing)))
1265           {
1266             rtx xop0 = op0, xop1 = op1;
1267             int no_extend = 0;
1268
1269             /* For certain integer operations, we need not actually extend
1270                the narrow operands, as long as we will truncate
1271                the results to the same narrowness.  */
1272
1273             if ((binoptab == ior_optab || binoptab == and_optab
1274                  || binoptab == xor_optab
1275                  || binoptab == add_optab || binoptab == sub_optab
1276                  || binoptab == smul_optab || binoptab == ashl_optab)
1277                 && mclass == MODE_INT)
1278               {
1279                 no_extend = 1;
1280                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1281                                                  xop0, unsignedp);
1282                 if (binoptab != ashl_optab)
1283                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1284                                                    xop1, unsignedp);
1285               }
1286
1287             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1288
1289             /* The second operand of a shift must always be extended.  */
1290             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1291                                   no_extend && binoptab != ashl_optab);
1292
1293             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1294                                  unsignedp, OPTAB_DIRECT);
1295             if (temp)
1296               {
1297                 if (mclass != MODE_INT
1298                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1299                   {
1300                     if (target == 0)
1301                       target = gen_reg_rtx (mode);
1302                     convert_move (target, temp, 0);
1303                     return target;
1304                   }
1305                 else
1306                   return gen_lowpart (mode, temp);
1307               }
1308             else
1309               delete_insns_since (last);
1310           }
1311       }
1312
1313   /* If operation is commutative,
1314      try to make the first operand a register.
1315      Even better, try to make it the same as the target.
1316      Also try to make the last operand a constant.  */
1317   if (commutative_optab_p (binoptab)
1318       && swap_commutative_operands_with_target (target, op0, op1))
1319     std::swap (op0, op1);
1320
1321   /* These can be done a word at a time.  */
1322   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1323       && mclass == MODE_INT
1324       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1325       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1326     {
1327       int i;
1328       rtx_insn *insns;
1329
1330       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1331          won't be accurate, so use a new target.  */
1332       if (target == 0
1333           || target == op0
1334           || target == op1
1335           || !valid_multiword_target_p (target))
1336         target = gen_reg_rtx (mode);
1337
1338       start_sequence ();
1339
1340       /* Do the actual arithmetic.  */
1341       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1342         {
1343           rtx target_piece = operand_subword (target, i, 1, mode);
1344           rtx x = expand_binop (word_mode, binoptab,
1345                                 operand_subword_force (op0, i, mode),
1346                                 operand_subword_force (op1, i, mode),
1347                                 target_piece, unsignedp, next_methods);
1348
1349           if (x == 0)
1350             break;
1351
1352           if (target_piece != x)
1353             emit_move_insn (target_piece, x);
1354         }
1355
1356       insns = get_insns ();
1357       end_sequence ();
1358
1359       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1360         {
1361           emit_insn (insns);
1362           return target;
1363         }
1364     }
1365
1366   /* Synthesize double word shifts from single word shifts.  */
1367   if ((binoptab == lshr_optab || binoptab == ashl_optab
1368        || binoptab == ashr_optab)
1369       && mclass == MODE_INT
1370       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1371       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1372       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1373       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1374       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1375       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1376     {
1377       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1378       machine_mode op1_mode;
1379
1380       double_shift_mask = targetm.shift_truncation_mask (mode);
1381       shift_mask = targetm.shift_truncation_mask (word_mode);
1382       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1383
1384       /* Apply the truncation to constant shifts.  */
1385       if (double_shift_mask > 0 && CONST_INT_P (op1))
1386         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1387
1388       if (op1 == CONST0_RTX (op1_mode))
1389         return op0;
1390
1391       /* Make sure that this is a combination that expand_doubleword_shift
1392          can handle.  See the comments there for details.  */
1393       if (double_shift_mask == 0
1394           || (shift_mask == BITS_PER_WORD - 1
1395               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1396         {
1397           rtx_insn *insns;
1398           rtx into_target, outof_target;
1399           rtx into_input, outof_input;
1400           int left_shift, outof_word;
1401
1402           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1403              won't be accurate, so use a new target.  */
1404           if (target == 0
1405               || target == op0
1406               || target == op1
1407               || !valid_multiword_target_p (target))
1408             target = gen_reg_rtx (mode);
1409
1410           start_sequence ();
1411
1412           /* OUTOF_* is the word we are shifting bits away from, and
1413              INTO_* is the word that we are shifting bits towards, thus
1414              they differ depending on the direction of the shift and
1415              WORDS_BIG_ENDIAN.  */
1416
1417           left_shift = binoptab == ashl_optab;
1418           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1419
1420           outof_target = operand_subword (target, outof_word, 1, mode);
1421           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1422
1423           outof_input = operand_subword_force (op0, outof_word, mode);
1424           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1425
1426           if (expand_doubleword_shift (op1_mode, binoptab,
1427                                        outof_input, into_input, op1,
1428                                        outof_target, into_target,
1429                                        unsignedp, next_methods, shift_mask))
1430             {
1431               insns = get_insns ();
1432               end_sequence ();
1433
1434               emit_insn (insns);
1435               return target;
1436             }
1437           end_sequence ();
1438         }
1439     }
1440
1441   /* Synthesize double word rotates from single word shifts.  */
1442   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1443       && mclass == MODE_INT
1444       && CONST_INT_P (op1)
1445       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1446       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1447       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1448     {
1449       rtx_insn *insns;
1450       rtx into_target, outof_target;
1451       rtx into_input, outof_input;
1452       rtx inter;
1453       int shift_count, left_shift, outof_word;
1454
1455       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1456          won't be accurate, so use a new target. Do this also if target is not
1457          a REG, first because having a register instead may open optimization
1458          opportunities, and second because if target and op0 happen to be MEMs
1459          designating the same location, we would risk clobbering it too early
1460          in the code sequence we generate below.  */
1461       if (target == 0
1462           || target == op0
1463           || target == op1
1464           || !REG_P (target)
1465           || !valid_multiword_target_p (target))
1466         target = gen_reg_rtx (mode);
1467
1468       start_sequence ();
1469
1470       shift_count = INTVAL (op1);
1471
1472       /* OUTOF_* is the word we are shifting bits away from, and
1473          INTO_* is the word that we are shifting bits towards, thus
1474          they differ depending on the direction of the shift and
1475          WORDS_BIG_ENDIAN.  */
1476
1477       left_shift = (binoptab == rotl_optab);
1478       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1479
1480       outof_target = operand_subword (target, outof_word, 1, mode);
1481       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1482
1483       outof_input = operand_subword_force (op0, outof_word, mode);
1484       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1485
1486       if (shift_count == BITS_PER_WORD)
1487         {
1488           /* This is just a word swap.  */
1489           emit_move_insn (outof_target, into_input);
1490           emit_move_insn (into_target, outof_input);
1491           inter = const0_rtx;
1492         }
1493       else
1494         {
1495           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1496           rtx first_shift_count, second_shift_count;
1497           optab reverse_unsigned_shift, unsigned_shift;
1498
1499           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1500                                     ? lshr_optab : ashl_optab);
1501
1502           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1503                             ? ashl_optab : lshr_optab);
1504
1505           if (shift_count > BITS_PER_WORD)
1506             {
1507               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1508               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1509             }
1510           else
1511             {
1512               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1513               second_shift_count = GEN_INT (shift_count);
1514             }
1515
1516           into_temp1 = expand_binop (word_mode, unsigned_shift,
1517                                      outof_input, first_shift_count,
1518                                      NULL_RTX, unsignedp, next_methods);
1519           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1520                                      into_input, second_shift_count,
1521                                      NULL_RTX, unsignedp, next_methods);
1522
1523           if (into_temp1 != 0 && into_temp2 != 0)
1524             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1525                                   into_target, unsignedp, next_methods);
1526           else
1527             inter = 0;
1528
1529           if (inter != 0 && inter != into_target)
1530             emit_move_insn (into_target, inter);
1531
1532           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1533                                       into_input, first_shift_count,
1534                                       NULL_RTX, unsignedp, next_methods);
1535           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1536                                       outof_input, second_shift_count,
1537                                       NULL_RTX, unsignedp, next_methods);
1538
1539           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1540             inter = expand_binop (word_mode, ior_optab,
1541                                   outof_temp1, outof_temp2,
1542                                   outof_target, unsignedp, next_methods);
1543
1544           if (inter != 0 && inter != outof_target)
1545             emit_move_insn (outof_target, inter);
1546         }
1547
1548       insns = get_insns ();
1549       end_sequence ();
1550
1551       if (inter != 0)
1552         {
1553           emit_insn (insns);
1554           return target;
1555         }
1556     }
1557
1558   /* These can be done a word at a time by propagating carries.  */
1559   if ((binoptab == add_optab || binoptab == sub_optab)
1560       && mclass == MODE_INT
1561       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1562       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1563     {
1564       unsigned int i;
1565       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1566       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1567       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1568       rtx xop0, xop1, xtarget;
1569
1570       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1571          value is one of those, use it.  Otherwise, use 1 since it is the
1572          one easiest to get.  */
1573 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1574       int normalizep = STORE_FLAG_VALUE;
1575 #else
1576       int normalizep = 1;
1577 #endif
1578
1579       /* Prepare the operands.  */
1580       xop0 = force_reg (mode, op0);
1581       xop1 = force_reg (mode, op1);
1582
1583       xtarget = gen_reg_rtx (mode);
1584
1585       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1586         target = xtarget;
1587
1588       /* Indicate for flow that the entire target reg is being set.  */
1589       if (REG_P (target))
1590         emit_clobber (xtarget);
1591
1592       /* Do the actual arithmetic.  */
1593       for (i = 0; i < nwords; i++)
1594         {
1595           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1596           rtx target_piece = operand_subword (xtarget, index, 1, mode);
1597           rtx op0_piece = operand_subword_force (xop0, index, mode);
1598           rtx op1_piece = operand_subword_force (xop1, index, mode);
1599           rtx x;
1600
1601           /* Main add/subtract of the input operands.  */
1602           x = expand_binop (word_mode, binoptab,
1603                             op0_piece, op1_piece,
1604                             target_piece, unsignedp, next_methods);
1605           if (x == 0)
1606             break;
1607
1608           if (i + 1 < nwords)
1609             {
1610               /* Store carry from main add/subtract.  */
1611               carry_out = gen_reg_rtx (word_mode);
1612               carry_out = emit_store_flag_force (carry_out,
1613                                                  (binoptab == add_optab
1614                                                   ? LT : GT),
1615                                                  x, op0_piece,
1616                                                  word_mode, 1, normalizep);
1617             }
1618
1619           if (i > 0)
1620             {
1621               rtx newx;
1622
1623               /* Add/subtract previous carry to main result.  */
1624               newx = expand_binop (word_mode,
1625                                    normalizep == 1 ? binoptab : otheroptab,
1626                                    x, carry_in,
1627                                    NULL_RTX, 1, next_methods);
1628
1629               if (i + 1 < nwords)
1630                 {
1631                   /* Get out carry from adding/subtracting carry in.  */
1632                   rtx carry_tmp = gen_reg_rtx (word_mode);
1633                   carry_tmp = emit_store_flag_force (carry_tmp,
1634                                                      (binoptab == add_optab
1635                                                       ? LT : GT),
1636                                                      newx, x,
1637                                                      word_mode, 1, normalizep);
1638
1639                   /* Logical-ior the two poss. carry together.  */
1640                   carry_out = expand_binop (word_mode, ior_optab,
1641                                             carry_out, carry_tmp,
1642                                             carry_out, 0, next_methods);
1643                   if (carry_out == 0)
1644                     break;
1645                 }
1646               emit_move_insn (target_piece, newx);
1647             }
1648           else
1649             {
1650               if (x != target_piece)
1651                 emit_move_insn (target_piece, x);
1652             }
1653
1654           carry_in = carry_out;
1655         }
1656
1657       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
1658         {
1659           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
1660               || ! rtx_equal_p (target, xtarget))
1661             {
1662               rtx_insn *temp = emit_move_insn (target, xtarget);
1663
1664               set_dst_reg_note (temp, REG_EQUAL,
1665                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
1666                                                 mode, copy_rtx (xop0),
1667                                                 copy_rtx (xop1)),
1668                                 target);
1669             }
1670           else
1671             target = xtarget;
1672
1673           return target;
1674         }
1675
1676       else
1677         delete_insns_since (last);
1678     }
1679
1680   /* Attempt to synthesize double word multiplies using a sequence of word
1681      mode multiplications.  We first attempt to generate a sequence using a
1682      more efficient unsigned widening multiply, and if that fails we then
1683      try using a signed widening multiply.  */
1684
1685   if (binoptab == smul_optab
1686       && mclass == MODE_INT
1687       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1688       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1689       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1690     {
1691       rtx product = NULL_RTX;
1692       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
1693             != CODE_FOR_nothing)
1694         {
1695           product = expand_doubleword_mult (mode, op0, op1, target,
1696                                             true, methods);
1697           if (!product)
1698             delete_insns_since (last);
1699         }
1700
1701       if (product == NULL_RTX
1702           && widening_optab_handler (smul_widen_optab, mode, word_mode)
1703                 != CODE_FOR_nothing)
1704         {
1705           product = expand_doubleword_mult (mode, op0, op1, target,
1706                                             false, methods);
1707           if (!product)
1708             delete_insns_since (last);
1709         }
1710
1711       if (product != NULL_RTX)
1712         {
1713           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
1714             {
1715               rtx_insn *move = emit_move_insn (target ? target : product,
1716                                                product);
1717               set_dst_reg_note (move,
1718                                 REG_EQUAL,
1719                                 gen_rtx_fmt_ee (MULT, mode,
1720                                                 copy_rtx (op0),
1721                                                 copy_rtx (op1)),
1722                                 target ? target : product);
1723             }
1724           return product;
1725         }
1726     }
1727
1728   /* It can't be open-coded in this mode.
1729      Use a library call if one is available and caller says that's ok.  */
1730
1731   libfunc = optab_libfunc (binoptab, mode);
1732   if (libfunc
1733       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1734     {
1735       rtx_insn *insns;
1736       rtx op1x = op1;
1737       machine_mode op1_mode = mode;
1738       rtx value;
1739
1740       start_sequence ();
1741
1742       if (shift_optab_p (binoptab))
1743         {
1744           op1_mode = targetm.libgcc_shift_count_mode ();
1745           /* Specify unsigned here,
1746              since negative shift counts are meaningless.  */
1747           op1x = convert_to_mode (op1_mode, op1, 1);
1748         }
1749
1750       if (GET_MODE (op0) != VOIDmode
1751           && GET_MODE (op0) != mode)
1752         op0 = convert_to_mode (mode, op0, unsignedp);
1753
1754       /* Pass 1 for NO_QUEUE so we don't lose any increments
1755          if the libcall is cse'd or moved.  */
1756       value = emit_library_call_value (libfunc,
1757                                        NULL_RTX, LCT_CONST, mode, 2,
1758                                        op0, mode, op1x, op1_mode);
1759
1760       insns = get_insns ();
1761       end_sequence ();
1762
1763       bool trapv = trapv_binoptab_p (binoptab);
1764       target = gen_reg_rtx (mode);
1765       emit_libcall_block_1 (insns, target, value,
1766                             trapv ? NULL_RTX
1767                             : gen_rtx_fmt_ee (optab_to_code (binoptab),
1768                                               mode, op0, op1), trapv);
1769
1770       return target;
1771     }
1772
1773   delete_insns_since (last);
1774
1775   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1776
1777   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1778          || methods == OPTAB_MUST_WIDEN))
1779     {
1780       /* Caller says, don't even try.  */
1781       delete_insns_since (entry_last);
1782       return 0;
1783     }
1784
1785   /* Compute the value of METHODS to pass to recursive calls.
1786      Don't allow widening to be tried recursively.  */
1787
1788   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1789
1790   /* Look for a wider mode of the same class for which it appears we can do
1791      the operation.  */
1792
1793   if (CLASS_HAS_WIDER_MODES_P (mclass))
1794     {
1795       FOR_EACH_WIDER_MODE (wider_mode, mode)
1796         {
1797           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
1798                   != CODE_FOR_nothing
1799               || (methods == OPTAB_LIB
1800                   && optab_libfunc (binoptab, wider_mode)))
1801             {
1802               rtx xop0 = op0, xop1 = op1;
1803               int no_extend = 0;
1804
1805               /* For certain integer operations, we need not actually extend
1806                  the narrow operands, as long as we will truncate
1807                  the results to the same narrowness.  */
1808
1809               if ((binoptab == ior_optab || binoptab == and_optab
1810                    || binoptab == xor_optab
1811                    || binoptab == add_optab || binoptab == sub_optab
1812                    || binoptab == smul_optab || binoptab == ashl_optab)
1813                   && mclass == MODE_INT)
1814                 no_extend = 1;
1815
1816               xop0 = widen_operand (xop0, wider_mode, mode,
1817                                     unsignedp, no_extend);
1818
1819               /* The second operand of a shift must always be extended.  */
1820               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1821                                     no_extend && binoptab != ashl_optab);
1822
1823               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1824                                    unsignedp, methods);
1825               if (temp)
1826                 {
1827                   if (mclass != MODE_INT
1828                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1829                     {
1830                       if (target == 0)
1831                         target = gen_reg_rtx (mode);
1832                       convert_move (target, temp, 0);
1833                       return target;
1834                     }
1835                   else
1836                     return gen_lowpart (mode, temp);
1837                 }
1838               else
1839                 delete_insns_since (last);
1840             }
1841         }
1842     }
1843
1844   delete_insns_since (entry_last);
1845   return 0;
1846 }
1847 \f
1848 /* Expand a binary operator which has both signed and unsigned forms.
1849    UOPTAB is the optab for unsigned operations, and SOPTAB is for
1850    signed operations.
1851
1852    If we widen unsigned operands, we may use a signed wider operation instead
1853    of an unsigned wider operation, since the result would be the same.  */
1854
1855 rtx
1856 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1857                    rtx op0, rtx op1, rtx target, int unsignedp,
1858                    enum optab_methods methods)
1859 {
1860   rtx temp;
1861   optab direct_optab = unsignedp ? uoptab : soptab;
1862   bool save_enable;
1863
1864   /* Do it without widening, if possible.  */
1865   temp = expand_binop (mode, direct_optab, op0, op1, target,
1866                        unsignedp, OPTAB_DIRECT);
1867   if (temp || methods == OPTAB_DIRECT)
1868     return temp;
1869
1870   /* Try widening to a signed int.  Disable any direct use of any
1871      signed insn in the current mode.  */
1872   save_enable = swap_optab_enable (soptab, mode, false);
1873
1874   temp = expand_binop (mode, soptab, op0, op1, target,
1875                        unsignedp, OPTAB_WIDEN);
1876
1877   /* For unsigned operands, try widening to an unsigned int.  */
1878   if (!temp && unsignedp)
1879     temp = expand_binop (mode, uoptab, op0, op1, target,
1880                          unsignedp, OPTAB_WIDEN);
1881   if (temp || methods == OPTAB_WIDEN)
1882     goto egress;
1883
1884   /* Use the right width libcall if that exists.  */
1885   temp = expand_binop (mode, direct_optab, op0, op1, target,
1886                        unsignedp, OPTAB_LIB);
1887   if (temp || methods == OPTAB_LIB)
1888     goto egress;
1889
1890   /* Must widen and use a libcall, use either signed or unsigned.  */
1891   temp = expand_binop (mode, soptab, op0, op1, target,
1892                        unsignedp, methods);
1893   if (!temp && unsignedp)
1894     temp = expand_binop (mode, uoptab, op0, op1, target,
1895                          unsignedp, methods);
1896
1897  egress:
1898   /* Undo the fiddling above.  */
1899   if (save_enable)
1900     swap_optab_enable (soptab, mode, true);
1901   return temp;
1902 }
1903 \f
1904 /* Generate code to perform an operation specified by UNOPPTAB
1905    on operand OP0, with two results to TARG0 and TARG1.
1906    We assume that the order of the operands for the instruction
1907    is TARG0, TARG1, OP0.
1908
1909    Either TARG0 or TARG1 may be zero, but what that means is that
1910    the result is not actually wanted.  We will generate it into
1911    a dummy pseudo-reg and discard it.  They may not both be zero.
1912
1913    Returns 1 if this operation can be performed; 0 if not.  */
1914
1915 int
1916 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1917                     int unsignedp)
1918 {
1919   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1920   enum mode_class mclass;
1921   machine_mode wider_mode;
1922   rtx_insn *entry_last = get_last_insn ();
1923   rtx_insn *last;
1924
1925   mclass = GET_MODE_CLASS (mode);
1926
1927   if (!targ0)
1928     targ0 = gen_reg_rtx (mode);
1929   if (!targ1)
1930     targ1 = gen_reg_rtx (mode);
1931
1932   /* Record where to go back to if we fail.  */
1933   last = get_last_insn ();
1934
1935   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1936     {
1937       struct expand_operand ops[3];
1938       enum insn_code icode = optab_handler (unoptab, mode);
1939
1940       create_fixed_operand (&ops[0], targ0);
1941       create_fixed_operand (&ops[1], targ1);
1942       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1943       if (maybe_expand_insn (icode, 3, ops))
1944         return 1;
1945     }
1946
1947   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1948
1949   if (CLASS_HAS_WIDER_MODES_P (mclass))
1950     {
1951       FOR_EACH_WIDER_MODE (wider_mode, mode)
1952         {
1953           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
1954             {
1955               rtx t0 = gen_reg_rtx (wider_mode);
1956               rtx t1 = gen_reg_rtx (wider_mode);
1957               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
1958
1959               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
1960                 {
1961                   convert_move (targ0, t0, unsignedp);
1962                   convert_move (targ1, t1, unsignedp);
1963                   return 1;
1964                 }
1965               else
1966                 delete_insns_since (last);
1967             }
1968         }
1969     }
1970
1971   delete_insns_since (entry_last);
1972   return 0;
1973 }
1974 \f
1975 /* Generate code to perform an operation specified by BINOPTAB
1976    on operands OP0 and OP1, with two results to TARG1 and TARG2.
1977    We assume that the order of the operands for the instruction
1978    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
1979    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
1980
1981    Either TARG0 or TARG1 may be zero, but what that means is that
1982    the result is not actually wanted.  We will generate it into
1983    a dummy pseudo-reg and discard it.  They may not both be zero.
1984
1985    Returns 1 if this operation can be performed; 0 if not.  */
1986
1987 int
1988 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
1989                      int unsignedp)
1990 {
1991   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1992   enum mode_class mclass;
1993   machine_mode wider_mode;
1994   rtx_insn *entry_last = get_last_insn ();
1995   rtx_insn *last;
1996
1997   mclass = GET_MODE_CLASS (mode);
1998
1999   if (!targ0)
2000     targ0 = gen_reg_rtx (mode);
2001   if (!targ1)
2002     targ1 = gen_reg_rtx (mode);
2003
2004   /* Record where to go back to if we fail.  */
2005   last = get_last_insn ();
2006
2007   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2008     {
2009       struct expand_operand ops[4];
2010       enum insn_code icode = optab_handler (binoptab, mode);
2011       machine_mode mode0 = insn_data[icode].operand[1].mode;
2012       machine_mode mode1 = insn_data[icode].operand[2].mode;
2013       rtx xop0 = op0, xop1 = op1;
2014
2015       /* If we are optimizing, force expensive constants into a register.  */
2016       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2017       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2018
2019       create_fixed_operand (&ops[0], targ0);
2020       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2021       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2022       create_fixed_operand (&ops[3], targ1);
2023       if (maybe_expand_insn (icode, 4, ops))
2024         return 1;
2025       delete_insns_since (last);
2026     }
2027
2028   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2029
2030   if (CLASS_HAS_WIDER_MODES_P (mclass))
2031     {
2032       FOR_EACH_WIDER_MODE (wider_mode, mode)
2033         {
2034           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2035             {
2036               rtx t0 = gen_reg_rtx (wider_mode);
2037               rtx t1 = gen_reg_rtx (wider_mode);
2038               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2039               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2040
2041               if (expand_twoval_binop (binoptab, cop0, cop1,
2042                                        t0, t1, unsignedp))
2043                 {
2044                   convert_move (targ0, t0, unsignedp);
2045                   convert_move (targ1, t1, unsignedp);
2046                   return 1;
2047                 }
2048               else
2049                 delete_insns_since (last);
2050             }
2051         }
2052     }
2053
2054   delete_insns_since (entry_last);
2055   return 0;
2056 }
2057
2058 /* Expand the two-valued library call indicated by BINOPTAB, but
2059    preserve only one of the values.  If TARG0 is non-NULL, the first
2060    value is placed into TARG0; otherwise the second value is placed
2061    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2062    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2063    This routine assumes that the value returned by the library call is
2064    as if the return value was of an integral mode twice as wide as the
2065    mode of OP0.  Returns 1 if the call was successful.  */
2066
2067 bool
2068 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2069                              rtx targ0, rtx targ1, enum rtx_code code)
2070 {
2071   machine_mode mode;
2072   machine_mode libval_mode;
2073   rtx libval;
2074   rtx_insn *insns;
2075   rtx libfunc;
2076
2077   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2078   gcc_assert (!targ0 != !targ1);
2079
2080   mode = GET_MODE (op0);
2081   libfunc = optab_libfunc (binoptab, mode);
2082   if (!libfunc)
2083     return false;
2084
2085   /* The value returned by the library function will have twice as
2086      many bits as the nominal MODE.  */
2087   libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2088   start_sequence ();
2089   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2090                                     libval_mode, 2,
2091                                     op0, mode,
2092                                     op1, mode);
2093   /* Get the part of VAL containing the value that we want.  */
2094   libval = simplify_gen_subreg (mode, libval, libval_mode,
2095                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2096   insns = get_insns ();
2097   end_sequence ();
2098   /* Move the into the desired location.  */
2099   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2100                       gen_rtx_fmt_ee (code, mode, op0, op1));
2101
2102   return true;
2103 }
2104
2105 \f
2106 /* Wrapper around expand_unop which takes an rtx code to specify
2107    the operation to perform, not an optab pointer.  All other
2108    arguments are the same.  */
2109 rtx
2110 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2111                     rtx target, int unsignedp)
2112 {
2113   optab unop = code_to_optab (code);
2114   gcc_assert (unop);
2115
2116   return expand_unop (mode, unop, op0, target, unsignedp);
2117 }
2118
2119 /* Try calculating
2120         (clz:narrow x)
2121    as
2122         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2123
2124    A similar operation can be used for clrsb.  UNOPTAB says which operation
2125    we are trying to expand.  */
2126 static rtx
2127 widen_leading (machine_mode mode, rtx op0, rtx target, optab unoptab)
2128 {
2129   enum mode_class mclass = GET_MODE_CLASS (mode);
2130   if (CLASS_HAS_WIDER_MODES_P (mclass))
2131     {
2132       machine_mode wider_mode;
2133       FOR_EACH_WIDER_MODE (wider_mode, mode)
2134         {
2135           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2136             {
2137               rtx xop0, temp;
2138               rtx_insn *last;
2139
2140               last = get_last_insn ();
2141
2142               if (target == 0)
2143                 target = gen_reg_rtx (mode);
2144               xop0 = widen_operand (op0, wider_mode, mode,
2145                                     unoptab != clrsb_optab, false);
2146               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2147                                   unoptab != clrsb_optab);
2148               if (temp != 0)
2149                 temp = expand_binop
2150                   (wider_mode, sub_optab, temp,
2151                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2152                                  - GET_MODE_PRECISION (mode),
2153                                  wider_mode),
2154                    target, true, OPTAB_DIRECT);
2155               if (temp == 0)
2156                 delete_insns_since (last);
2157
2158               return temp;
2159             }
2160         }
2161     }
2162   return 0;
2163 }
2164
2165 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2166    quantities, choosing which based on whether the high word is nonzero.  */
2167 static rtx
2168 expand_doubleword_clz (machine_mode mode, rtx op0, rtx target)
2169 {
2170   rtx xop0 = force_reg (mode, op0);
2171   rtx subhi = gen_highpart (word_mode, xop0);
2172   rtx sublo = gen_lowpart (word_mode, xop0);
2173   rtx_code_label *hi0_label = gen_label_rtx ();
2174   rtx_code_label *after_label = gen_label_rtx ();
2175   rtx_insn *seq;
2176   rtx temp, result;
2177
2178   /* If we were not given a target, use a word_mode register, not a
2179      'mode' register.  The result will fit, and nobody is expecting
2180      anything bigger (the return type of __builtin_clz* is int).  */
2181   if (!target)
2182     target = gen_reg_rtx (word_mode);
2183
2184   /* In any case, write to a word_mode scratch in both branches of the
2185      conditional, so we can ensure there is a single move insn setting
2186      'target' to tag a REG_EQUAL note on.  */
2187   result = gen_reg_rtx (word_mode);
2188
2189   start_sequence ();
2190
2191   /* If the high word is not equal to zero,
2192      then clz of the full value is clz of the high word.  */
2193   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2194                            word_mode, true, hi0_label);
2195
2196   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2197   if (!temp)
2198     goto fail;
2199
2200   if (temp != result)
2201     convert_move (result, temp, true);
2202
2203   emit_jump_insn (targetm.gen_jump (after_label));
2204   emit_barrier ();
2205
2206   /* Else clz of the full value is clz of the low word plus the number
2207      of bits in the high word.  */
2208   emit_label (hi0_label);
2209
2210   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2211   if (!temp)
2212     goto fail;
2213   temp = expand_binop (word_mode, add_optab, temp,
2214                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2215                        result, true, OPTAB_DIRECT);
2216   if (!temp)
2217     goto fail;
2218   if (temp != result)
2219     convert_move (result, temp, true);
2220
2221   emit_label (after_label);
2222   convert_move (target, result, true);
2223
2224   seq = get_insns ();
2225   end_sequence ();
2226
2227   add_equal_note (seq, target, CLZ, xop0, 0);
2228   emit_insn (seq);
2229   return target;
2230
2231  fail:
2232   end_sequence ();
2233   return 0;
2234 }
2235
2236 /* Try calculating popcount of a double-word quantity as two popcount's of
2237    word-sized quantities and summing up the results.  */
2238 static rtx
2239 expand_doubleword_popcount (machine_mode mode, rtx op0, rtx target)
2240 {
2241   rtx t0, t1, t;
2242   rtx_insn *seq;
2243
2244   start_sequence ();
2245
2246   t0 = expand_unop_direct (word_mode, popcount_optab,
2247                            operand_subword_force (op0, 0, mode), NULL_RTX,
2248                            true);
2249   t1 = expand_unop_direct (word_mode, popcount_optab,
2250                            operand_subword_force (op0, 1, mode), NULL_RTX,
2251                            true);
2252   if (!t0 || !t1)
2253     {
2254       end_sequence ();
2255       return NULL_RTX;
2256     }
2257
2258   /* If we were not given a target, use a word_mode register, not a
2259      'mode' register.  The result will fit, and nobody is expecting
2260      anything bigger (the return type of __builtin_popcount* is int).  */
2261   if (!target)
2262     target = gen_reg_rtx (word_mode);
2263
2264   t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2265
2266   seq = get_insns ();
2267   end_sequence ();
2268
2269   add_equal_note (seq, t, POPCOUNT, op0, 0);
2270   emit_insn (seq);
2271   return t;
2272 }
2273
2274 /* Try calculating
2275         (parity:wide x)
2276    as
2277         (parity:narrow (low (x) ^ high (x))) */
2278 static rtx
2279 expand_doubleword_parity (machine_mode mode, rtx op0, rtx target)
2280 {
2281   rtx t = expand_binop (word_mode, xor_optab,
2282                         operand_subword_force (op0, 0, mode),
2283                         operand_subword_force (op0, 1, mode),
2284                         NULL_RTX, 0, OPTAB_DIRECT);
2285   return expand_unop (word_mode, parity_optab, t, target, true);
2286 }
2287
2288 /* Try calculating
2289         (bswap:narrow x)
2290    as
2291         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2292 static rtx
2293 widen_bswap (machine_mode mode, rtx op0, rtx target)
2294 {
2295   enum mode_class mclass = GET_MODE_CLASS (mode);
2296   machine_mode wider_mode;
2297   rtx x;
2298   rtx_insn *last;
2299
2300   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2301     return NULL_RTX;
2302
2303   FOR_EACH_WIDER_MODE (wider_mode, mode)
2304     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2305       goto found;
2306   return NULL_RTX;
2307
2308  found:
2309   last = get_last_insn ();
2310
2311   x = widen_operand (op0, wider_mode, mode, true, true);
2312   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2313
2314   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2315               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2316   if (x != 0)
2317     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2318                       GET_MODE_BITSIZE (wider_mode)
2319                       - GET_MODE_BITSIZE (mode),
2320                       NULL_RTX, true);
2321
2322   if (x != 0)
2323     {
2324       if (target == 0)
2325         target = gen_reg_rtx (mode);
2326       emit_move_insn (target, gen_lowpart (mode, x));
2327     }
2328   else
2329     delete_insns_since (last);
2330
2331   return target;
2332 }
2333
2334 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2335
2336 static rtx
2337 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2338 {
2339   rtx t0, t1;
2340
2341   t1 = expand_unop (word_mode, bswap_optab,
2342                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2343   t0 = expand_unop (word_mode, bswap_optab,
2344                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2345
2346   if (target == 0 || !valid_multiword_target_p (target))
2347     target = gen_reg_rtx (mode);
2348   if (REG_P (target))
2349     emit_clobber (target);
2350   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2351   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2352
2353   return target;
2354 }
2355
2356 /* Try calculating (parity x) as (and (popcount x) 1), where
2357    popcount can also be done in a wider mode.  */
2358 static rtx
2359 expand_parity (machine_mode mode, rtx op0, rtx target)
2360 {
2361   enum mode_class mclass = GET_MODE_CLASS (mode);
2362   if (CLASS_HAS_WIDER_MODES_P (mclass))
2363     {
2364       machine_mode wider_mode;
2365       FOR_EACH_MODE_FROM (wider_mode, mode)
2366         {
2367           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2368             {
2369               rtx xop0, temp;
2370               rtx_insn *last;
2371
2372               last = get_last_insn ();
2373
2374               if (target == 0 || GET_MODE (target) != wider_mode)
2375                 target = gen_reg_rtx (wider_mode);
2376
2377               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2378               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2379                                   true);
2380               if (temp != 0)
2381                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2382                                      target, true, OPTAB_DIRECT);
2383
2384               if (temp)
2385                 {
2386                   if (mclass != MODE_INT
2387                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2388                     return convert_to_mode (mode, temp, 0);
2389                   else
2390                     return gen_lowpart (mode, temp);
2391                 }
2392               else
2393                 delete_insns_since (last);
2394             }
2395         }
2396     }
2397   return 0;
2398 }
2399
2400 /* Try calculating ctz(x) as K - clz(x & -x) ,
2401    where K is GET_MODE_PRECISION(mode) - 1.
2402
2403    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2404    don't have to worry about what the hardware does in that case.  (If
2405    the clz instruction produces the usual value at 0, which is K, the
2406    result of this code sequence will be -1; expand_ffs, below, relies
2407    on this.  It might be nice to have it be K instead, for consistency
2408    with the (very few) processors that provide a ctz with a defined
2409    value, but that would take one more instruction, and it would be
2410    less convenient for expand_ffs anyway.  */
2411
2412 static rtx
2413 expand_ctz (machine_mode mode, rtx op0, rtx target)
2414 {
2415   rtx_insn *seq;
2416   rtx temp;
2417
2418   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2419     return 0;
2420
2421   start_sequence ();
2422
2423   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2424   if (temp)
2425     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2426                          true, OPTAB_DIRECT);
2427   if (temp)
2428     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2429   if (temp)
2430     temp = expand_binop (mode, sub_optab,
2431                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2432                          temp, target,
2433                          true, OPTAB_DIRECT);
2434   if (temp == 0)
2435     {
2436       end_sequence ();
2437       return 0;
2438     }
2439
2440   seq = get_insns ();
2441   end_sequence ();
2442
2443   add_equal_note (seq, temp, CTZ, op0, 0);
2444   emit_insn (seq);
2445   return temp;
2446 }
2447
2448
2449 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2450    else with the sequence used by expand_clz.
2451
2452    The ffs builtin promises to return zero for a zero value and ctz/clz
2453    may have an undefined value in that case.  If they do not give us a
2454    convenient value, we have to generate a test and branch.  */
2455 static rtx
2456 expand_ffs (machine_mode mode, rtx op0, rtx target)
2457 {
2458   HOST_WIDE_INT val = 0;
2459   bool defined_at_zero = false;
2460   rtx temp;
2461   rtx_insn *seq;
2462
2463   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2464     {
2465       start_sequence ();
2466
2467       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2468       if (!temp)
2469         goto fail;
2470
2471       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2472     }
2473   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2474     {
2475       start_sequence ();
2476       temp = expand_ctz (mode, op0, 0);
2477       if (!temp)
2478         goto fail;
2479
2480       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2481         {
2482           defined_at_zero = true;
2483           val = (GET_MODE_PRECISION (mode) - 1) - val;
2484         }
2485     }
2486   else
2487     return 0;
2488
2489   if (defined_at_zero && val == -1)
2490     /* No correction needed at zero.  */;
2491   else
2492     {
2493       /* We don't try to do anything clever with the situation found
2494          on some processors (eg Alpha) where ctz(0:mode) ==
2495          bitsize(mode).  If someone can think of a way to send N to -1
2496          and leave alone all values in the range 0..N-1 (where N is a
2497          power of two), cheaper than this test-and-branch, please add it.
2498
2499          The test-and-branch is done after the operation itself, in case
2500          the operation sets condition codes that can be recycled for this.
2501          (This is true on i386, for instance.)  */
2502
2503       rtx_code_label *nonzero_label = gen_label_rtx ();
2504       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2505                                mode, true, nonzero_label);
2506
2507       convert_move (temp, GEN_INT (-1), false);
2508       emit_label (nonzero_label);
2509     }
2510
2511   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2512      to produce a value in the range 0..bitsize.  */
2513   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2514                        target, false, OPTAB_DIRECT);
2515   if (!temp)
2516     goto fail;
2517
2518   seq = get_insns ();
2519   end_sequence ();
2520
2521   add_equal_note (seq, temp, FFS, op0, 0);
2522   emit_insn (seq);
2523   return temp;
2524
2525  fail:
2526   end_sequence ();
2527   return 0;
2528 }
2529
2530 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2531    conditions, VAL may already be a SUBREG against which we cannot generate
2532    a further SUBREG.  In this case, we expect forcing the value into a
2533    register will work around the situation.  */
2534
2535 static rtx
2536 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2537                            machine_mode imode)
2538 {
2539   rtx ret;
2540   ret = lowpart_subreg (omode, val, imode);
2541   if (ret == NULL)
2542     {
2543       val = force_reg (imode, val);
2544       ret = lowpart_subreg (omode, val, imode);
2545       gcc_assert (ret != NULL);
2546     }
2547   return ret;
2548 }
2549
2550 /* Expand a floating point absolute value or negation operation via a
2551    logical operation on the sign bit.  */
2552
2553 static rtx
2554 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2555                    rtx op0, rtx target)
2556 {
2557   const struct real_format *fmt;
2558   int bitpos, word, nwords, i;
2559   machine_mode imode;
2560   rtx temp;
2561   rtx_insn *insns;
2562
2563   /* The format has to have a simple sign bit.  */
2564   fmt = REAL_MODE_FORMAT (mode);
2565   if (fmt == NULL)
2566     return NULL_RTX;
2567
2568   bitpos = fmt->signbit_rw;
2569   if (bitpos < 0)
2570     return NULL_RTX;
2571
2572   /* Don't create negative zeros if the format doesn't support them.  */
2573   if (code == NEG && !fmt->has_signed_zero)
2574     return NULL_RTX;
2575
2576   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2577     {
2578       if (!int_mode_for_mode (mode).exists (&imode))
2579         return NULL_RTX;
2580       word = 0;
2581       nwords = 1;
2582     }
2583   else
2584     {
2585       imode = word_mode;
2586
2587       if (FLOAT_WORDS_BIG_ENDIAN)
2588         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2589       else
2590         word = bitpos / BITS_PER_WORD;
2591       bitpos = bitpos % BITS_PER_WORD;
2592       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2593     }
2594
2595   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2596   if (code == ABS)
2597     mask = ~mask;
2598
2599   if (target == 0
2600       || target == op0
2601       || (nwords > 1 && !valid_multiword_target_p (target)))
2602     target = gen_reg_rtx (mode);
2603
2604   if (nwords > 1)
2605     {
2606       start_sequence ();
2607
2608       for (i = 0; i < nwords; ++i)
2609         {
2610           rtx targ_piece = operand_subword (target, i, 1, mode);
2611           rtx op0_piece = operand_subword_force (op0, i, mode);
2612
2613           if (i == word)
2614             {
2615               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2616                                    op0_piece,
2617                                    immed_wide_int_const (mask, imode),
2618                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2619               if (temp != targ_piece)
2620                 emit_move_insn (targ_piece, temp);
2621             }
2622           else
2623             emit_move_insn (targ_piece, op0_piece);
2624         }
2625
2626       insns = get_insns ();
2627       end_sequence ();
2628
2629       emit_insn (insns);
2630     }
2631   else
2632     {
2633       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2634                            gen_lowpart (imode, op0),
2635                            immed_wide_int_const (mask, imode),
2636                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2637       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2638
2639       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2640                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2641                         target);
2642     }
2643
2644   return target;
2645 }
2646
2647 /* As expand_unop, but will fail rather than attempt the operation in a
2648    different mode or with a libcall.  */
2649 static rtx
2650 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2651                     int unsignedp)
2652 {
2653   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2654     {
2655       struct expand_operand ops[2];
2656       enum insn_code icode = optab_handler (unoptab, mode);
2657       rtx_insn *last = get_last_insn ();
2658       rtx_insn *pat;
2659
2660       create_output_operand (&ops[0], target, mode);
2661       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2662       pat = maybe_gen_insn (icode, 2, ops);
2663       if (pat)
2664         {
2665           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2666               && ! add_equal_note (pat, ops[0].value,
2667                                    optab_to_code (unoptab),
2668                                    ops[1].value, NULL_RTX))
2669             {
2670               delete_insns_since (last);
2671               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2672             }
2673
2674           emit_insn (pat);
2675
2676           return ops[0].value;
2677         }
2678     }
2679   return 0;
2680 }
2681
2682 /* Generate code to perform an operation specified by UNOPTAB
2683    on operand OP0, with result having machine-mode MODE.
2684
2685    UNSIGNEDP is for the case where we have to widen the operands
2686    to perform the operation.  It says to use zero-extension.
2687
2688    If TARGET is nonzero, the value
2689    is generated there, if it is convenient to do so.
2690    In all cases an rtx is returned for the locus of the value;
2691    this may or may not be TARGET.  */
2692
2693 rtx
2694 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2695              int unsignedp)
2696 {
2697   enum mode_class mclass = GET_MODE_CLASS (mode);
2698   machine_mode wider_mode;
2699   scalar_float_mode float_mode;
2700   rtx temp;
2701   rtx libfunc;
2702
2703   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2704   if (temp)
2705     return temp;
2706
2707   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
2708
2709   /* Widening (or narrowing) clz needs special treatment.  */
2710   if (unoptab == clz_optab)
2711     {
2712       temp = widen_leading (mode, op0, target, unoptab);
2713       if (temp)
2714         return temp;
2715
2716       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2717           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2718         {
2719           temp = expand_doubleword_clz (mode, op0, target);
2720           if (temp)
2721             return temp;
2722         }
2723
2724       goto try_libcall;
2725     }
2726
2727   if (unoptab == clrsb_optab)
2728     {
2729       temp = widen_leading (mode, op0, target, unoptab);
2730       if (temp)
2731         return temp;
2732       goto try_libcall;
2733     }
2734
2735   if (unoptab == popcount_optab
2736       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2737       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2738       && optimize_insn_for_speed_p ())
2739     {
2740       temp = expand_doubleword_popcount (mode, op0, target);
2741       if (temp)
2742         return temp;
2743     }
2744
2745   if (unoptab == parity_optab
2746       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2747       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2748           || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2749       && optimize_insn_for_speed_p ())
2750     {
2751       temp = expand_doubleword_parity (mode, op0, target);
2752       if (temp)
2753         return temp;
2754     }
2755
2756   /* Widening (or narrowing) bswap needs special treatment.  */
2757   if (unoptab == bswap_optab)
2758     {
2759       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2760          or ROTATERT.  First try these directly; if this fails, then try the
2761          obvious pair of shifts with allowed widening, as this will probably
2762          be always more efficient than the other fallback methods.  */
2763       if (mode == HImode)
2764         {
2765           rtx_insn *last;
2766           rtx temp1, temp2;
2767
2768           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2769             {
2770               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
2771                                    unsignedp, OPTAB_DIRECT);
2772               if (temp)
2773                 return temp;
2774              }
2775
2776           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2777             {
2778               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
2779                                    unsignedp, OPTAB_DIRECT);
2780               if (temp)
2781                 return temp;
2782             }
2783
2784           last = get_last_insn ();
2785
2786           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
2787                                 unsignedp, OPTAB_WIDEN);
2788           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
2789                                 unsignedp, OPTAB_WIDEN);
2790           if (temp1 && temp2)
2791             {
2792               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2793                                    unsignedp, OPTAB_WIDEN);
2794               if (temp)
2795                 return temp;
2796             }
2797
2798           delete_insns_since (last);
2799         }
2800
2801       temp = widen_bswap (mode, op0, target);
2802       if (temp)
2803         return temp;
2804
2805       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2806           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2807         {
2808           temp = expand_doubleword_bswap (mode, op0, target);
2809           if (temp)
2810             return temp;
2811         }
2812
2813       goto try_libcall;
2814     }
2815
2816   if (CLASS_HAS_WIDER_MODES_P (mclass))
2817     FOR_EACH_WIDER_MODE (wider_mode, mode)
2818       {
2819         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2820           {
2821             rtx xop0 = op0;
2822             rtx_insn *last = get_last_insn ();
2823
2824             /* For certain operations, we need not actually extend
2825                the narrow operand, as long as we will truncate the
2826                results to the same narrowness.  */
2827
2828             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2829                                   (unoptab == neg_optab
2830                                    || unoptab == one_cmpl_optab)
2831                                   && mclass == MODE_INT);
2832
2833             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2834                                 unsignedp);
2835
2836             if (temp)
2837               {
2838                 if (mclass != MODE_INT
2839                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2840                   {
2841                     if (target == 0)
2842                       target = gen_reg_rtx (mode);
2843                     convert_move (target, temp, 0);
2844                     return target;
2845                   }
2846                 else
2847                   return gen_lowpart (mode, temp);
2848               }
2849             else
2850               delete_insns_since (last);
2851           }
2852       }
2853
2854   /* These can be done a word at a time.  */
2855   if (unoptab == one_cmpl_optab
2856       && mclass == MODE_INT
2857       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
2858       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2859     {
2860       int i;
2861       rtx_insn *insns;
2862
2863       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2864         target = gen_reg_rtx (mode);
2865
2866       start_sequence ();
2867
2868       /* Do the actual arithmetic.  */
2869       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
2870         {
2871           rtx target_piece = operand_subword (target, i, 1, mode);
2872           rtx x = expand_unop (word_mode, unoptab,
2873                                operand_subword_force (op0, i, mode),
2874                                target_piece, unsignedp);
2875
2876           if (target_piece != x)
2877             emit_move_insn (target_piece, x);
2878         }
2879
2880       insns = get_insns ();
2881       end_sequence ();
2882
2883       emit_insn (insns);
2884       return target;
2885     }
2886
2887   if (optab_to_code (unoptab) == NEG)
2888     {
2889       /* Try negating floating point values by flipping the sign bit.  */
2890       if (is_a <scalar_float_mode> (mode, &float_mode))
2891         {
2892           temp = expand_absneg_bit (NEG, float_mode, op0, target);
2893           if (temp)
2894             return temp;
2895         }
2896
2897       /* If there is no negation pattern, and we have no negative zero,
2898          try subtracting from zero.  */
2899       if (!HONOR_SIGNED_ZEROS (mode))
2900         {
2901           temp = expand_binop (mode, (unoptab == negv_optab
2902                                       ? subv_optab : sub_optab),
2903                                CONST0_RTX (mode), op0, target,
2904                                unsignedp, OPTAB_DIRECT);
2905           if (temp)
2906             return temp;
2907         }
2908     }
2909
2910   /* Try calculating parity (x) as popcount (x) % 2.  */
2911   if (unoptab == parity_optab)
2912     {
2913       temp = expand_parity (mode, op0, target);
2914       if (temp)
2915         return temp;
2916     }
2917
2918   /* Try implementing ffs (x) in terms of clz (x).  */
2919   if (unoptab == ffs_optab)
2920     {
2921       temp = expand_ffs (mode, op0, target);
2922       if (temp)
2923         return temp;
2924     }
2925
2926   /* Try implementing ctz (x) in terms of clz (x).  */
2927   if (unoptab == ctz_optab)
2928     {
2929       temp = expand_ctz (mode, op0, target);
2930       if (temp)
2931         return temp;
2932     }
2933
2934  try_libcall:
2935   /* Now try a library call in this mode.  */
2936   libfunc = optab_libfunc (unoptab, mode);
2937   if (libfunc)
2938     {
2939       rtx_insn *insns;
2940       rtx value;
2941       rtx eq_value;
2942       machine_mode outmode = mode;
2943
2944       /* All of these functions return small values.  Thus we choose to
2945          have them return something that isn't a double-word.  */
2946       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
2947           || unoptab == clrsb_optab || unoptab == popcount_optab
2948           || unoptab == parity_optab)
2949         outmode
2950           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
2951                                           optab_libfunc (unoptab, mode)));
2952
2953       start_sequence ();
2954
2955       /* Pass 1 for NO_QUEUE so we don't lose any increments
2956          if the libcall is cse'd or moved.  */
2957       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
2958                                        1, op0, mode);
2959       insns = get_insns ();
2960       end_sequence ();
2961
2962       target = gen_reg_rtx (outmode);
2963       bool trapv = trapv_unoptab_p (unoptab);
2964       if (trapv)
2965         eq_value = NULL_RTX;
2966       else
2967         {
2968           eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
2969           if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
2970             eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
2971           else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
2972             eq_value = simplify_gen_unary (ZERO_EXTEND,
2973                                            outmode, eq_value, mode);
2974         }
2975       emit_libcall_block_1 (insns, target, value, eq_value, trapv);
2976
2977       return target;
2978     }
2979
2980   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2981
2982   if (CLASS_HAS_WIDER_MODES_P (mclass))
2983     {
2984       FOR_EACH_WIDER_MODE (wider_mode, mode)
2985         {
2986           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
2987               || optab_libfunc (unoptab, wider_mode))
2988             {
2989               rtx xop0 = op0;
2990               rtx_insn *last = get_last_insn ();
2991
2992               /* For certain operations, we need not actually extend
2993                  the narrow operand, as long as we will truncate the
2994                  results to the same narrowness.  */
2995               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2996                                     (unoptab == neg_optab
2997                                      || unoptab == one_cmpl_optab
2998                                      || unoptab == bswap_optab)
2999                                     && mclass == MODE_INT);
3000
3001               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3002                                   unsignedp);
3003
3004               /* If we are generating clz using wider mode, adjust the
3005                  result.  Similarly for clrsb.  */
3006               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3007                   && temp != 0)
3008                 temp = expand_binop
3009                   (wider_mode, sub_optab, temp,
3010                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3011                                  - GET_MODE_PRECISION (mode),
3012                                  wider_mode),
3013                    target, true, OPTAB_DIRECT);
3014
3015               /* Likewise for bswap.  */
3016               if (unoptab == bswap_optab && temp != 0)
3017                 {
3018                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3019                               == GET_MODE_BITSIZE (wider_mode)
3020                               && GET_MODE_PRECISION (mode)
3021                                  == GET_MODE_BITSIZE (mode));
3022
3023                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3024                                        GET_MODE_BITSIZE (wider_mode)
3025                                        - GET_MODE_BITSIZE (mode),
3026                                        NULL_RTX, true);
3027                 }
3028
3029               if (temp)
3030                 {
3031                   if (mclass != MODE_INT)
3032                     {
3033                       if (target == 0)
3034                         target = gen_reg_rtx (mode);
3035                       convert_move (target, temp, 0);
3036                       return target;
3037                     }
3038                   else
3039                     return gen_lowpart (mode, temp);
3040                 }
3041               else
3042                 delete_insns_since (last);
3043             }
3044         }
3045     }
3046
3047   /* One final attempt at implementing negation via subtraction,
3048      this time allowing widening of the operand.  */
3049   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3050     {
3051       rtx temp;
3052       temp = expand_binop (mode,
3053                            unoptab == negv_optab ? subv_optab : sub_optab,
3054                            CONST0_RTX (mode), op0,
3055                            target, unsignedp, OPTAB_LIB_WIDEN);
3056       if (temp)
3057         return temp;
3058     }
3059
3060   return 0;
3061 }
3062 \f
3063 /* Emit code to compute the absolute value of OP0, with result to
3064    TARGET if convenient.  (TARGET may be 0.)  The return value says
3065    where the result actually is to be found.
3066
3067    MODE is the mode of the operand; the mode of the result is
3068    different but can be deduced from MODE.
3069
3070  */
3071
3072 rtx
3073 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3074                    int result_unsignedp)
3075 {
3076   rtx temp;
3077
3078   if (GET_MODE_CLASS (mode) != MODE_INT
3079       || ! flag_trapv)
3080     result_unsignedp = 1;
3081
3082   /* First try to do it with a special abs instruction.  */
3083   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3084                       op0, target, 0);
3085   if (temp != 0)
3086     return temp;
3087
3088   /* For floating point modes, try clearing the sign bit.  */
3089   scalar_float_mode float_mode;
3090   if (is_a <scalar_float_mode> (mode, &float_mode))
3091     {
3092       temp = expand_absneg_bit (ABS, float_mode, op0, target);
3093       if (temp)
3094         return temp;
3095     }
3096
3097   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3098   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3099       && !HONOR_SIGNED_ZEROS (mode))
3100     {
3101       rtx_insn *last = get_last_insn ();
3102
3103       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3104                           op0, NULL_RTX, 0);
3105       if (temp != 0)
3106         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3107                              OPTAB_WIDEN);
3108
3109       if (temp != 0)
3110         return temp;
3111
3112       delete_insns_since (last);
3113     }
3114
3115   /* If this machine has expensive jumps, we can do integer absolute
3116      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3117      where W is the width of MODE.  */
3118
3119   if (GET_MODE_CLASS (mode) == MODE_INT
3120       && BRANCH_COST (optimize_insn_for_speed_p (),
3121                       false) >= 2)
3122     {
3123       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3124                                    GET_MODE_PRECISION (mode) - 1,
3125                                    NULL_RTX, 0);
3126
3127       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3128                            OPTAB_LIB_WIDEN);
3129       if (temp != 0)
3130         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3131                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3132
3133       if (temp != 0)
3134         return temp;
3135     }
3136
3137   return NULL_RTX;
3138 }
3139
3140 rtx
3141 expand_abs (machine_mode mode, rtx op0, rtx target,
3142             int result_unsignedp, int safe)
3143 {
3144   rtx temp;
3145   rtx_code_label *op1;
3146
3147   if (GET_MODE_CLASS (mode) != MODE_INT
3148       || ! flag_trapv)
3149     result_unsignedp = 1;
3150
3151   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3152   if (temp != 0)
3153     return temp;
3154
3155   /* If that does not win, use conditional jump and negate.  */
3156
3157   /* It is safe to use the target if it is the same
3158      as the source if this is also a pseudo register */
3159   if (op0 == target && REG_P (op0)
3160       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3161     safe = 1;
3162
3163   op1 = gen_label_rtx ();
3164   if (target == 0 || ! safe
3165       || GET_MODE (target) != mode
3166       || (MEM_P (target) && MEM_VOLATILE_P (target))
3167       || (REG_P (target)
3168           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3169     target = gen_reg_rtx (mode);
3170
3171   emit_move_insn (target, op0);
3172   NO_DEFER_POP;
3173
3174   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3175                            NULL_RTX, NULL, op1,
3176                            profile_probability::uninitialized ());
3177
3178   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3179                      target, target, 0);
3180   if (op0 != target)
3181     emit_move_insn (target, op0);
3182   emit_label (op1);
3183   OK_DEFER_POP;
3184   return target;
3185 }
3186
3187 /* Emit code to compute the one's complement absolute value of OP0
3188    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3189    (TARGET may be NULL_RTX.)  The return value says where the result
3190    actually is to be found.
3191
3192    MODE is the mode of the operand; the mode of the result is
3193    different but can be deduced from MODE.  */
3194
3195 rtx
3196 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3197 {
3198   rtx temp;
3199
3200   /* Not applicable for floating point modes.  */
3201   if (FLOAT_MODE_P (mode))
3202     return NULL_RTX;
3203
3204   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3205   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3206     {
3207       rtx_insn *last = get_last_insn ();
3208
3209       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3210       if (temp != 0)
3211         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3212                              OPTAB_WIDEN);
3213
3214       if (temp != 0)
3215         return temp;
3216
3217       delete_insns_since (last);
3218     }
3219
3220   /* If this machine has expensive jumps, we can do one's complement
3221      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3222
3223   if (GET_MODE_CLASS (mode) == MODE_INT
3224       && BRANCH_COST (optimize_insn_for_speed_p (),
3225                      false) >= 2)
3226     {
3227       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3228                                    GET_MODE_PRECISION (mode) - 1,
3229                                    NULL_RTX, 0);
3230
3231       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3232                            OPTAB_LIB_WIDEN);
3233
3234       if (temp != 0)
3235         return temp;
3236     }
3237
3238   return NULL_RTX;
3239 }
3240
3241 /* A subroutine of expand_copysign, perform the copysign operation using the
3242    abs and neg primitives advertised to exist on the target.  The assumption
3243    is that we have a split register file, and leaving op0 in fp registers,
3244    and not playing with subregs so much, will help the register allocator.  */
3245
3246 static rtx
3247 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3248                         int bitpos, bool op0_is_abs)
3249 {
3250   machine_mode imode;
3251   enum insn_code icode;
3252   rtx sign;
3253   rtx_code_label *label;
3254
3255   if (target == op1)
3256     target = NULL_RTX;
3257
3258   /* Check if the back end provides an insn that handles signbit for the
3259      argument's mode. */
3260   icode = optab_handler (signbit_optab, mode);
3261   if (icode != CODE_FOR_nothing)
3262     {
3263       imode = insn_data[(int) icode].operand[0].mode;
3264       sign = gen_reg_rtx (imode);
3265       emit_unop_insn (icode, sign, op1, UNKNOWN);
3266     }
3267   else
3268     {
3269       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3270         {
3271           if (!int_mode_for_mode (mode).exists (&imode))
3272             return NULL_RTX;
3273           op1 = gen_lowpart (imode, op1);
3274         }
3275       else
3276         {
3277           int word;
3278
3279           imode = word_mode;
3280           if (FLOAT_WORDS_BIG_ENDIAN)
3281             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3282           else
3283             word = bitpos / BITS_PER_WORD;
3284           bitpos = bitpos % BITS_PER_WORD;
3285           op1 = operand_subword_force (op1, word, mode);
3286         }
3287
3288       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3289       sign = expand_binop (imode, and_optab, op1,
3290                            immed_wide_int_const (mask, imode),
3291                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3292     }
3293
3294   if (!op0_is_abs)
3295     {
3296       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3297       if (op0 == NULL)
3298         return NULL_RTX;
3299       target = op0;
3300     }
3301   else
3302     {
3303       if (target == NULL_RTX)
3304         target = copy_to_reg (op0);
3305       else
3306         emit_move_insn (target, op0);
3307     }
3308
3309   label = gen_label_rtx ();
3310   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3311
3312   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3313     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3314   else
3315     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3316   if (op0 != target)
3317     emit_move_insn (target, op0);
3318
3319   emit_label (label);
3320
3321   return target;
3322 }
3323
3324
3325 /* A subroutine of expand_copysign, perform the entire copysign operation
3326    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3327    is true if op0 is known to have its sign bit clear.  */
3328
3329 static rtx
3330 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3331                      int bitpos, bool op0_is_abs)
3332 {
3333   scalar_int_mode imode;
3334   int word, nwords, i;
3335   rtx temp;
3336   rtx_insn *insns;
3337
3338   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3339     {
3340       if (!int_mode_for_mode (mode).exists (&imode))
3341         return NULL_RTX;
3342       word = 0;
3343       nwords = 1;
3344     }
3345   else
3346     {
3347       imode = word_mode;
3348
3349       if (FLOAT_WORDS_BIG_ENDIAN)
3350         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3351       else
3352         word = bitpos / BITS_PER_WORD;
3353       bitpos = bitpos % BITS_PER_WORD;
3354       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3355     }
3356
3357   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3358
3359   if (target == 0
3360       || target == op0
3361       || target == op1
3362       || (nwords > 1 && !valid_multiword_target_p (target)))
3363     target = gen_reg_rtx (mode);
3364
3365   if (nwords > 1)
3366     {
3367       start_sequence ();
3368
3369       for (i = 0; i < nwords; ++i)
3370         {
3371           rtx targ_piece = operand_subword (target, i, 1, mode);
3372           rtx op0_piece = operand_subword_force (op0, i, mode);
3373
3374           if (i == word)
3375             {
3376               if (!op0_is_abs)
3377                 op0_piece
3378                   = expand_binop (imode, and_optab, op0_piece,
3379                                   immed_wide_int_const (~mask, imode),
3380                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3381               op1 = expand_binop (imode, and_optab,
3382                                   operand_subword_force (op1, i, mode),
3383                                   immed_wide_int_const (mask, imode),
3384                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3385
3386               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3387                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3388               if (temp != targ_piece)
3389                 emit_move_insn (targ_piece, temp);
3390             }
3391           else
3392             emit_move_insn (targ_piece, op0_piece);
3393         }
3394
3395       insns = get_insns ();
3396       end_sequence ();
3397
3398       emit_insn (insns);
3399     }
3400   else
3401     {
3402       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3403                           immed_wide_int_const (mask, imode),
3404                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3405
3406       op0 = gen_lowpart (imode, op0);
3407       if (!op0_is_abs)
3408         op0 = expand_binop (imode, and_optab, op0,
3409                             immed_wide_int_const (~mask, imode),
3410                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3411
3412       temp = expand_binop (imode, ior_optab, op0, op1,
3413                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3414       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3415     }
3416
3417   return target;
3418 }
3419
3420 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3421    scalar floating point mode.  Return NULL if we do not know how to
3422    expand the operation inline.  */
3423
3424 rtx
3425 expand_copysign (rtx op0, rtx op1, rtx target)
3426 {
3427   scalar_float_mode mode;
3428   const struct real_format *fmt;
3429   bool op0_is_abs;
3430   rtx temp;
3431
3432   mode = as_a <scalar_float_mode> (GET_MODE (op0));
3433   gcc_assert (GET_MODE (op1) == mode);
3434
3435   /* First try to do it with a special instruction.  */
3436   temp = expand_binop (mode, copysign_optab, op0, op1,
3437                        target, 0, OPTAB_DIRECT);
3438   if (temp)
3439     return temp;
3440
3441   fmt = REAL_MODE_FORMAT (mode);
3442   if (fmt == NULL || !fmt->has_signed_zero)
3443     return NULL_RTX;
3444
3445   op0_is_abs = false;
3446   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3447     {
3448       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3449         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3450       op0_is_abs = true;
3451     }
3452
3453   if (fmt->signbit_ro >= 0
3454       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3455           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3456               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3457     {
3458       temp = expand_copysign_absneg (mode, op0, op1, target,
3459                                      fmt->signbit_ro, op0_is_abs);
3460       if (temp)
3461         return temp;
3462     }
3463
3464   if (fmt->signbit_rw < 0)
3465     return NULL_RTX;
3466   return expand_copysign_bit (mode, op0, op1, target,
3467                               fmt->signbit_rw, op0_is_abs);
3468 }
3469 \f
3470 /* Generate an instruction whose insn-code is INSN_CODE,
3471    with two operands: an output TARGET and an input OP0.
3472    TARGET *must* be nonzero, and the output is always stored there.
3473    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3474    the value that is stored into TARGET.
3475
3476    Return false if expansion failed.  */
3477
3478 bool
3479 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3480                       enum rtx_code code)
3481 {
3482   struct expand_operand ops[2];
3483   rtx_insn *pat;
3484
3485   create_output_operand (&ops[0], target, GET_MODE (target));
3486   create_input_operand (&ops[1], op0, GET_MODE (op0));
3487   pat = maybe_gen_insn (icode, 2, ops);
3488   if (!pat)
3489     return false;
3490
3491   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3492       && code != UNKNOWN)
3493     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3494
3495   emit_insn (pat);
3496
3497   if (ops[0].value != target)
3498     emit_move_insn (target, ops[0].value);
3499   return true;
3500 }
3501 /* Generate an instruction whose insn-code is INSN_CODE,
3502    with two operands: an output TARGET and an input OP0.
3503    TARGET *must* be nonzero, and the output is always stored there.
3504    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3505    the value that is stored into TARGET.  */
3506
3507 void
3508 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3509 {
3510   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3511   gcc_assert (ok);
3512 }
3513 \f
3514 struct no_conflict_data
3515 {
3516   rtx target;
3517   rtx_insn *first, *insn;
3518   bool must_stay;
3519 };
3520
3521 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3522    the currently examined clobber / store has to stay in the list of
3523    insns that constitute the actual libcall block.  */
3524 static void
3525 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3526 {
3527   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3528
3529   /* If this inns directly contributes to setting the target, it must stay.  */
3530   if (reg_overlap_mentioned_p (p->target, dest))
3531     p->must_stay = true;
3532   /* If we haven't committed to keeping any other insns in the list yet,
3533      there is nothing more to check.  */
3534   else if (p->insn == p->first)
3535     return;
3536   /* If this insn sets / clobbers a register that feeds one of the insns
3537      already in the list, this insn has to stay too.  */
3538   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3539            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3540            || reg_used_between_p (dest, p->first, p->insn)
3541            /* Likewise if this insn depends on a register set by a previous
3542               insn in the list, or if it sets a result (presumably a hard
3543               register) that is set or clobbered by a previous insn.
3544               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3545               SET_DEST perform the former check on the address, and the latter
3546               check on the MEM.  */
3547            || (GET_CODE (set) == SET
3548                && (modified_in_p (SET_SRC (set), p->first)
3549                    || modified_in_p (SET_DEST (set), p->first)
3550                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3551                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3552     p->must_stay = true;
3553 }
3554
3555 \f
3556 /* Emit code to make a call to a constant function or a library call.
3557
3558    INSNS is a list containing all insns emitted in the call.
3559    These insns leave the result in RESULT.  Our block is to copy RESULT
3560    to TARGET, which is logically equivalent to EQUIV.
3561
3562    We first emit any insns that set a pseudo on the assumption that these are
3563    loading constants into registers; doing so allows them to be safely cse'ed
3564    between blocks.  Then we emit all the other insns in the block, followed by
3565    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3566    note with an operand of EQUIV.  */
3567
3568 static void
3569 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3570                       bool equiv_may_trap)
3571 {
3572   rtx final_dest = target;
3573   rtx_insn *next, *last, *insn;
3574
3575   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3576      into a MEM later.  Protect the libcall block from this change.  */
3577   if (! REG_P (target) || REG_USERVAR_P (target))
3578     target = gen_reg_rtx (GET_MODE (target));
3579
3580   /* If we're using non-call exceptions, a libcall corresponding to an
3581      operation that may trap may also trap.  */
3582   /* ??? See the comment in front of make_reg_eh_region_note.  */
3583   if (cfun->can_throw_non_call_exceptions
3584       && (equiv_may_trap || may_trap_p (equiv)))
3585     {
3586       for (insn = insns; insn; insn = NEXT_INSN (insn))
3587         if (CALL_P (insn))
3588           {
3589             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3590             if (note)
3591               {
3592                 int lp_nr = INTVAL (XEXP (note, 0));
3593                 if (lp_nr == 0 || lp_nr == INT_MIN)
3594                   remove_note (insn, note);
3595               }
3596           }
3597     }
3598   else
3599     {
3600       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3601          reg note to indicate that this call cannot throw or execute a nonlocal
3602          goto (unless there is already a REG_EH_REGION note, in which case
3603          we update it).  */
3604       for (insn = insns; insn; insn = NEXT_INSN (insn))
3605         if (CALL_P (insn))
3606           make_reg_eh_region_note_nothrow_nononlocal (insn);
3607     }
3608
3609   /* First emit all insns that set pseudos.  Remove them from the list as
3610      we go.  Avoid insns that set pseudos which were referenced in previous
3611      insns.  These can be generated by move_by_pieces, for example,
3612      to update an address.  Similarly, avoid insns that reference things
3613      set in previous insns.  */
3614
3615   for (insn = insns; insn; insn = next)
3616     {
3617       rtx set = single_set (insn);
3618
3619       next = NEXT_INSN (insn);
3620
3621       if (set != 0 && REG_P (SET_DEST (set))
3622           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3623         {
3624           struct no_conflict_data data;
3625
3626           data.target = const0_rtx;
3627           data.first = insns;
3628           data.insn = insn;
3629           data.must_stay = 0;
3630           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3631           if (! data.must_stay)
3632             {
3633               if (PREV_INSN (insn))
3634                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3635               else
3636                 insns = next;
3637
3638               if (next)
3639                 SET_PREV_INSN (next) = PREV_INSN (insn);
3640
3641               add_insn (insn);
3642             }
3643         }
3644
3645       /* Some ports use a loop to copy large arguments onto the stack.
3646          Don't move anything outside such a loop.  */
3647       if (LABEL_P (insn))
3648         break;
3649     }
3650
3651   /* Write the remaining insns followed by the final copy.  */
3652   for (insn = insns; insn; insn = next)
3653     {
3654       next = NEXT_INSN (insn);
3655
3656       add_insn (insn);
3657     }
3658
3659   last = emit_move_insn (target, result);
3660   if (equiv)
3661     set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3662
3663   if (final_dest != target)
3664     emit_move_insn (final_dest, target);
3665 }
3666
3667 void
3668 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3669 {
3670   emit_libcall_block_1 (insns, target, result, equiv, false);
3671 }
3672 \f
3673 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3674    PURPOSE describes how this comparison will be used.  CODE is the rtx
3675    comparison code we will be using.
3676
3677    ??? Actually, CODE is slightly weaker than that.  A target is still
3678    required to implement all of the normal bcc operations, but not
3679    required to implement all (or any) of the unordered bcc operations.  */
3680
3681 int
3682 can_compare_p (enum rtx_code code, machine_mode mode,
3683                enum can_compare_purpose purpose)
3684 {
3685   rtx test;
3686   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3687   do
3688     {
3689       enum insn_code icode;
3690
3691       if (purpose == ccp_jump
3692           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3693           && insn_operand_matches (icode, 0, test))
3694         return 1;
3695       if (purpose == ccp_store_flag
3696           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3697           && insn_operand_matches (icode, 1, test))
3698         return 1;
3699       if (purpose == ccp_cmov
3700           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3701         return 1;
3702
3703       mode = GET_MODE_WIDER_MODE (mode).else_void ();
3704       PUT_MODE (test, mode);
3705     }
3706   while (mode != VOIDmode);
3707
3708   return 0;
3709 }
3710
3711 /* This function is called when we are going to emit a compare instruction that
3712    compares the values found in X and Y, using the rtl operator COMPARISON.
3713
3714    If they have mode BLKmode, then SIZE specifies the size of both operands.
3715
3716    UNSIGNEDP nonzero says that the operands are unsigned;
3717    this matters if they need to be widened (as given by METHODS).
3718
3719    *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3720    if we failed to produce one.
3721
3722    *PMODE is the mode of the inputs (in case they are const_int).
3723
3724    This function performs all the setup necessary so that the caller only has
3725    to emit a single comparison insn.  This setup can involve doing a BLKmode
3726    comparison or emitting a library call to perform the comparison if no insn
3727    is available to handle it.
3728    The values which are passed in through pointers can be modified; the caller
3729    should perform the comparison on the modified values.  Constant
3730    comparisons must have already been folded.  */
3731
3732 static void
3733 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3734                   int unsignedp, enum optab_methods methods,
3735                   rtx *ptest, machine_mode *pmode)
3736 {
3737   machine_mode mode = *pmode;
3738   rtx libfunc, test;
3739   machine_mode cmp_mode;
3740   enum mode_class mclass;
3741
3742   /* The other methods are not needed.  */
3743   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3744               || methods == OPTAB_LIB_WIDEN);
3745
3746   /* If we are optimizing, force expensive constants into a register.  */
3747   if (CONSTANT_P (x) && optimize
3748       && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3749           > COSTS_N_INSNS (1)))
3750     x = force_reg (mode, x);
3751
3752   if (CONSTANT_P (y) && optimize
3753       && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3754           > COSTS_N_INSNS (1)))
3755     y = force_reg (mode, y);
3756
3757 #if HAVE_cc0
3758   /* Make sure if we have a canonical comparison.  The RTL
3759      documentation states that canonical comparisons are required only
3760      for targets which have cc0.  */
3761   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3762 #endif
3763
3764   /* Don't let both operands fail to indicate the mode.  */
3765   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3766     x = force_reg (mode, x);
3767   if (mode == VOIDmode)
3768     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3769
3770   /* Handle all BLKmode compares.  */
3771
3772   if (mode == BLKmode)
3773     {
3774       machine_mode result_mode;
3775       enum insn_code cmp_code;
3776       rtx result;
3777       rtx opalign
3778         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3779
3780       gcc_assert (size);
3781
3782       /* Try to use a memory block compare insn - either cmpstr
3783          or cmpmem will do.  */
3784       FOR_EACH_MODE_IN_CLASS (cmp_mode, MODE_INT)
3785         {
3786           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3787           if (cmp_code == CODE_FOR_nothing)
3788             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3789           if (cmp_code == CODE_FOR_nothing)
3790             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3791           if (cmp_code == CODE_FOR_nothing)
3792             continue;
3793
3794           /* Must make sure the size fits the insn's mode.  */
3795           if ((CONST_INT_P (size)
3796                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
3797               || (GET_MODE_BITSIZE (GET_MODE (size))
3798                   > GET_MODE_BITSIZE (cmp_mode)))
3799             continue;
3800
3801           result_mode = insn_data[cmp_code].operand[0].mode;
3802           result = gen_reg_rtx (result_mode);
3803           size = convert_to_mode (cmp_mode, size, 1);
3804           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3805
3806           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3807           *pmode = result_mode;
3808           return;
3809         }
3810
3811       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3812         goto fail;
3813
3814       /* Otherwise call a library function.  */
3815       result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3816
3817       x = result;
3818       y = const0_rtx;
3819       mode = TYPE_MODE (integer_type_node);
3820       methods = OPTAB_LIB_WIDEN;
3821       unsignedp = false;
3822     }
3823
3824   /* Don't allow operands to the compare to trap, as that can put the
3825      compare and branch in different basic blocks.  */
3826   if (cfun->can_throw_non_call_exceptions)
3827     {
3828       if (may_trap_p (x))
3829         x = copy_to_reg (x);
3830       if (may_trap_p (y))
3831         y = copy_to_reg (y);
3832     }
3833
3834   if (GET_MODE_CLASS (mode) == MODE_CC)
3835     {
3836       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3837       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3838       gcc_assert (icode != CODE_FOR_nothing
3839                   && insn_operand_matches (icode, 0, test));
3840       *ptest = test;
3841       return;
3842     }
3843
3844   mclass = GET_MODE_CLASS (mode);
3845   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3846   FOR_EACH_MODE_FROM (cmp_mode, mode)
3847     {
3848       enum insn_code icode;
3849       icode = optab_handler (cbranch_optab, cmp_mode);
3850       if (icode != CODE_FOR_nothing
3851           && insn_operand_matches (icode, 0, test))
3852         {
3853           rtx_insn *last = get_last_insn ();
3854           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3855           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3856           if (op0 && op1
3857               && insn_operand_matches (icode, 1, op0)
3858               && insn_operand_matches (icode, 2, op1))
3859             {
3860               XEXP (test, 0) = op0;
3861               XEXP (test, 1) = op1;
3862               *ptest = test;
3863               *pmode = cmp_mode;
3864               return;
3865             }
3866           delete_insns_since (last);
3867         }
3868
3869       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3870         break;
3871     }
3872
3873   if (methods != OPTAB_LIB_WIDEN)
3874     goto fail;
3875
3876   if (!SCALAR_FLOAT_MODE_P (mode))
3877     {
3878       rtx result;
3879       machine_mode ret_mode;
3880
3881       /* Handle a libcall just for the mode we are using.  */
3882       libfunc = optab_libfunc (cmp_optab, mode);
3883       gcc_assert (libfunc);
3884
3885       /* If we want unsigned, and this mode has a distinct unsigned
3886          comparison routine, use that.  */
3887       if (unsignedp)
3888         {
3889           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3890           if (ulibfunc)
3891             libfunc = ulibfunc;
3892         }
3893
3894       ret_mode = targetm.libgcc_cmp_return_mode ();
3895       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3896                                         ret_mode, 2, x, mode, y, mode);
3897
3898       /* There are two kinds of comparison routines. Biased routines
3899          return 0/1/2, and unbiased routines return -1/0/1. Other parts
3900          of gcc expect that the comparison operation is equivalent
3901          to the modified comparison. For signed comparisons compare the
3902          result against 1 in the biased case, and zero in the unbiased
3903          case. For unsigned comparisons always compare against 1 after
3904          biasing the unbiased result by adding 1. This gives us a way to
3905          represent LTU.
3906          The comparisons in the fixed-point helper library are always
3907          biased.  */
3908       x = result;
3909       y = const1_rtx;
3910
3911       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3912         {
3913           if (unsignedp)
3914             x = plus_constant (ret_mode, result, 1);
3915           else
3916             y = const0_rtx;
3917         }
3918
3919       *pmode = ret_mode;
3920       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
3921                         ptest, pmode);
3922     }
3923   else
3924     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3925
3926   return;
3927
3928  fail:
3929   *ptest = NULL_RTX;
3930 }
3931
3932 /* Before emitting an insn with code ICODE, make sure that X, which is going
3933    to be used for operand OPNUM of the insn, is converted from mode MODE to
3934    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
3935    that it is accepted by the operand predicate.  Return the new value.  */
3936
3937 rtx
3938 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
3939                  machine_mode wider_mode, int unsignedp)
3940 {
3941   if (mode != wider_mode)
3942     x = convert_modes (wider_mode, mode, x, unsignedp);
3943
3944   if (!insn_operand_matches (icode, opnum, x))
3945     {
3946       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
3947       if (reload_completed)
3948         return NULL_RTX;
3949       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
3950         return NULL_RTX;
3951       x = copy_to_mode_reg (op_mode, x);
3952     }
3953
3954   return x;
3955 }
3956
3957 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
3958    we can do the branch.  */
3959
3960 static void
3961 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
3962                           profile_probability prob)
3963 {
3964   machine_mode optab_mode;
3965   enum mode_class mclass;
3966   enum insn_code icode;
3967   rtx_insn *insn;
3968
3969   mclass = GET_MODE_CLASS (mode);
3970   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
3971   icode = optab_handler (cbranch_optab, optab_mode);
3972
3973   gcc_assert (icode != CODE_FOR_nothing);
3974   gcc_assert (insn_operand_matches (icode, 0, test));
3975   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
3976                                           XEXP (test, 1), label));
3977   if (prob.initialized_p ()
3978       && profile_status_for_fn (cfun) != PROFILE_ABSENT
3979       && insn
3980       && JUMP_P (insn)
3981       && any_condjump_p (insn)
3982       && !find_reg_note (insn, REG_BR_PROB, 0))
3983     add_reg_br_prob_note (insn, prob);
3984 }
3985
3986 /* Generate code to compare X with Y so that the condition codes are
3987    set and to jump to LABEL if the condition is true.  If X is a
3988    constant and Y is not a constant, then the comparison is swapped to
3989    ensure that the comparison RTL has the canonical form.
3990
3991    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
3992    need to be widened.  UNSIGNEDP is also used to select the proper
3993    branch condition code.
3994
3995    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
3996
3997    MODE is the mode of the inputs (in case they are const_int).
3998
3999    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4000    It will be potentially converted into an unsigned variant based on
4001    UNSIGNEDP to select a proper jump instruction.
4002
4003    PROB is the probability of jumping to LABEL.  */
4004
4005 void
4006 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4007                          machine_mode mode, int unsignedp, rtx label,
4008                          profile_probability prob)
4009 {
4010   rtx op0 = x, op1 = y;
4011   rtx test;
4012
4013   /* Swap operands and condition to ensure canonical RTL.  */
4014   if (swap_commutative_operands_p (x, y)
4015       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4016     {
4017       op0 = y, op1 = x;
4018       comparison = swap_condition (comparison);
4019     }
4020
4021   /* If OP0 is still a constant, then both X and Y must be constants
4022      or the opposite comparison is not supported.  Force X into a register
4023      to create canonical RTL.  */
4024   if (CONSTANT_P (op0))
4025     op0 = force_reg (mode, op0);
4026
4027   if (unsignedp)
4028     comparison = unsigned_condition (comparison);
4029
4030   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4031                     &test, &mode);
4032   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4033 }
4034
4035 \f
4036 /* Emit a library call comparison between floating point X and Y.
4037    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4038
4039 static void
4040 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4041                        rtx *ptest, machine_mode *pmode)
4042 {
4043   enum rtx_code swapped = swap_condition (comparison);
4044   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4045   machine_mode orig_mode = GET_MODE (x);
4046   machine_mode mode, cmp_mode;
4047   rtx true_rtx, false_rtx;
4048   rtx value, target, equiv;
4049   rtx_insn *insns;
4050   rtx libfunc = 0;
4051   bool reversed_p = false;
4052   cmp_mode = targetm.libgcc_cmp_return_mode ();
4053
4054   FOR_EACH_MODE_FROM (mode, orig_mode)
4055     {
4056       if (code_to_optab (comparison)
4057           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4058         break;
4059
4060       if (code_to_optab (swapped)
4061           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4062         {
4063           std::swap (x, y);
4064           comparison = swapped;
4065           break;
4066         }
4067
4068       if (code_to_optab (reversed)
4069           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4070         {
4071           comparison = reversed;
4072           reversed_p = true;
4073           break;
4074         }
4075     }
4076
4077   gcc_assert (mode != VOIDmode);
4078
4079   if (mode != orig_mode)
4080     {
4081       x = convert_to_mode (mode, x, 0);
4082       y = convert_to_mode (mode, y, 0);
4083     }
4084
4085   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4086      the RTL.  The allows the RTL optimizers to delete the libcall if the
4087      condition can be determined at compile-time.  */
4088   if (comparison == UNORDERED
4089       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4090     {
4091       true_rtx = const_true_rtx;
4092       false_rtx = const0_rtx;
4093     }
4094   else
4095     {
4096       switch (comparison)
4097         {
4098         case EQ:
4099           true_rtx = const0_rtx;
4100           false_rtx = const_true_rtx;
4101           break;
4102
4103         case NE:
4104           true_rtx = const_true_rtx;
4105           false_rtx = const0_rtx;
4106           break;
4107
4108         case GT:
4109           true_rtx = const1_rtx;
4110           false_rtx = const0_rtx;
4111           break;
4112
4113         case GE:
4114           true_rtx = const0_rtx;
4115           false_rtx = constm1_rtx;
4116           break;
4117
4118         case LT:
4119           true_rtx = constm1_rtx;
4120           false_rtx = const0_rtx;
4121           break;
4122
4123         case LE:
4124           true_rtx = const0_rtx;
4125           false_rtx = const1_rtx;
4126           break;
4127
4128         default:
4129           gcc_unreachable ();
4130         }
4131     }
4132
4133   if (comparison == UNORDERED)
4134     {
4135       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4136       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4137       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4138                                     temp, const_true_rtx, equiv);
4139     }
4140   else
4141     {
4142       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4143       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4144         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4145                                       equiv, true_rtx, false_rtx);
4146     }
4147
4148   start_sequence ();
4149   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4150                                    cmp_mode, 2, x, mode, y, mode);
4151   insns = get_insns ();
4152   end_sequence ();
4153
4154   target = gen_reg_rtx (cmp_mode);
4155   emit_libcall_block (insns, target, value, equiv);
4156
4157   if (comparison == UNORDERED
4158       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4159       || reversed_p)
4160     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4161   else
4162     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4163
4164   *pmode = cmp_mode;
4165 }
4166 \f
4167 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4168
4169 void
4170 emit_indirect_jump (rtx loc)
4171 {
4172   if (!targetm.have_indirect_jump ())
4173     sorry ("indirect jumps are not available on this target");
4174   else
4175     {
4176       struct expand_operand ops[1];
4177       create_address_operand (&ops[0], loc);
4178       expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4179       emit_barrier ();
4180     }
4181 }
4182 \f
4183
4184 /* Emit a conditional move instruction if the machine supports one for that
4185    condition and machine mode.
4186
4187    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4188    the mode to use should they be constants.  If it is VOIDmode, they cannot
4189    both be constants.
4190
4191    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4192    should be stored there.  MODE is the mode to use should they be constants.
4193    If it is VOIDmode, they cannot both be constants.
4194
4195    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4196    is not supported.  */
4197
4198 rtx
4199 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4200                        machine_mode cmode, rtx op2, rtx op3,
4201                        machine_mode mode, int unsignedp)
4202 {
4203   rtx comparison;
4204   rtx_insn *last;
4205   enum insn_code icode;
4206   enum rtx_code reversed;
4207
4208   /* If the two source operands are identical, that's just a move.  */
4209
4210   if (rtx_equal_p (op2, op3))
4211     {
4212       if (!target)
4213         target = gen_reg_rtx (mode);
4214
4215       emit_move_insn (target, op3);
4216       return target;
4217     }
4218
4219   /* If one operand is constant, make it the second one.  Only do this
4220      if the other operand is not constant as well.  */
4221
4222   if (swap_commutative_operands_p (op0, op1))
4223     {
4224       std::swap (op0, op1);
4225       code = swap_condition (code);
4226     }
4227
4228   /* get_condition will prefer to generate LT and GT even if the old
4229      comparison was against zero, so undo that canonicalization here since
4230      comparisons against zero are cheaper.  */
4231   if (code == LT && op1 == const1_rtx)
4232     code = LE, op1 = const0_rtx;
4233   else if (code == GT && op1 == constm1_rtx)
4234     code = GE, op1 = const0_rtx;
4235
4236   if (cmode == VOIDmode)
4237     cmode = GET_MODE (op0);
4238
4239   enum rtx_code orig_code = code;
4240   bool swapped = false;
4241   if (swap_commutative_operands_p (op2, op3)
4242       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4243           != UNKNOWN))
4244     {
4245       std::swap (op2, op3);
4246       code = reversed;
4247       swapped = true;
4248     }
4249
4250   if (mode == VOIDmode)
4251     mode = GET_MODE (op2);
4252
4253   icode = direct_optab_handler (movcc_optab, mode);
4254
4255   if (icode == CODE_FOR_nothing)
4256     return NULL_RTX;
4257
4258   if (!target)
4259     target = gen_reg_rtx (mode);
4260
4261   for (int pass = 0; ; pass++)
4262     {
4263       code = unsignedp ? unsigned_condition (code) : code;
4264       comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4265
4266       /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4267          punt and let the caller figure out how best to deal with this
4268          situation.  */
4269       if (COMPARISON_P (comparison))
4270         {
4271           saved_pending_stack_adjust save;
4272           save_pending_stack_adjust (&save);
4273           last = get_last_insn ();
4274           do_pending_stack_adjust ();
4275           prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4276                             GET_CODE (comparison), NULL_RTX, unsignedp,
4277                             OPTAB_WIDEN, &comparison, &cmode);
4278           if (comparison)
4279             {
4280               struct expand_operand ops[4];
4281
4282               create_output_operand (&ops[0], target, mode);
4283               create_fixed_operand (&ops[1], comparison);
4284               create_input_operand (&ops[2], op2, mode);
4285               create_input_operand (&ops[3], op3, mode);
4286               if (maybe_expand_insn (icode, 4, ops))
4287                 {
4288                   if (ops[0].value != target)
4289                     convert_move (target, ops[0].value, false);
4290                   return target;
4291                 }
4292             }
4293           delete_insns_since (last);
4294           restore_pending_stack_adjust (&save);
4295         }
4296
4297       if (pass == 1)
4298         return NULL_RTX;
4299
4300       /* If the preferred op2/op3 order is not usable, retry with other
4301          operand order, perhaps it will expand successfully.  */
4302       if (swapped)
4303         code = orig_code;
4304       else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4305                                                            NULL))
4306                != UNKNOWN)
4307         code = reversed;
4308       else
4309         return NULL_RTX;
4310       std::swap (op2, op3);
4311     }
4312 }
4313
4314
4315 /* Emit a conditional negate or bitwise complement using the
4316    negcc or notcc optabs if available.  Return NULL_RTX if such operations
4317    are not available.  Otherwise return the RTX holding the result.
4318    TARGET is the desired destination of the result.  COMP is the comparison
4319    on which to negate.  If COND is true move into TARGET the negation
4320    or bitwise complement of OP1.  Otherwise move OP2 into TARGET.
4321    CODE is either NEG or NOT.  MODE is the machine mode in which the
4322    operation is performed.  */
4323
4324 rtx
4325 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4326                                      machine_mode mode, rtx cond, rtx op1,
4327                                      rtx op2)
4328 {
4329   optab op = unknown_optab;
4330   if (code == NEG)
4331     op = negcc_optab;
4332   else if (code == NOT)
4333     op = notcc_optab;
4334   else
4335     gcc_unreachable ();
4336
4337   insn_code icode = direct_optab_handler (op, mode);
4338
4339   if (icode == CODE_FOR_nothing)
4340     return NULL_RTX;
4341
4342   if (!target)
4343     target = gen_reg_rtx (mode);
4344
4345   rtx_insn *last = get_last_insn ();
4346   struct expand_operand ops[4];
4347
4348   create_output_operand (&ops[0], target, mode);
4349   create_fixed_operand (&ops[1], cond);
4350   create_input_operand (&ops[2], op1, mode);
4351   create_input_operand (&ops[3], op2, mode);
4352
4353   if (maybe_expand_insn (icode, 4, ops))
4354     {
4355       if (ops[0].value != target)
4356         convert_move (target, ops[0].value, false);
4357
4358       return target;
4359     }
4360   delete_insns_since (last);
4361   return NULL_RTX;
4362 }
4363
4364 /* Emit a conditional addition instruction if the machine supports one for that
4365    condition and machine mode.
4366
4367    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4368    the mode to use should they be constants.  If it is VOIDmode, they cannot
4369    both be constants.
4370
4371    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4372    should be stored there.  MODE is the mode to use should they be constants.
4373    If it is VOIDmode, they cannot both be constants.
4374
4375    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4376    is not supported.  */
4377
4378 rtx
4379 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4380                       machine_mode cmode, rtx op2, rtx op3,
4381                       machine_mode mode, int unsignedp)
4382 {
4383   rtx comparison;
4384   rtx_insn *last;
4385   enum insn_code icode;
4386
4387   /* If one operand is constant, make it the second one.  Only do this
4388      if the other operand is not constant as well.  */
4389
4390   if (swap_commutative_operands_p (op0, op1))
4391     {
4392       std::swap (op0, op1);
4393       code = swap_condition (code);
4394     }
4395
4396   /* get_condition will prefer to generate LT and GT even if the old
4397      comparison was against zero, so undo that canonicalization here since
4398      comparisons against zero are cheaper.  */
4399   if (code == LT && op1 == const1_rtx)
4400     code = LE, op1 = const0_rtx;
4401   else if (code == GT && op1 == constm1_rtx)
4402     code = GE, op1 = const0_rtx;
4403
4404   if (cmode == VOIDmode)
4405     cmode = GET_MODE (op0);
4406
4407   if (mode == VOIDmode)
4408     mode = GET_MODE (op2);
4409
4410   icode = optab_handler (addcc_optab, mode);
4411
4412   if (icode == CODE_FOR_nothing)
4413     return 0;
4414
4415   if (!target)
4416     target = gen_reg_rtx (mode);
4417
4418   code = unsignedp ? unsigned_condition (code) : code;
4419   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4420
4421   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4422      return NULL and let the caller figure out how best to deal with this
4423      situation.  */
4424   if (!COMPARISON_P (comparison))
4425     return NULL_RTX;
4426
4427   do_pending_stack_adjust ();
4428   last = get_last_insn ();
4429   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4430                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4431                     &comparison, &cmode);
4432   if (comparison)
4433     {
4434       struct expand_operand ops[4];
4435
4436       create_output_operand (&ops[0], target, mode);
4437       create_fixed_operand (&ops[1], comparison);
4438       create_input_operand (&ops[2], op2, mode);
4439       create_input_operand (&ops[3], op3, mode);
4440       if (maybe_expand_insn (icode, 4, ops))
4441         {
4442           if (ops[0].value != target)
4443             convert_move (target, ops[0].value, false);
4444           return target;
4445         }
4446     }
4447   delete_insns_since (last);
4448   return NULL_RTX;
4449 }
4450 \f
4451 /* These functions attempt to generate an insn body, rather than
4452    emitting the insn, but if the gen function already emits them, we
4453    make no attempt to turn them back into naked patterns.  */
4454
4455 /* Generate and return an insn body to add Y to X.  */
4456
4457 rtx_insn *
4458 gen_add2_insn (rtx x, rtx y)
4459 {
4460   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4461
4462   gcc_assert (insn_operand_matches (icode, 0, x));
4463   gcc_assert (insn_operand_matches (icode, 1, x));
4464   gcc_assert (insn_operand_matches (icode, 2, y));
4465
4466   return GEN_FCN (icode) (x, x, y);
4467 }
4468
4469 /* Generate and return an insn body to add r1 and c,
4470    storing the result in r0.  */
4471
4472 rtx_insn *
4473 gen_add3_insn (rtx r0, rtx r1, rtx c)
4474 {
4475   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4476
4477   if (icode == CODE_FOR_nothing
4478       || !insn_operand_matches (icode, 0, r0)
4479       || !insn_operand_matches (icode, 1, r1)
4480       || !insn_operand_matches (icode, 2, c))
4481     return NULL;
4482
4483   return GEN_FCN (icode) (r0, r1, c);
4484 }
4485
4486 int
4487 have_add2_insn (rtx x, rtx y)
4488 {
4489   enum insn_code icode;
4490
4491   gcc_assert (GET_MODE (x) != VOIDmode);
4492
4493   icode = optab_handler (add_optab, GET_MODE (x));
4494
4495   if (icode == CODE_FOR_nothing)
4496     return 0;
4497
4498   if (!insn_operand_matches (icode, 0, x)
4499       || !insn_operand_matches (icode, 1, x)
4500       || !insn_operand_matches (icode, 2, y))
4501     return 0;
4502
4503   return 1;
4504 }
4505
4506 /* Generate and return an insn body to add Y to X.  */
4507
4508 rtx_insn *
4509 gen_addptr3_insn (rtx x, rtx y, rtx z)
4510 {
4511   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4512
4513   gcc_assert (insn_operand_matches (icode, 0, x));
4514   gcc_assert (insn_operand_matches (icode, 1, y));
4515   gcc_assert (insn_operand_matches (icode, 2, z));
4516
4517   return GEN_FCN (icode) (x, y, z);
4518 }
4519
4520 /* Return true if the target implements an addptr pattern and X, Y,
4521    and Z are valid for the pattern predicates.  */
4522
4523 int
4524 have_addptr3_insn (rtx x, rtx y, rtx z)
4525 {
4526   enum insn_code icode;
4527
4528   gcc_assert (GET_MODE (x) != VOIDmode);
4529
4530   icode = optab_handler (addptr3_optab, GET_MODE (x));
4531
4532   if (icode == CODE_FOR_nothing)
4533     return 0;
4534
4535   if (!insn_operand_matches (icode, 0, x)
4536       || !insn_operand_matches (icode, 1, y)
4537       || !insn_operand_matches (icode, 2, z))
4538     return 0;
4539
4540   return 1;
4541 }
4542
4543 /* Generate and return an insn body to subtract Y from X.  */
4544
4545 rtx_insn *
4546 gen_sub2_insn (rtx x, rtx y)
4547 {
4548   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4549
4550   gcc_assert (insn_operand_matches (icode, 0, x));
4551   gcc_assert (insn_operand_matches (icode, 1, x));
4552   gcc_assert (insn_operand_matches (icode, 2, y));
4553
4554   return GEN_FCN (icode) (x, x, y);
4555 }
4556
4557 /* Generate and return an insn body to subtract r1 and c,
4558    storing the result in r0.  */
4559
4560 rtx_insn *
4561 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4562 {
4563   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4564
4565   if (icode == CODE_FOR_nothing
4566       || !insn_operand_matches (icode, 0, r0)
4567       || !insn_operand_matches (icode, 1, r1)
4568       || !insn_operand_matches (icode, 2, c))
4569     return NULL;
4570
4571   return GEN_FCN (icode) (r0, r1, c);
4572 }
4573
4574 int
4575 have_sub2_insn (rtx x, rtx y)
4576 {
4577   enum insn_code icode;
4578
4579   gcc_assert (GET_MODE (x) != VOIDmode);
4580
4581   icode = optab_handler (sub_optab, GET_MODE (x));
4582
4583   if (icode == CODE_FOR_nothing)
4584     return 0;
4585
4586   if (!insn_operand_matches (icode, 0, x)
4587       || !insn_operand_matches (icode, 1, x)
4588       || !insn_operand_matches (icode, 2, y))
4589     return 0;
4590
4591   return 1;
4592 }
4593 \f
4594 /* Generate the body of an insn to extend Y (with mode MFROM)
4595    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4596
4597 rtx_insn *
4598 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4599                  machine_mode mfrom, int unsignedp)
4600 {
4601   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4602   return GEN_FCN (icode) (x, y);
4603 }
4604 \f
4605 /* Generate code to convert FROM to floating point
4606    and store in TO.  FROM must be fixed point and not VOIDmode.
4607    UNSIGNEDP nonzero means regard FROM as unsigned.
4608    Normally this is done by correcting the final value
4609    if it is negative.  */
4610
4611 void
4612 expand_float (rtx to, rtx from, int unsignedp)
4613 {
4614   enum insn_code icode;
4615   rtx target = to;
4616   machine_mode fmode, imode;
4617   bool can_do_signed = false;
4618
4619   /* Crash now, because we won't be able to decide which mode to use.  */
4620   gcc_assert (GET_MODE (from) != VOIDmode);
4621
4622   /* Look for an insn to do the conversion.  Do it in the specified
4623      modes if possible; otherwise convert either input, output or both to
4624      wider mode.  If the integer mode is wider than the mode of FROM,
4625      we can do the conversion signed even if the input is unsigned.  */
4626
4627   FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4628     FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4629       {
4630         int doing_unsigned = unsignedp;
4631
4632         if (fmode != GET_MODE (to)
4633             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
4634           continue;
4635
4636         icode = can_float_p (fmode, imode, unsignedp);
4637         if (icode == CODE_FOR_nothing && unsignedp)
4638           {
4639             enum insn_code scode = can_float_p (fmode, imode, 0);
4640             if (scode != CODE_FOR_nothing)
4641               can_do_signed = true;
4642             if (imode != GET_MODE (from))
4643               icode = scode, doing_unsigned = 0;
4644           }
4645
4646         if (icode != CODE_FOR_nothing)
4647           {
4648             if (imode != GET_MODE (from))
4649               from = convert_to_mode (imode, from, unsignedp);
4650
4651             if (fmode != GET_MODE (to))
4652               target = gen_reg_rtx (fmode);
4653
4654             emit_unop_insn (icode, target, from,
4655                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4656
4657             if (target != to)
4658               convert_move (to, target, 0);
4659             return;
4660           }
4661       }
4662
4663   /* Unsigned integer, and no way to convert directly.  Convert as signed,
4664      then unconditionally adjust the result.  */
4665   if (unsignedp && can_do_signed)
4666     {
4667       rtx_code_label *label = gen_label_rtx ();
4668       rtx temp;
4669       REAL_VALUE_TYPE offset;
4670
4671       /* Look for a usable floating mode FMODE wider than the source and at
4672          least as wide as the target.  Using FMODE will avoid rounding woes
4673          with unsigned values greater than the signed maximum value.  */
4674
4675       FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4676         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
4677             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
4678           break;
4679
4680       if (fmode == VOIDmode)
4681         {
4682           /* There is no such mode.  Pretend the target is wide enough.  */
4683           fmode = GET_MODE (to);
4684
4685           /* Avoid double-rounding when TO is narrower than FROM.  */
4686           if ((significand_size (fmode) + 1)
4687               < GET_MODE_PRECISION (GET_MODE (from)))
4688             {
4689               rtx temp1;
4690               rtx_code_label *neglabel = gen_label_rtx ();
4691
4692               /* Don't use TARGET if it isn't a register, is a hard register,
4693                  or is the wrong mode.  */
4694               if (!REG_P (target)
4695                   || REGNO (target) < FIRST_PSEUDO_REGISTER
4696                   || GET_MODE (target) != fmode)
4697                 target = gen_reg_rtx (fmode);
4698
4699               imode = GET_MODE (from);
4700               do_pending_stack_adjust ();
4701
4702               /* Test whether the sign bit is set.  */
4703               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4704                                        0, neglabel);
4705
4706               /* The sign bit is not set.  Convert as signed.  */
4707               expand_float (target, from, 0);
4708               emit_jump_insn (targetm.gen_jump (label));
4709               emit_barrier ();
4710
4711               /* The sign bit is set.
4712                  Convert to a usable (positive signed) value by shifting right
4713                  one bit, while remembering if a nonzero bit was shifted
4714                  out; i.e., compute  (from & 1) | (from >> 1).  */
4715
4716               emit_label (neglabel);
4717               temp = expand_binop (imode, and_optab, from, const1_rtx,
4718                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
4719               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4720               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4721                                    OPTAB_LIB_WIDEN);
4722               expand_float (target, temp, 0);
4723
4724               /* Multiply by 2 to undo the shift above.  */
4725               temp = expand_binop (fmode, add_optab, target, target,
4726                                    target, 0, OPTAB_LIB_WIDEN);
4727               if (temp != target)
4728                 emit_move_insn (target, temp);
4729
4730               do_pending_stack_adjust ();
4731               emit_label (label);
4732               goto done;
4733             }
4734         }
4735
4736       /* If we are about to do some arithmetic to correct for an
4737          unsigned operand, do it in a pseudo-register.  */
4738
4739       if (GET_MODE (to) != fmode
4740           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4741         target = gen_reg_rtx (fmode);
4742
4743       /* Convert as signed integer to floating.  */
4744       expand_float (target, from, 0);
4745
4746       /* If FROM is negative (and therefore TO is negative),
4747          correct its value by 2**bitwidth.  */
4748
4749       do_pending_stack_adjust ();
4750       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
4751                                0, label);
4752
4753
4754       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
4755       temp = expand_binop (fmode, add_optab, target,
4756                            const_double_from_real_value (offset, fmode),
4757                            target, 0, OPTAB_LIB_WIDEN);
4758       if (temp != target)
4759         emit_move_insn (target, temp);
4760
4761       do_pending_stack_adjust ();
4762       emit_label (label);
4763       goto done;
4764     }
4765
4766   /* No hardware instruction available; call a library routine.  */
4767     {
4768       rtx libfunc;
4769       rtx_insn *insns;
4770       rtx value;
4771       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4772
4773       if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_PRECISION (SImode))
4774         from = convert_to_mode (SImode, from, unsignedp);
4775
4776       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4777       gcc_assert (libfunc);
4778
4779       start_sequence ();
4780
4781       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4782                                        GET_MODE (to), 1, from,
4783                                        GET_MODE (from));
4784       insns = get_insns ();
4785       end_sequence ();
4786
4787       emit_libcall_block (insns, target, value,
4788                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4789                                          GET_MODE (to), from));
4790     }
4791
4792  done:
4793
4794   /* Copy result to requested destination
4795      if we have been computing in a temp location.  */
4796
4797   if (target != to)
4798     {
4799       if (GET_MODE (target) == GET_MODE (to))
4800         emit_move_insn (to, target);
4801       else
4802         convert_move (to, target, 0);
4803     }
4804 }
4805 \f
4806 /* Generate code to convert FROM to fixed point and store in TO.  FROM
4807    must be floating point.  */
4808
4809 void
4810 expand_fix (rtx to, rtx from, int unsignedp)
4811 {
4812   enum insn_code icode;
4813   rtx target = to;
4814   machine_mode fmode, imode;
4815   bool must_trunc = false;
4816
4817   /* We first try to find a pair of modes, one real and one integer, at
4818      least as wide as FROM and TO, respectively, in which we can open-code
4819      this conversion.  If the integer mode is wider than the mode of TO,
4820      we can do the conversion either signed or unsigned.  */
4821
4822   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4823     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4824       {
4825         int doing_unsigned = unsignedp;
4826
4827         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4828         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4829           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4830
4831         if (icode != CODE_FOR_nothing)
4832           {
4833             rtx_insn *last = get_last_insn ();
4834             if (fmode != GET_MODE (from))
4835               from = convert_to_mode (fmode, from, 0);
4836
4837             if (must_trunc)
4838               {
4839                 rtx temp = gen_reg_rtx (GET_MODE (from));
4840                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4841                                     temp, 0);
4842               }
4843
4844             if (imode != GET_MODE (to))
4845               target = gen_reg_rtx (imode);
4846
4847             if (maybe_emit_unop_insn (icode, target, from,
4848                                       doing_unsigned ? UNSIGNED_FIX : FIX))
4849               {
4850                 if (target != to)
4851                   convert_move (to, target, unsignedp);
4852                 return;
4853               }
4854             delete_insns_since (last);
4855           }
4856       }
4857
4858   /* For an unsigned conversion, there is one more way to do it.
4859      If we have a signed conversion, we generate code that compares
4860      the real value to the largest representable positive number.  If if
4861      is smaller, the conversion is done normally.  Otherwise, subtract
4862      one plus the highest signed number, convert, and add it back.
4863
4864      We only need to check all real modes, since we know we didn't find
4865      anything with a wider integer mode.
4866
4867      This code used to extend FP value into mode wider than the destination.
4868      This is needed for decimal float modes which cannot accurately
4869      represent one plus the highest signed number of the same size, but
4870      not for binary modes.  Consider, for instance conversion from SFmode
4871      into DImode.
4872
4873      The hot path through the code is dealing with inputs smaller than 2^63
4874      and doing just the conversion, so there is no bits to lose.
4875
4876      In the other path we know the value is positive in the range 2^63..2^64-1
4877      inclusive.  (as for other input overflow happens and result is undefined)
4878      So we know that the most important bit set in mantissa corresponds to
4879      2^63.  The subtraction of 2^63 should not generate any rounding as it
4880      simply clears out that bit.  The rest is trivial.  */
4881
4882   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
4883     FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4884       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
4885           && (!DECIMAL_FLOAT_MODE_P (fmode)
4886               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
4887         {
4888           int bitsize;
4889           REAL_VALUE_TYPE offset;
4890           rtx limit;
4891           rtx_code_label *lab1, *lab2;
4892           rtx_insn *insn;
4893
4894           bitsize = GET_MODE_PRECISION (GET_MODE (to));
4895           real_2expN (&offset, bitsize - 1, fmode);
4896           limit = const_double_from_real_value (offset, fmode);
4897           lab1 = gen_label_rtx ();
4898           lab2 = gen_label_rtx ();
4899
4900           if (fmode != GET_MODE (from))
4901             from = convert_to_mode (fmode, from, 0);
4902
4903           /* See if we need to do the subtraction.  */
4904           do_pending_stack_adjust ();
4905           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
4906                                    0, lab1);
4907
4908           /* If not, do the signed "fix" and branch around fixup code.  */
4909           expand_fix (to, from, 0);
4910           emit_jump_insn (targetm.gen_jump (lab2));
4911           emit_barrier ();
4912
4913           /* Otherwise, subtract 2**(N-1), convert to signed number,
4914              then add 2**(N-1).  Do the addition using XOR since this
4915              will often generate better code.  */
4916           emit_label (lab1);
4917           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
4918                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
4919           expand_fix (to, target, 0);
4920           target = expand_binop (GET_MODE (to), xor_optab, to,
4921                                  gen_int_mode
4922                                  (HOST_WIDE_INT_1 << (bitsize - 1),
4923                                   GET_MODE (to)),
4924                                  to, 1, OPTAB_LIB_WIDEN);
4925
4926           if (target != to)
4927             emit_move_insn (to, target);
4928
4929           emit_label (lab2);
4930
4931           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
4932             {
4933               /* Make a place for a REG_NOTE and add it.  */
4934               insn = emit_move_insn (to, to);
4935               set_dst_reg_note (insn, REG_EQUAL,
4936                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
4937                                                copy_rtx (from)),
4938                                 to);
4939             }
4940
4941           return;
4942         }
4943
4944   /* We can't do it with an insn, so use a library call.  But first ensure
4945      that the mode of TO is at least as wide as SImode, since those are the
4946      only library calls we know about.  */
4947
4948   if (GET_MODE_PRECISION (GET_MODE (to)) < GET_MODE_PRECISION (SImode))
4949     {
4950       target = gen_reg_rtx (SImode);
4951
4952       expand_fix (target, from, unsignedp);
4953     }
4954   else
4955     {
4956       rtx_insn *insns;
4957       rtx value;
4958       rtx libfunc;
4959
4960       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
4961       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4962       gcc_assert (libfunc);
4963
4964       start_sequence ();
4965
4966       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4967                                        GET_MODE (to), 1, from,
4968                                        GET_MODE (from));
4969       insns = get_insns ();
4970       end_sequence ();
4971
4972       emit_libcall_block (insns, target, value,
4973                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
4974                                          GET_MODE (to), from));
4975     }
4976
4977   if (target != to)
4978     {
4979       if (GET_MODE (to) == GET_MODE (target))
4980         emit_move_insn (to, target);
4981       else
4982         convert_move (to, target, 0);
4983     }
4984 }
4985
4986
4987 /* Promote integer arguments for a libcall if necessary.
4988    emit_library_call_value cannot do the promotion because it does not
4989    know if it should do a signed or unsigned promotion.  This is because
4990    there are no tree types defined for libcalls.  */
4991
4992 static rtx
4993 prepare_libcall_arg (rtx arg, int uintp)
4994 {
4995   machine_mode mode = GET_MODE (arg);
4996   machine_mode arg_mode;
4997   if (SCALAR_INT_MODE_P (mode))
4998     {
4999       /*  If we need to promote the integer function argument we need to do
5000           it here instead of inside emit_library_call_value because in
5001           emit_library_call_value we don't know if we should do a signed or
5002           unsigned promotion.  */
5003
5004       int unsigned_p = 0;
5005       arg_mode = promote_function_mode (NULL_TREE, mode,
5006                                         &unsigned_p, NULL_TREE, 0);
5007       if (arg_mode != mode)
5008         return convert_to_mode (arg_mode, arg, uintp);
5009     }
5010     return arg;
5011 }
5012
5013 /* Generate code to convert FROM or TO a fixed-point.
5014    If UINTP is true, either TO or FROM is an unsigned integer.
5015    If SATP is true, we need to saturate the result.  */
5016
5017 void
5018 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5019 {
5020   machine_mode to_mode = GET_MODE (to);
5021   machine_mode from_mode = GET_MODE (from);
5022   convert_optab tab;
5023   enum rtx_code this_code;
5024   enum insn_code code;
5025   rtx_insn *insns;
5026   rtx value;
5027   rtx libfunc;
5028
5029   if (to_mode == from_mode)
5030     {
5031       emit_move_insn (to, from);
5032       return;
5033     }
5034
5035   if (uintp)
5036     {
5037       tab = satp ? satfractuns_optab : fractuns_optab;
5038       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5039     }
5040   else
5041     {
5042       tab = satp ? satfract_optab : fract_optab;
5043       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5044     }
5045   code = convert_optab_handler (tab, to_mode, from_mode);
5046   if (code != CODE_FOR_nothing)
5047     {
5048       emit_unop_insn (code, to, from, this_code);
5049       return;
5050     }
5051
5052   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5053   gcc_assert (libfunc);
5054
5055   from = prepare_libcall_arg (from, uintp);
5056   from_mode = GET_MODE (from);
5057
5058   start_sequence ();
5059   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5060                                    1, from, from_mode);
5061   insns = get_insns ();
5062   end_sequence ();
5063
5064   emit_libcall_block (insns, to, value,
5065                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5066 }
5067
5068 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5069    must be floating point, TO must be signed.  Use the conversion optab
5070    TAB to do the conversion.  */
5071
5072 bool
5073 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5074 {
5075   enum insn_code icode;
5076   rtx target = to;
5077   machine_mode fmode, imode;
5078
5079   /* We first try to find a pair of modes, one real and one integer, at
5080      least as wide as FROM and TO, respectively, in which we can open-code
5081      this conversion.  If the integer mode is wider than the mode of TO,
5082      we can do the conversion either signed or unsigned.  */
5083
5084   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5085     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5086       {
5087         icode = convert_optab_handler (tab, imode, fmode);
5088         if (icode != CODE_FOR_nothing)
5089           {
5090             rtx_insn *last = get_last_insn ();
5091             if (fmode != GET_MODE (from))
5092               from = convert_to_mode (fmode, from, 0);
5093
5094             if (imode != GET_MODE (to))
5095               target = gen_reg_rtx (imode);
5096
5097             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5098               {
5099                 delete_insns_since (last);
5100                 continue;
5101               }
5102             if (target != to)
5103               convert_move (to, target, 0);
5104             return true;
5105           }
5106       }
5107
5108   return false;
5109 }
5110 \f
5111 /* Report whether we have an instruction to perform the operation
5112    specified by CODE on operands of mode MODE.  */
5113 int
5114 have_insn_for (enum rtx_code code, machine_mode mode)
5115 {
5116   return (code_to_optab (code)
5117           && (optab_handler (code_to_optab (code), mode)
5118               != CODE_FOR_nothing));
5119 }
5120
5121 /* Print information about the current contents of the optabs on
5122    STDERR.  */
5123
5124 DEBUG_FUNCTION void
5125 debug_optab_libfuncs (void)
5126 {
5127   int i, j, k;
5128
5129   /* Dump the arithmetic optabs.  */
5130   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5131     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5132       {
5133         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5134         if (l)
5135           {
5136             gcc_assert (GET_CODE (l) == SYMBOL_REF);
5137             fprintf (stderr, "%s\t%s:\t%s\n",
5138                      GET_RTX_NAME (optab_to_code ((optab) i)),
5139                      GET_MODE_NAME (j),
5140                      XSTR (l, 0));
5141           }
5142       }
5143
5144   /* Dump the conversion optabs.  */
5145   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5146     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5147       for (k = 0; k < NUM_MACHINE_MODES; ++k)
5148         {
5149           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5150                                          (machine_mode) k);
5151           if (l)
5152             {
5153               gcc_assert (GET_CODE (l) == SYMBOL_REF);
5154               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5155                        GET_RTX_NAME (optab_to_code ((optab) i)),
5156                        GET_MODE_NAME (j),
5157                        GET_MODE_NAME (k),
5158                        XSTR (l, 0));
5159             }
5160         }
5161 }
5162
5163 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5164    CODE.  Return 0 on failure.  */
5165
5166 rtx_insn *
5167 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5168 {
5169   machine_mode mode = GET_MODE (op1);
5170   enum insn_code icode;
5171   rtx_insn *insn;
5172   rtx trap_rtx;
5173
5174   if (mode == VOIDmode)
5175     return 0;
5176
5177   icode = optab_handler (ctrap_optab, mode);
5178   if (icode == CODE_FOR_nothing)
5179     return 0;
5180
5181   /* Some targets only accept a zero trap code.  */
5182   if (!insn_operand_matches (icode, 3, tcode))
5183     return 0;
5184
5185   do_pending_stack_adjust ();
5186   start_sequence ();
5187   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5188                     &trap_rtx, &mode);
5189   if (!trap_rtx)
5190     insn = NULL;
5191   else
5192     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5193                             tcode);
5194
5195   /* If that failed, then give up.  */
5196   if (insn == 0)
5197     {
5198       end_sequence ();
5199       return 0;
5200     }
5201
5202   emit_insn (insn);
5203   insn = get_insns ();
5204   end_sequence ();
5205   return insn;
5206 }
5207
5208 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5209    or unsigned operation code.  */
5210
5211 enum rtx_code
5212 get_rtx_code (enum tree_code tcode, bool unsignedp)
5213 {
5214   enum rtx_code code;
5215   switch (tcode)
5216     {
5217     case EQ_EXPR:
5218       code = EQ;
5219       break;
5220     case NE_EXPR:
5221       code = NE;
5222       break;
5223     case LT_EXPR:
5224       code = unsignedp ? LTU : LT;
5225       break;
5226     case LE_EXPR:
5227       code = unsignedp ? LEU : LE;
5228       break;
5229     case GT_EXPR:
5230       code = unsignedp ? GTU : GT;
5231       break;
5232     case GE_EXPR:
5233       code = unsignedp ? GEU : GE;
5234       break;
5235
5236     case UNORDERED_EXPR:
5237       code = UNORDERED;
5238       break;
5239     case ORDERED_EXPR:
5240       code = ORDERED;
5241       break;
5242     case UNLT_EXPR:
5243       code = UNLT;
5244       break;
5245     case UNLE_EXPR:
5246       code = UNLE;
5247       break;
5248     case UNGT_EXPR:
5249       code = UNGT;
5250       break;
5251     case UNGE_EXPR:
5252       code = UNGE;
5253       break;
5254     case UNEQ_EXPR:
5255       code = UNEQ;
5256       break;
5257     case LTGT_EXPR:
5258       code = LTGT;
5259       break;
5260
5261     case BIT_AND_EXPR:
5262       code = AND;
5263       break;
5264
5265     case BIT_IOR_EXPR:
5266       code = IOR;
5267       break;
5268
5269     default:
5270       gcc_unreachable ();
5271     }
5272   return code;
5273 }
5274
5275 /* Return a comparison rtx of mode CMP_MODE for COND.  Use UNSIGNEDP to
5276    select signed or unsigned operators.  OPNO holds the index of the
5277    first comparison operand for insn ICODE.  Do not generate the
5278    compare instruction itself.  */
5279
5280 static rtx
5281 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5282                     tree t_op0, tree t_op1, bool unsignedp,
5283                     enum insn_code icode, unsigned int opno)
5284 {
5285   struct expand_operand ops[2];
5286   rtx rtx_op0, rtx_op1;
5287   machine_mode m0, m1;
5288   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5289
5290   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5291
5292   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
5293      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5294      cases, use the original mode.  */
5295   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5296                          EXPAND_STACK_PARM);
5297   m0 = GET_MODE (rtx_op0);
5298   if (m0 == VOIDmode)
5299     m0 = TYPE_MODE (TREE_TYPE (t_op0));
5300
5301   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5302                          EXPAND_STACK_PARM);
5303   m1 = GET_MODE (rtx_op1);
5304   if (m1 == VOIDmode)
5305     m1 = TYPE_MODE (TREE_TYPE (t_op1));
5306
5307   create_input_operand (&ops[0], rtx_op0, m0);
5308   create_input_operand (&ops[1], rtx_op1, m1);
5309   if (!maybe_legitimize_operands (icode, opno, 2, ops))
5310     gcc_unreachable ();
5311   return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5312 }
5313
5314 /* Checks if vec_perm mask SEL is a constant equivalent to a shift of the first
5315    vec_perm operand, assuming the second operand is a constant vector of zeroes.
5316    Return the shift distance in bits if so, or NULL_RTX if the vec_perm is not a
5317    shift.  */
5318 static rtx
5319 shift_amt_for_vec_perm_mask (rtx sel)
5320 {
5321   unsigned int i, first, nelt = GET_MODE_NUNITS (GET_MODE (sel));
5322   unsigned int bitsize = GET_MODE_UNIT_BITSIZE (GET_MODE (sel));
5323
5324   if (GET_CODE (sel) != CONST_VECTOR)
5325     return NULL_RTX;
5326
5327   first = INTVAL (CONST_VECTOR_ELT (sel, 0));
5328   if (first >= nelt)
5329     return NULL_RTX;
5330   for (i = 1; i < nelt; i++)
5331     {
5332       int idx = INTVAL (CONST_VECTOR_ELT (sel, i));
5333       unsigned int expected = i + first;
5334       /* Indices into the second vector are all equivalent.  */
5335       if (idx < 0 || (MIN (nelt, (unsigned) idx) != MIN (nelt, expected)))
5336         return NULL_RTX;
5337     }
5338
5339   return GEN_INT (first * bitsize);
5340 }
5341
5342 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
5343
5344 static rtx
5345 expand_vec_perm_1 (enum insn_code icode, rtx target,
5346                    rtx v0, rtx v1, rtx sel)
5347 {
5348   machine_mode tmode = GET_MODE (target);
5349   machine_mode smode = GET_MODE (sel);
5350   struct expand_operand ops[4];
5351
5352   create_output_operand (&ops[0], target, tmode);
5353   create_input_operand (&ops[3], sel, smode);
5354
5355   /* Make an effort to preserve v0 == v1.  The target expander is able to
5356      rely on this to determine if we're permuting a single input operand.  */
5357   if (rtx_equal_p (v0, v1))
5358     {
5359       if (!insn_operand_matches (icode, 1, v0))
5360         v0 = force_reg (tmode, v0);
5361       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5362       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5363
5364       create_fixed_operand (&ops[1], v0);
5365       create_fixed_operand (&ops[2], v0);
5366     }
5367   else
5368     {
5369       create_input_operand (&ops[1], v0, tmode);
5370       create_input_operand (&ops[2], v1, tmode);
5371     }
5372
5373   if (maybe_expand_insn (icode, 4, ops))
5374     return ops[0].value;
5375   return NULL_RTX;
5376 }
5377
5378 /* Generate instructions for vec_perm optab given its mode
5379    and three operands.  */
5380
5381 rtx
5382 expand_vec_perm (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5383 {
5384   enum insn_code icode;
5385   machine_mode qimode;
5386   unsigned int i, w, e, u;
5387   rtx tmp, sel_qi = NULL;
5388   rtvec vec;
5389
5390   if (!target || GET_MODE (target) != mode)
5391     target = gen_reg_rtx (mode);
5392
5393   w = GET_MODE_SIZE (mode);
5394   e = GET_MODE_NUNITS (mode);
5395   u = GET_MODE_UNIT_SIZE (mode);
5396
5397   /* Set QIMODE to a different vector mode with byte elements.
5398      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
5399   qimode = VOIDmode;
5400   if (GET_MODE_INNER (mode) != QImode)
5401     {
5402       qimode = mode_for_vector (QImode, w);
5403       if (!VECTOR_MODE_P (qimode))
5404         qimode = VOIDmode;
5405     }
5406
5407   /* If the input is a constant, expand it specially.  */
5408   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
5409   if (GET_CODE (sel) == CONST_VECTOR)
5410     {
5411       /* See if this can be handled with a vec_shr.  We only do this if the
5412          second vector is all zeroes.  */
5413       enum insn_code shift_code = optab_handler (vec_shr_optab, mode);
5414       enum insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5415                                       ? optab_handler (vec_shr_optab, qimode)
5416                                       : CODE_FOR_nothing);
5417       rtx shift_amt = NULL_RTX;
5418       if (v1 == CONST0_RTX (GET_MODE (v1))
5419           && (shift_code != CODE_FOR_nothing
5420               || shift_code_qi != CODE_FOR_nothing))
5421         {
5422           shift_amt = shift_amt_for_vec_perm_mask (sel);
5423           if (shift_amt)
5424             {
5425               struct expand_operand ops[3];
5426               if (shift_code != CODE_FOR_nothing)
5427                 {
5428                   create_output_operand (&ops[0], target, mode);
5429                   create_input_operand (&ops[1], v0, mode);
5430                   create_convert_operand_from_type (&ops[2], shift_amt,
5431                                                     sizetype);
5432                   if (maybe_expand_insn (shift_code, 3, ops))
5433                     return ops[0].value;
5434                 }
5435               if (shift_code_qi != CODE_FOR_nothing)
5436                 {
5437                   tmp = gen_reg_rtx (qimode);
5438                   create_output_operand (&ops[0], tmp, qimode);
5439                   create_input_operand (&ops[1], gen_lowpart (qimode, v0),
5440                                         qimode);
5441                   create_convert_operand_from_type (&ops[2], shift_amt,
5442                                                     sizetype);
5443                   if (maybe_expand_insn (shift_code_qi, 3, ops))
5444                     return gen_lowpart (mode, ops[0].value);
5445                 }
5446             }
5447         }
5448
5449       icode = direct_optab_handler (vec_perm_const_optab, mode);
5450       if (icode != CODE_FOR_nothing)
5451         {
5452           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5453           if (tmp)
5454             return tmp;
5455         }
5456
5457       /* Fall back to a constant byte-based permutation.  */
5458       if (qimode != VOIDmode)
5459         {
5460           vec = rtvec_alloc (w);
5461           for (i = 0; i < e; ++i)
5462             {
5463               unsigned int j, this_e;
5464
5465               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
5466               this_e &= 2 * e - 1;
5467               this_e *= u;
5468
5469               for (j = 0; j < u; ++j)
5470                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
5471             }
5472           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
5473
5474           icode = direct_optab_handler (vec_perm_const_optab, qimode);
5475           if (icode != CODE_FOR_nothing)
5476             {
5477               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5478               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5479                                        gen_lowpart (qimode, v1), sel_qi);
5480               if (tmp)
5481                 return gen_lowpart (mode, tmp);
5482             }
5483         }
5484     }
5485
5486   /* Otherwise expand as a fully variable permuation.  */
5487   icode = direct_optab_handler (vec_perm_optab, mode);
5488   if (icode != CODE_FOR_nothing)
5489     {
5490       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5491       if (tmp)
5492         return tmp;
5493     }
5494
5495   /* As a special case to aid several targets, lower the element-based
5496      permutation to a byte-based permutation and try again.  */
5497   if (qimode == VOIDmode)
5498     return NULL_RTX;
5499   icode = direct_optab_handler (vec_perm_optab, qimode);
5500   if (icode == CODE_FOR_nothing)
5501     return NULL_RTX;
5502
5503   if (sel_qi == NULL)
5504     {
5505       /* Multiply each element by its byte size.  */
5506       machine_mode selmode = GET_MODE (sel);
5507       if (u == 2)
5508         sel = expand_simple_binop (selmode, PLUS, sel, sel,
5509                                    NULL, 0, OPTAB_DIRECT);
5510       else
5511         sel = expand_simple_binop (selmode, ASHIFT, sel,
5512                                    GEN_INT (exact_log2 (u)),
5513                                    NULL, 0, OPTAB_DIRECT);
5514       gcc_assert (sel != NULL);
5515
5516       /* Broadcast the low byte each element into each of its bytes.  */
5517       vec = rtvec_alloc (w);
5518       for (i = 0; i < w; ++i)
5519         {
5520           int this_e = i / u * u;
5521           if (BYTES_BIG_ENDIAN)
5522             this_e += u - 1;
5523           RTVEC_ELT (vec, i) = GEN_INT (this_e);
5524         }
5525       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5526       sel = gen_lowpart (qimode, sel);
5527       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
5528       gcc_assert (sel != NULL);
5529
5530       /* Add the byte offset to each byte element.  */
5531       /* Note that the definition of the indicies here is memory ordering,
5532          so there should be no difference between big and little endian.  */
5533       vec = rtvec_alloc (w);
5534       for (i = 0; i < w; ++i)
5535         RTVEC_ELT (vec, i) = GEN_INT (i % u);
5536       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5537       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5538                                     sel, 0, OPTAB_DIRECT);
5539       gcc_assert (sel_qi != NULL);
5540     }
5541
5542   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5543   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5544                            gen_lowpart (qimode, v1), sel_qi);
5545   if (tmp)
5546     tmp = gen_lowpart (mode, tmp);
5547   return tmp;
5548 }
5549
5550 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5551    three operands.  */
5552
5553 rtx
5554 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5555                            rtx target)
5556 {
5557   struct expand_operand ops[4];
5558   machine_mode mode = TYPE_MODE (vec_cond_type);
5559   machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5560   enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5561   rtx mask, rtx_op1, rtx_op2;
5562
5563   if (icode == CODE_FOR_nothing)
5564     return 0;
5565
5566   mask = expand_normal (op0);
5567   rtx_op1 = expand_normal (op1);
5568   rtx_op2 = expand_normal (op2);
5569
5570   mask = force_reg (mask_mode, mask);
5571   rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5572
5573   create_output_operand (&ops[0], target, mode);
5574   create_input_operand (&ops[1], rtx_op1, mode);
5575   create_input_operand (&ops[2], rtx_op2, mode);
5576   create_input_operand (&ops[3], mask, mask_mode);
5577   expand_insn (icode, 4, ops);
5578
5579   return ops[0].value;
5580 }
5581
5582 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5583    three operands.  */
5584
5585 rtx
5586 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5587                       rtx target)
5588 {
5589   struct expand_operand ops[6];
5590   enum insn_code icode;
5591   rtx comparison, rtx_op1, rtx_op2;
5592   machine_mode mode = TYPE_MODE (vec_cond_type);
5593   machine_mode cmp_op_mode;
5594   bool unsignedp;
5595   tree op0a, op0b;
5596   enum tree_code tcode;
5597
5598   if (COMPARISON_CLASS_P (op0))
5599     {
5600       op0a = TREE_OPERAND (op0, 0);
5601       op0b = TREE_OPERAND (op0, 1);
5602       tcode = TREE_CODE (op0);
5603     }
5604   else
5605     {
5606       gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5607       if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5608           != CODE_FOR_nothing)
5609         return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5610                                           op2, target);
5611       /* Fake op0 < 0.  */
5612       else
5613         {
5614           gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5615                       == MODE_VECTOR_INT);
5616           op0a = op0;
5617           op0b = build_zero_cst (TREE_TYPE (op0));
5618           tcode = LT_EXPR;
5619         }
5620     }
5621   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5622   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5623
5624
5625   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
5626               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
5627
5628   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5629   if (icode == CODE_FOR_nothing)
5630     {
5631       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5632         icode = get_vcond_eq_icode (mode, cmp_op_mode);
5633       if (icode == CODE_FOR_nothing)
5634         return 0;
5635     }
5636
5637   comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5638                                    icode, 4);
5639   rtx_op1 = expand_normal (op1);
5640   rtx_op2 = expand_normal (op2);
5641
5642   create_output_operand (&ops[0], target, mode);
5643   create_input_operand (&ops[1], rtx_op1, mode);
5644   create_input_operand (&ops[2], rtx_op2, mode);
5645   create_fixed_operand (&ops[3], comparison);
5646   create_fixed_operand (&ops[4], XEXP (comparison, 0));
5647   create_fixed_operand (&ops[5], XEXP (comparison, 1));
5648   expand_insn (icode, 6, ops);
5649   return ops[0].value;
5650 }
5651
5652 /* Generate insns for a vector comparison into a mask.  */
5653
5654 rtx
5655 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5656 {
5657   struct expand_operand ops[4];
5658   enum insn_code icode;
5659   rtx comparison;
5660   machine_mode mask_mode = TYPE_MODE (type);
5661   machine_mode vmode;
5662   bool unsignedp;
5663   tree op0a, op0b;
5664   enum tree_code tcode;
5665
5666   op0a = TREE_OPERAND (exp, 0);
5667   op0b = TREE_OPERAND (exp, 1);
5668   tcode = TREE_CODE (exp);
5669
5670   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5671   vmode = TYPE_MODE (TREE_TYPE (op0a));
5672
5673   icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5674   if (icode == CODE_FOR_nothing)
5675     {
5676       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5677         icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5678       if (icode == CODE_FOR_nothing)
5679         return 0;
5680     }
5681
5682   comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5683                                    unsignedp, icode, 2);
5684   create_output_operand (&ops[0], target, mask_mode);
5685   create_fixed_operand (&ops[1], comparison);
5686   create_fixed_operand (&ops[2], XEXP (comparison, 0));
5687   create_fixed_operand (&ops[3], XEXP (comparison, 1));
5688   expand_insn (icode, 4, ops);
5689   return ops[0].value;
5690 }
5691
5692 /* Expand a highpart multiply.  */
5693
5694 rtx
5695 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5696                       rtx target, bool uns_p)
5697 {
5698   struct expand_operand eops[3];
5699   enum insn_code icode;
5700   int method, i, nunits;
5701   machine_mode wmode;
5702   rtx m1, m2, perm;
5703   optab tab1, tab2;
5704   rtvec v;
5705
5706   method = can_mult_highpart_p (mode, uns_p);
5707   switch (method)
5708     {
5709     case 0:
5710       return NULL_RTX;
5711     case 1:
5712       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5713       return expand_binop (mode, tab1, op0, op1, target, uns_p,
5714                            OPTAB_LIB_WIDEN);
5715     case 2:
5716       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5717       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5718       break;
5719     case 3:
5720       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5721       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5722       if (BYTES_BIG_ENDIAN)
5723         std::swap (tab1, tab2);
5724       break;
5725     default:
5726       gcc_unreachable ();
5727     }
5728
5729   icode = optab_handler (tab1, mode);
5730   nunits = GET_MODE_NUNITS (mode);
5731   wmode = insn_data[icode].operand[0].mode;
5732   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
5733   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
5734
5735   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5736   create_input_operand (&eops[1], op0, mode);
5737   create_input_operand (&eops[2], op1, mode);
5738   expand_insn (icode, 3, eops);
5739   m1 = gen_lowpart (mode, eops[0].value);
5740
5741   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5742   create_input_operand (&eops[1], op0, mode);
5743   create_input_operand (&eops[2], op1, mode);
5744   expand_insn (optab_handler (tab2, mode), 3, eops);
5745   m2 = gen_lowpart (mode, eops[0].value);
5746
5747   v = rtvec_alloc (nunits);
5748   if (method == 2)
5749     {
5750       for (i = 0; i < nunits; ++i)
5751         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
5752                                     + ((i & 1) ? nunits : 0));
5753     }
5754   else
5755     {
5756       for (i = 0; i < nunits; ++i)
5757         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
5758     }
5759   perm = gen_rtx_CONST_VECTOR (mode, v);
5760
5761   return expand_vec_perm (mode, m1, m2, perm, target);
5762 }
5763 \f
5764 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5765    pattern.  */
5766
5767 static void
5768 find_cc_set (rtx x, const_rtx pat, void *data)
5769 {
5770   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5771       && GET_CODE (pat) == SET)
5772     {
5773       rtx *p_cc_reg = (rtx *) data;
5774       gcc_assert (!*p_cc_reg);
5775       *p_cc_reg = x;
5776     }
5777 }
5778
5779 /* This is a helper function for the other atomic operations.  This function
5780    emits a loop that contains SEQ that iterates until a compare-and-swap
5781    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
5782    a set of instructions that takes a value from OLD_REG as an input and
5783    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
5784    set to the current contents of MEM.  After SEQ, a compare-and-swap will
5785    attempt to update MEM with NEW_REG.  The function returns true when the
5786    loop was generated successfully.  */
5787
5788 static bool
5789 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5790 {
5791   machine_mode mode = GET_MODE (mem);
5792   rtx_code_label *label;
5793   rtx cmp_reg, success, oldval;
5794
5795   /* The loop we want to generate looks like
5796
5797         cmp_reg = mem;
5798       label:
5799         old_reg = cmp_reg;
5800         seq;
5801         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5802         if (success)
5803           goto label;
5804
5805      Note that we only do the plain load from memory once.  Subsequent
5806      iterations use the value loaded by the compare-and-swap pattern.  */
5807
5808   label = gen_label_rtx ();
5809   cmp_reg = gen_reg_rtx (mode);
5810
5811   emit_move_insn (cmp_reg, mem);
5812   emit_label (label);
5813   emit_move_insn (old_reg, cmp_reg);
5814   if (seq)
5815     emit_insn (seq);
5816
5817   success = NULL_RTX;
5818   oldval = cmp_reg;
5819   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
5820                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
5821                                        MEMMODEL_RELAXED))
5822     return false;
5823
5824   if (oldval != cmp_reg)
5825     emit_move_insn (cmp_reg, oldval);
5826
5827   /* Mark this jump predicted not taken.  */
5828   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
5829                            GET_MODE (success), 1, label,
5830                            profile_probability::guessed_never ());
5831   return true;
5832 }
5833
5834
5835 /* This function tries to emit an atomic_exchange intruction.  VAL is written
5836    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
5837    using TARGET if possible.  */
5838
5839 static rtx
5840 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
5841 {
5842   machine_mode mode = GET_MODE (mem);
5843   enum insn_code icode;
5844
5845   /* If the target supports the exchange directly, great.  */
5846   icode = direct_optab_handler (atomic_exchange_optab, mode);
5847   if (icode != CODE_FOR_nothing)
5848     {
5849       struct expand_operand ops[4];
5850
5851       create_output_operand (&ops[0], target, mode);
5852       create_fixed_operand (&ops[1], mem);
5853       create_input_operand (&ops[2], val, mode);
5854       create_integer_operand (&ops[3], model);
5855       if (maybe_expand_insn (icode, 4, ops))
5856         return ops[0].value;
5857     }
5858
5859   return NULL_RTX;
5860 }
5861
5862 /* This function tries to implement an atomic exchange operation using
5863    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
5864    The previous contents of *MEM are returned, using TARGET if possible.
5865    Since this instructionn is an acquire barrier only, stronger memory
5866    models may require additional barriers to be emitted.  */
5867
5868 static rtx
5869 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
5870                                    enum memmodel model)
5871 {
5872   machine_mode mode = GET_MODE (mem);
5873   enum insn_code icode;
5874   rtx_insn *last_insn = get_last_insn ();
5875
5876   icode = optab_handler (sync_lock_test_and_set_optab, mode);
5877
5878   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
5879      exists, and the memory model is stronger than acquire, add a release
5880      barrier before the instruction.  */
5881
5882   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
5883     expand_mem_thread_fence (model);
5884
5885   if (icode != CODE_FOR_nothing)
5886     {
5887       struct expand_operand ops[3];
5888       create_output_operand (&ops[0], target, mode);
5889       create_fixed_operand (&ops[1], mem);
5890       create_input_operand (&ops[2], val, mode);
5891       if (maybe_expand_insn (icode, 3, ops))
5892         return ops[0].value;
5893     }
5894
5895   /* If an external test-and-set libcall is provided, use that instead of
5896      any external compare-and-swap that we might get from the compare-and-
5897      swap-loop expansion later.  */
5898   if (!can_compare_and_swap_p (mode, false))
5899     {
5900       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
5901       if (libfunc != NULL)
5902         {
5903           rtx addr;
5904
5905           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
5906           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
5907                                           mode, 2, addr, ptr_mode,
5908                                           val, mode);
5909         }
5910     }
5911
5912   /* If the test_and_set can't be emitted, eliminate any barrier that might
5913      have been emitted.  */
5914   delete_insns_since (last_insn);
5915   return NULL_RTX;
5916 }
5917
5918 /* This function tries to implement an atomic exchange operation using a
5919    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
5920    *MEM are returned, using TARGET if possible.  No memory model is required
5921    since a compare_and_swap loop is seq-cst.  */
5922
5923 static rtx
5924 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
5925 {
5926   machine_mode mode = GET_MODE (mem);
5927
5928   if (can_compare_and_swap_p (mode, true))
5929     {
5930       if (!target || !register_operand (target, mode))
5931         target = gen_reg_rtx (mode);
5932       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
5933         return target;
5934     }
5935
5936   return NULL_RTX;
5937 }
5938
5939 /* This function tries to implement an atomic test-and-set operation
5940    using the atomic_test_and_set instruction pattern.  A boolean value
5941    is returned from the operation, using TARGET if possible.  */
5942
5943 static rtx
5944 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
5945 {
5946   machine_mode pat_bool_mode;
5947   struct expand_operand ops[3];
5948
5949   if (!targetm.have_atomic_test_and_set ())
5950     return NULL_RTX;
5951
5952   /* While we always get QImode from __atomic_test_and_set, we get
5953      other memory modes from __sync_lock_test_and_set.  Note that we
5954      use no endian adjustment here.  This matches the 4.6 behavior
5955      in the Sparc backend.  */
5956   enum insn_code icode = targetm.code_for_atomic_test_and_set;
5957   gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
5958   if (GET_MODE (mem) != QImode)
5959     mem = adjust_address_nv (mem, QImode, 0);
5960
5961   pat_bool_mode = insn_data[icode].operand[0].mode;
5962   create_output_operand (&ops[0], target, pat_bool_mode);
5963   create_fixed_operand (&ops[1], mem);
5964   create_integer_operand (&ops[2], model);
5965
5966   if (maybe_expand_insn (icode, 3, ops))
5967     return ops[0].value;
5968   return NULL_RTX;
5969 }
5970
5971 /* This function expands the legacy _sync_lock test_and_set operation which is
5972    generally an atomic exchange.  Some limited targets only allow the
5973    constant 1 to be stored.  This is an ACQUIRE operation.
5974
5975    TARGET is an optional place to stick the return value.
5976    MEM is where VAL is stored.  */
5977
5978 rtx
5979 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
5980 {
5981   rtx ret;
5982
5983   /* Try an atomic_exchange first.  */
5984   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
5985   if (ret)
5986     return ret;
5987
5988   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
5989                                            MEMMODEL_SYNC_ACQUIRE);
5990   if (ret)
5991     return ret;
5992
5993   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
5994   if (ret)
5995     return ret;
5996
5997   /* If there are no other options, try atomic_test_and_set if the value
5998      being stored is 1.  */
5999   if (val == const1_rtx)
6000     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6001
6002   return ret;
6003 }
6004
6005 /* This function expands the atomic test_and_set operation:
6006    atomically store a boolean TRUE into MEM and return the previous value.
6007
6008    MEMMODEL is the memory model variant to use.
6009    TARGET is an optional place to stick the return value.  */
6010
6011 rtx
6012 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6013 {
6014   machine_mode mode = GET_MODE (mem);
6015   rtx ret, trueval, subtarget;
6016
6017   ret = maybe_emit_atomic_test_and_set (target, mem, model);
6018   if (ret)
6019     return ret;
6020
6021   /* Be binary compatible with non-default settings of trueval, and different
6022      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
6023      another only has atomic-exchange.  */
6024   if (targetm.atomic_test_and_set_trueval == 1)
6025     {
6026       trueval = const1_rtx;
6027       subtarget = target ? target : gen_reg_rtx (mode);
6028     }
6029   else
6030     {
6031       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6032       subtarget = gen_reg_rtx (mode);
6033     }
6034
6035   /* Try the atomic-exchange optab...  */
6036   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6037
6038   /* ... then an atomic-compare-and-swap loop ... */
6039   if (!ret)
6040     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6041
6042   /* ... before trying the vaguely defined legacy lock_test_and_set. */
6043   if (!ret)
6044     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6045
6046   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6047      things with the value 1.  Thus we try again without trueval.  */
6048   if (!ret && targetm.atomic_test_and_set_trueval != 1)
6049     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6050
6051   /* Failing all else, assume a single threaded environment and simply
6052      perform the operation.  */
6053   if (!ret)
6054     {
6055       /* If the result is ignored skip the move to target.  */
6056       if (subtarget != const0_rtx)
6057         emit_move_insn (subtarget, mem);
6058
6059       emit_move_insn (mem, trueval);
6060       ret = subtarget;
6061     }
6062
6063   /* Recall that have to return a boolean value; rectify if trueval
6064      is not exactly one.  */
6065   if (targetm.atomic_test_and_set_trueval != 1)
6066     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6067
6068   return ret;
6069 }
6070
6071 /* This function expands the atomic exchange operation:
6072    atomically store VAL in MEM and return the previous value in MEM.
6073
6074    MEMMODEL is the memory model variant to use.
6075    TARGET is an optional place to stick the return value.  */
6076
6077 rtx
6078 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6079 {
6080   machine_mode mode = GET_MODE (mem);
6081   rtx ret;
6082
6083   /* If loads are not atomic for the required size and we are not called to
6084      provide a __sync builtin, do not do anything so that we stay consistent
6085      with atomic loads of the same size.  */
6086   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6087     return NULL_RTX;
6088
6089   ret = maybe_emit_atomic_exchange (target, mem, val, model);
6090
6091   /* Next try a compare-and-swap loop for the exchange.  */
6092   if (!ret)
6093     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6094
6095   return ret;
6096 }
6097
6098 /* This function expands the atomic compare exchange operation:
6099
6100    *PTARGET_BOOL is an optional place to store the boolean success/failure.
6101    *PTARGET_OVAL is an optional place to store the old value from memory.
6102    Both target parameters may be NULL or const0_rtx to indicate that we do
6103    not care about that return value.  Both target parameters are updated on
6104    success to the actual location of the corresponding result.
6105
6106    MEMMODEL is the memory model variant to use.
6107
6108    The return value of the function is true for success.  */
6109
6110 bool
6111 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6112                                 rtx mem, rtx expected, rtx desired,
6113                                 bool is_weak, enum memmodel succ_model,
6114                                 enum memmodel fail_model)
6115 {
6116   machine_mode mode = GET_MODE (mem);
6117   struct expand_operand ops[8];
6118   enum insn_code icode;
6119   rtx target_oval, target_bool = NULL_RTX;
6120   rtx libfunc;
6121
6122   /* If loads are not atomic for the required size and we are not called to
6123      provide a __sync builtin, do not do anything so that we stay consistent
6124      with atomic loads of the same size.  */
6125   if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6126     return false;
6127
6128   /* Load expected into a register for the compare and swap.  */
6129   if (MEM_P (expected))
6130     expected = copy_to_reg (expected);
6131
6132   /* Make sure we always have some place to put the return oldval.
6133      Further, make sure that place is distinct from the input expected,
6134      just in case we need that path down below.  */
6135   if (ptarget_oval && *ptarget_oval == const0_rtx)
6136     ptarget_oval = NULL;
6137
6138   if (ptarget_oval == NULL
6139       || (target_oval = *ptarget_oval) == NULL
6140       || reg_overlap_mentioned_p (expected, target_oval))
6141     target_oval = gen_reg_rtx (mode);
6142
6143   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6144   if (icode != CODE_FOR_nothing)
6145     {
6146       machine_mode bool_mode = insn_data[icode].operand[0].mode;
6147
6148       if (ptarget_bool && *ptarget_bool == const0_rtx)
6149         ptarget_bool = NULL;
6150
6151       /* Make sure we always have a place for the bool operand.  */
6152       if (ptarget_bool == NULL
6153           || (target_bool = *ptarget_bool) == NULL
6154           || GET_MODE (target_bool) != bool_mode)
6155         target_bool = gen_reg_rtx (bool_mode);
6156
6157       /* Emit the compare_and_swap.  */
6158       create_output_operand (&ops[0], target_bool, bool_mode);
6159       create_output_operand (&ops[1], target_oval, mode);
6160       create_fixed_operand (&ops[2], mem);
6161       create_input_operand (&ops[3], expected, mode);
6162       create_input_operand (&ops[4], desired, mode);
6163       create_integer_operand (&ops[5], is_weak);
6164       create_integer_operand (&ops[6], succ_model);
6165       create_integer_operand (&ops[7], fail_model);
6166       if (maybe_expand_insn (icode, 8, ops))
6167         {
6168           /* Return success/failure.  */
6169           target_bool = ops[0].value;
6170           target_oval = ops[1].value;
6171           goto success;
6172         }
6173     }
6174
6175   /* Otherwise fall back to the original __sync_val_compare_and_swap
6176      which is always seq-cst.  */
6177   icode = optab_handler (sync_compare_and_swap_optab, mode);
6178   if (icode != CODE_FOR_nothing)
6179     {
6180       rtx cc_reg;
6181
6182       create_output_operand (&ops[0], target_oval, mode);
6183       create_fixed_operand (&ops[1], mem);
6184       create_input_operand (&ops[2], expected, mode);
6185       create_input_operand (&ops[3], desired, mode);
6186       if (!maybe_expand_insn (icode, 4, ops))
6187         return false;
6188
6189       target_oval = ops[0].value;
6190
6191       /* If the caller isn't interested in the boolean return value,
6192          skip the computation of it.  */
6193       if (ptarget_bool == NULL)
6194         goto success;
6195
6196       /* Otherwise, work out if the compare-and-swap succeeded.  */
6197       cc_reg = NULL_RTX;
6198       if (have_insn_for (COMPARE, CCmode))
6199         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6200       if (cc_reg)
6201         {
6202           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6203                                                const0_rtx, VOIDmode, 0, 1);
6204           goto success;
6205         }
6206       goto success_bool_from_val;
6207     }
6208
6209   /* Also check for library support for __sync_val_compare_and_swap.  */
6210   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6211   if (libfunc != NULL)
6212     {
6213       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6214       rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6215                                             mode, 3, addr, ptr_mode,
6216                                             expected, mode, desired, mode);
6217       emit_move_insn (target_oval, target);
6218
6219       /* Compute the boolean return value only if requested.  */
6220       if (ptarget_bool)
6221         goto success_bool_from_val;
6222       else
6223         goto success;
6224     }
6225
6226   /* Failure.  */
6227   return false;
6228
6229  success_bool_from_val:
6230    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6231                                         expected, VOIDmode, 1, 1);
6232  success:
6233   /* Make sure that the oval output winds up where the caller asked.  */
6234   if (ptarget_oval)
6235     *ptarget_oval = target_oval;
6236   if (ptarget_bool)
6237     *ptarget_bool = target_bool;
6238   return true;
6239 }
6240
6241 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
6242
6243 static void
6244 expand_asm_memory_barrier (void)
6245 {
6246   rtx asm_op, clob;
6247
6248   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6249                                  rtvec_alloc (0), rtvec_alloc (0),
6250                                  rtvec_alloc (0), UNKNOWN_LOCATION);
6251   MEM_VOLATILE_P (asm_op) = 1;
6252
6253   clob = gen_rtx_SCRATCH (VOIDmode);
6254   clob = gen_rtx_MEM (BLKmode, clob);
6255   clob = gen_rtx_CLOBBER (VOIDmode, clob);
6256
6257   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6258 }
6259
6260 /* This routine will either emit the mem_thread_fence pattern or issue a
6261    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6262
6263 void
6264 expand_mem_thread_fence (enum memmodel model)
6265 {
6266   if (is_mm_relaxed (model))
6267     return;
6268   if (targetm.have_mem_thread_fence ())
6269     {
6270       emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6271       expand_asm_memory_barrier ();
6272     }
6273   else if (targetm.have_memory_barrier ())
6274     emit_insn (targetm.gen_memory_barrier ());
6275   else if (synchronize_libfunc != NULL_RTX)
6276     emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
6277   else
6278     expand_asm_memory_barrier ();
6279 }
6280
6281 /* This routine will either emit the mem_signal_fence pattern or issue a
6282    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6283
6284 void
6285 expand_mem_signal_fence (enum memmodel model)
6286 {
6287   if (targetm.have_mem_signal_fence ())
6288     emit_insn (targetm.gen_mem_signal_fence (GEN_INT (model)));
6289   else if (!is_mm_relaxed (model))
6290     {
6291       /* By default targets are coherent between a thread and the signal
6292          handler running on the same thread.  Thus this really becomes a
6293          compiler barrier, in that stores must not be sunk past
6294          (or raised above) a given point.  */
6295       expand_asm_memory_barrier ();
6296     }
6297 }
6298
6299 /* This function expands the atomic load operation:
6300    return the atomically loaded value in MEM.
6301
6302    MEMMODEL is the memory model variant to use.
6303    TARGET is an option place to stick the return value.  */
6304
6305 rtx
6306 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6307 {
6308   machine_mode mode = GET_MODE (mem);
6309   enum insn_code icode;
6310
6311   /* If the target supports the load directly, great.  */
6312   icode = direct_optab_handler (atomic_load_optab, mode);
6313   if (icode != CODE_FOR_nothing)
6314     {
6315       struct expand_operand ops[3];
6316
6317       create_output_operand (&ops[0], target, mode);
6318       create_fixed_operand (&ops[1], mem);
6319       create_integer_operand (&ops[2], model);
6320       if (maybe_expand_insn (icode, 3, ops))
6321         return ops[0].value;
6322     }
6323
6324   /* If the size of the object is greater than word size on this target,
6325      then we assume that a load will not be atomic.  We could try to
6326      emulate a load with a compare-and-swap operation, but the store that
6327      doing this could result in would be incorrect if this is a volatile
6328      atomic load or targetting read-only-mapped memory.  */
6329   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6330     /* If there is no atomic load, leave the library call.  */
6331     return NULL_RTX;
6332
6333   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
6334   if (!target || target == const0_rtx)
6335     target = gen_reg_rtx (mode);
6336
6337   /* For SEQ_CST, emit a barrier before the load.  */
6338   if (is_mm_seq_cst (model))
6339     expand_mem_thread_fence (model);
6340
6341   emit_move_insn (target, mem);
6342
6343   /* Emit the appropriate barrier after the load.  */
6344   expand_mem_thread_fence (model);
6345
6346   return target;
6347 }
6348
6349 /* This function expands the atomic store operation:
6350    Atomically store VAL in MEM.
6351    MEMMODEL is the memory model variant to use.
6352    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
6353    function returns const0_rtx if a pattern was emitted.  */
6354
6355 rtx
6356 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6357 {
6358   machine_mode mode = GET_MODE (mem);
6359   enum insn_code icode;
6360   struct expand_operand ops[3];
6361
6362   /* If the target supports the store directly, great.  */
6363   icode = direct_optab_handler (atomic_store_optab, mode);
6364   if (icode != CODE_FOR_nothing)
6365     {
6366       create_fixed_operand (&ops[0], mem);
6367       create_input_operand (&ops[1], val, mode);
6368       create_integer_operand (&ops[2], model);
6369       if (maybe_expand_insn (icode, 3, ops))
6370         return const0_rtx;
6371     }
6372
6373   /* If using __sync_lock_release is a viable alternative, try it.
6374      Note that this will not be set to true if we are expanding a generic
6375      __atomic_store_n.  */
6376   if (use_release)
6377     {
6378       icode = direct_optab_handler (sync_lock_release_optab, mode);
6379       if (icode != CODE_FOR_nothing)
6380         {
6381           create_fixed_operand (&ops[0], mem);
6382           create_input_operand (&ops[1], const0_rtx, mode);
6383           if (maybe_expand_insn (icode, 2, ops))
6384             {
6385               /* lock_release is only a release barrier.  */
6386               if (is_mm_seq_cst (model))
6387                 expand_mem_thread_fence (model);
6388               return const0_rtx;
6389             }
6390         }
6391     }
6392
6393   /* If the size of the object is greater than word size on this target,
6394      a default store will not be atomic.  */
6395   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6396     {
6397       /* If loads are atomic or we are called to provide a __sync builtin,
6398          we can try a atomic_exchange and throw away the result.  Otherwise,
6399          don't do anything so that we do not create an inconsistency between
6400          loads and stores.  */
6401       if (can_atomic_load_p (mode) || is_mm_sync (model))
6402         {
6403           rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6404           if (!target)
6405             target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6406                                                                 val);
6407           if (target)
6408             return const0_rtx;
6409         }
6410         return NULL_RTX;
6411     }
6412
6413   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
6414   expand_mem_thread_fence (model);
6415
6416   emit_move_insn (mem, val);
6417
6418   /* For SEQ_CST, also emit a barrier after the store.  */
6419   if (is_mm_seq_cst (model))
6420     expand_mem_thread_fence (model);
6421
6422   return const0_rtx;
6423 }
6424
6425
6426 /* Structure containing the pointers and values required to process the
6427    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
6428
6429 struct atomic_op_functions
6430 {
6431   direct_optab mem_fetch_before;
6432   direct_optab mem_fetch_after;
6433   direct_optab mem_no_result;
6434   optab fetch_before;
6435   optab fetch_after;
6436   direct_optab no_result;
6437   enum rtx_code reverse_code;
6438 };
6439
6440
6441 /* Fill in structure pointed to by OP with the various optab entries for an
6442    operation of type CODE.  */
6443
6444 static void
6445 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6446 {
6447   gcc_assert (op!= NULL);
6448
6449   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6450      in the source code during compilation, and the optab entries are not
6451      computable until runtime.  Fill in the values at runtime.  */
6452   switch (code)
6453     {
6454     case PLUS:
6455       op->mem_fetch_before = atomic_fetch_add_optab;
6456       op->mem_fetch_after = atomic_add_fetch_optab;
6457       op->mem_no_result = atomic_add_optab;
6458       op->fetch_before = sync_old_add_optab;
6459       op->fetch_after = sync_new_add_optab;
6460       op->no_result = sync_add_optab;
6461       op->reverse_code = MINUS;
6462       break;
6463     case MINUS:
6464       op->mem_fetch_before = atomic_fetch_sub_optab;
6465       op->mem_fetch_after = atomic_sub_fetch_optab;
6466       op->mem_no_result = atomic_sub_optab;
6467       op->fetch_before = sync_old_sub_optab;
6468       op->fetch_after = sync_new_sub_optab;
6469       op->no_result = sync_sub_optab;
6470       op->reverse_code = PLUS;
6471       break;
6472     case XOR:
6473       op->mem_fetch_before = atomic_fetch_xor_optab;
6474       op->mem_fetch_after = atomic_xor_fetch_optab;
6475       op->mem_no_result = atomic_xor_optab;
6476       op->fetch_before = sync_old_xor_optab;
6477       op->fetch_after = sync_new_xor_optab;
6478       op->no_result = sync_xor_optab;
6479       op->reverse_code = XOR;
6480       break;
6481     case AND:
6482       op->mem_fetch_before = atomic_fetch_and_optab;
6483       op->mem_fetch_after = atomic_and_fetch_optab;
6484       op->mem_no_result = atomic_and_optab;
6485       op->fetch_before = sync_old_and_optab;
6486       op->fetch_after = sync_new_and_optab;
6487       op->no_result = sync_and_optab;
6488       op->reverse_code = UNKNOWN;
6489       break;
6490     case IOR:
6491       op->mem_fetch_before = atomic_fetch_or_optab;
6492       op->mem_fetch_after = atomic_or_fetch_optab;
6493       op->mem_no_result = atomic_or_optab;
6494       op->fetch_before = sync_old_ior_optab;
6495       op->fetch_after = sync_new_ior_optab;
6496       op->no_result = sync_ior_optab;
6497       op->reverse_code = UNKNOWN;
6498       break;
6499     case NOT:
6500       op->mem_fetch_before = atomic_fetch_nand_optab;
6501       op->mem_fetch_after = atomic_nand_fetch_optab;
6502       op->mem_no_result = atomic_nand_optab;
6503       op->fetch_before = sync_old_nand_optab;
6504       op->fetch_after = sync_new_nand_optab;
6505       op->no_result = sync_nand_optab;
6506       op->reverse_code = UNKNOWN;
6507       break;
6508     default:
6509       gcc_unreachable ();
6510     }
6511 }
6512
6513 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
6514    using memory order MODEL.  If AFTER is true the operation needs to return
6515    the value of *MEM after the operation, otherwise the previous value.
6516    TARGET is an optional place to place the result.  The result is unused if
6517    it is const0_rtx.
6518    Return the result if there is a better sequence, otherwise NULL_RTX.  */
6519
6520 static rtx
6521 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6522                          enum memmodel model, bool after)
6523 {
6524   /* If the value is prefetched, or not used, it may be possible to replace
6525      the sequence with a native exchange operation.  */
6526   if (!after || target == const0_rtx)
6527     {
6528       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
6529       if (code == AND && val == const0_rtx)
6530         {
6531           if (target == const0_rtx)
6532             target = gen_reg_rtx (GET_MODE (mem));
6533           return maybe_emit_atomic_exchange (target, mem, val, model);
6534         }
6535
6536       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
6537       if (code == IOR && val == constm1_rtx)
6538         {
6539           if (target == const0_rtx)
6540             target = gen_reg_rtx (GET_MODE (mem));
6541           return maybe_emit_atomic_exchange (target, mem, val, model);
6542         }
6543     }
6544
6545   return NULL_RTX;
6546 }
6547
6548 /* Try to emit an instruction for a specific operation varaition.
6549    OPTAB contains the OP functions.
6550    TARGET is an optional place to return the result. const0_rtx means unused.
6551    MEM is the memory location to operate on.
6552    VAL is the value to use in the operation.
6553    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6554    MODEL is the memory model, if used.
6555    AFTER is true if the returned result is the value after the operation.  */
6556
6557 static rtx
6558 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6559                rtx val, bool use_memmodel, enum memmodel model, bool after)
6560 {
6561   machine_mode mode = GET_MODE (mem);
6562   struct expand_operand ops[4];
6563   enum insn_code icode;
6564   int op_counter = 0;
6565   int num_ops;
6566
6567   /* Check to see if there is a result returned.  */
6568   if (target == const0_rtx)
6569     {
6570       if (use_memmodel)
6571         {
6572           icode = direct_optab_handler (optab->mem_no_result, mode);
6573           create_integer_operand (&ops[2], model);
6574           num_ops = 3;
6575         }
6576       else
6577         {
6578           icode = direct_optab_handler (optab->no_result, mode);
6579           num_ops = 2;
6580         }
6581     }
6582   /* Otherwise, we need to generate a result.  */
6583   else
6584     {
6585       if (use_memmodel)
6586         {
6587           icode = direct_optab_handler (after ? optab->mem_fetch_after
6588                                         : optab->mem_fetch_before, mode);
6589           create_integer_operand (&ops[3], model);
6590           num_ops = 4;
6591         }
6592       else
6593         {
6594           icode = optab_handler (after ? optab->fetch_after
6595                                  : optab->fetch_before, mode);
6596           num_ops = 3;
6597         }
6598       create_output_operand (&ops[op_counter++], target, mode);
6599     }
6600   if (icode == CODE_FOR_nothing)
6601     return NULL_RTX;
6602
6603   create_fixed_operand (&ops[op_counter++], mem);
6604   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
6605   create_convert_operand_to (&ops[op_counter++], val, mode, true);
6606
6607   if (maybe_expand_insn (icode, num_ops, ops))
6608     return (target == const0_rtx ? const0_rtx : ops[0].value);
6609
6610   return NULL_RTX;
6611 }
6612
6613
6614 /* This function expands an atomic fetch_OP or OP_fetch operation:
6615    TARGET is an option place to stick the return value.  const0_rtx indicates
6616    the result is unused.
6617    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6618    CODE is the operation being performed (OP)
6619    MEMMODEL is the memory model variant to use.
6620    AFTER is true to return the result of the operation (OP_fetch).
6621    AFTER is false to return the value before the operation (fetch_OP).
6622
6623    This function will *only* generate instructions if there is a direct
6624    optab. No compare and swap loops or libcalls will be generated. */
6625
6626 static rtx
6627 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6628                                     enum rtx_code code, enum memmodel model,
6629                                     bool after)
6630 {
6631   machine_mode mode = GET_MODE (mem);
6632   struct atomic_op_functions optab;
6633   rtx result;
6634   bool unused_result = (target == const0_rtx);
6635
6636   get_atomic_op_for_code (&optab, code);
6637
6638   /* Check to see if there are any better instructions.  */
6639   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6640   if (result)
6641     return result;
6642
6643   /* Check for the case where the result isn't used and try those patterns.  */
6644   if (unused_result)
6645     {
6646       /* Try the memory model variant first.  */
6647       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6648       if (result)
6649         return result;
6650
6651       /* Next try the old style withuot a memory model.  */
6652       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6653       if (result)
6654         return result;
6655
6656       /* There is no no-result pattern, so try patterns with a result.  */
6657       target = NULL_RTX;
6658     }
6659
6660   /* Try the __atomic version.  */
6661   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6662   if (result)
6663     return result;
6664
6665   /* Try the older __sync version.  */
6666   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6667   if (result)
6668     return result;
6669
6670   /* If the fetch value can be calculated from the other variation of fetch,
6671      try that operation.  */
6672   if (after || unused_result || optab.reverse_code != UNKNOWN)
6673     {
6674       /* Try the __atomic version, then the older __sync version.  */
6675       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6676       if (!result)
6677         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6678
6679       if (result)
6680         {
6681           /* If the result isn't used, no need to do compensation code.  */
6682           if (unused_result)
6683             return result;
6684
6685           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
6686              Fetch_before == after REVERSE_OP val.  */
6687           if (!after)
6688             code = optab.reverse_code;
6689           if (code == NOT)
6690             {
6691               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6692                                             true, OPTAB_LIB_WIDEN);
6693               result = expand_simple_unop (mode, NOT, result, target, true);
6694             }
6695           else
6696             result = expand_simple_binop (mode, code, result, val, target,
6697                                           true, OPTAB_LIB_WIDEN);
6698           return result;
6699         }
6700     }
6701
6702   /* No direct opcode can be generated.  */
6703   return NULL_RTX;
6704 }
6705
6706
6707
6708 /* This function expands an atomic fetch_OP or OP_fetch operation:
6709    TARGET is an option place to stick the return value.  const0_rtx indicates
6710    the result is unused.
6711    atomically fetch MEM, perform the operation with VAL and return it to MEM.
6712    CODE is the operation being performed (OP)
6713    MEMMODEL is the memory model variant to use.
6714    AFTER is true to return the result of the operation (OP_fetch).
6715    AFTER is false to return the value before the operation (fetch_OP).  */
6716 rtx
6717 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6718                         enum memmodel model, bool after)
6719 {
6720   machine_mode mode = GET_MODE (mem);
6721   rtx result;
6722   bool unused_result = (target == const0_rtx);
6723
6724   /* If loads are not atomic for the required size and we are not called to
6725      provide a __sync builtin, do not do anything so that we stay consistent
6726      with atomic loads of the same size.  */
6727   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6728     return NULL_RTX;
6729
6730   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6731                                                after);
6732
6733   if (result)
6734     return result;
6735
6736   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
6737   if (code == PLUS || code == MINUS)
6738     {
6739       rtx tmp;
6740       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6741
6742       start_sequence ();
6743       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6744       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6745                                                    model, after);
6746       if (result)
6747         {
6748           /* PLUS worked so emit the insns and return.  */
6749           tmp = get_insns ();
6750           end_sequence ();
6751           emit_insn (tmp);
6752           return result;
6753         }
6754
6755       /* PLUS did not work, so throw away the negation code and continue.  */
6756       end_sequence ();
6757     }
6758
6759   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
6760   if (!can_compare_and_swap_p (mode, false))
6761     {
6762       rtx libfunc;
6763       bool fixup = false;
6764       enum rtx_code orig_code = code;
6765       struct atomic_op_functions optab;
6766
6767       get_atomic_op_for_code (&optab, code);
6768       libfunc = optab_libfunc (after ? optab.fetch_after
6769                                : optab.fetch_before, mode);
6770       if (libfunc == NULL
6771           && (after || unused_result || optab.reverse_code != UNKNOWN))
6772         {
6773           fixup = true;
6774           if (!after)
6775             code = optab.reverse_code;
6776           libfunc = optab_libfunc (after ? optab.fetch_before
6777                                    : optab.fetch_after, mode);
6778         }
6779       if (libfunc != NULL)
6780         {
6781           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6782           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6783                                             2, addr, ptr_mode, val, mode);
6784
6785           if (!unused_result && fixup)
6786             result = expand_simple_binop (mode, code, result, val, target,
6787                                           true, OPTAB_LIB_WIDEN);
6788           return result;
6789         }
6790
6791       /* We need the original code for any further attempts.  */
6792       code = orig_code;
6793     }
6794
6795   /* If nothing else has succeeded, default to a compare and swap loop.  */
6796   if (can_compare_and_swap_p (mode, true))
6797     {
6798       rtx_insn *insn;
6799       rtx t0 = gen_reg_rtx (mode), t1;
6800
6801       start_sequence ();
6802
6803       /* If the result is used, get a register for it.  */
6804       if (!unused_result)
6805         {
6806           if (!target || !register_operand (target, mode))
6807             target = gen_reg_rtx (mode);
6808           /* If fetch_before, copy the value now.  */
6809           if (!after)
6810             emit_move_insn (target, t0);
6811         }
6812       else
6813         target = const0_rtx;
6814
6815       t1 = t0;
6816       if (code == NOT)
6817         {
6818           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
6819                                     true, OPTAB_LIB_WIDEN);
6820           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
6821         }
6822       else
6823         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
6824                                   OPTAB_LIB_WIDEN);
6825
6826       /* For after, copy the value now.  */
6827       if (!unused_result && after)
6828         emit_move_insn (target, t1);
6829       insn = get_insns ();
6830       end_sequence ();
6831
6832       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
6833         return target;
6834     }
6835
6836   return NULL_RTX;
6837 }
6838 \f
6839 /* Return true if OPERAND is suitable for operand number OPNO of
6840    instruction ICODE.  */
6841
6842 bool
6843 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
6844 {
6845   return (!insn_data[(int) icode].operand[opno].predicate
6846           || (insn_data[(int) icode].operand[opno].predicate
6847               (operand, insn_data[(int) icode].operand[opno].mode)));
6848 }
6849 \f
6850 /* TARGET is a target of a multiword operation that we are going to
6851    implement as a series of word-mode operations.  Return true if
6852    TARGET is suitable for this purpose.  */
6853
6854 bool
6855 valid_multiword_target_p (rtx target)
6856 {
6857   machine_mode mode;
6858   int i;
6859
6860   mode = GET_MODE (target);
6861   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
6862     if (!validate_subreg (word_mode, mode, target, i))
6863       return false;
6864   return true;
6865 }
6866
6867 /* Like maybe_legitimize_operand, but do not change the code of the
6868    current rtx value.  */
6869
6870 static bool
6871 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
6872                                     struct expand_operand *op)
6873 {
6874   /* See if the operand matches in its current form.  */
6875   if (insn_operand_matches (icode, opno, op->value))
6876     return true;
6877
6878   /* If the operand is a memory whose address has no side effects,
6879      try forcing the address into a non-virtual pseudo register.
6880      The check for side effects is important because copy_to_mode_reg
6881      cannot handle things like auto-modified addresses.  */
6882   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
6883     {
6884       rtx addr, mem;
6885
6886       mem = op->value;
6887       addr = XEXP (mem, 0);
6888       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
6889           && !side_effects_p (addr))
6890         {
6891           rtx_insn *last;
6892           machine_mode mode;
6893
6894           last = get_last_insn ();
6895           mode = get_address_mode (mem);
6896           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
6897           if (insn_operand_matches (icode, opno, mem))
6898             {
6899               op->value = mem;
6900               return true;
6901             }
6902           delete_insns_since (last);
6903         }
6904     }
6905
6906   return false;
6907 }
6908
6909 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
6910    on success, storing the new operand value back in OP.  */
6911
6912 static bool
6913 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
6914                           struct expand_operand *op)
6915 {
6916   machine_mode mode, imode;
6917   bool old_volatile_ok, result;
6918
6919   mode = op->mode;
6920   switch (op->type)
6921     {
6922     case EXPAND_FIXED:
6923       old_volatile_ok = volatile_ok;
6924       volatile_ok = true;
6925       result = maybe_legitimize_operand_same_code (icode, opno, op);
6926       volatile_ok = old_volatile_ok;
6927       return result;
6928
6929     case EXPAND_OUTPUT:
6930       gcc_assert (mode != VOIDmode);
6931       if (op->value
6932           && op->value != const0_rtx
6933           && GET_MODE (op->value) == mode
6934           && maybe_legitimize_operand_same_code (icode, opno, op))
6935         return true;
6936
6937       op->value = gen_reg_rtx (mode);
6938       op->target = 0;
6939       break;
6940
6941     case EXPAND_INPUT:
6942     input:
6943       gcc_assert (mode != VOIDmode);
6944       gcc_assert (GET_MODE (op->value) == VOIDmode
6945                   || GET_MODE (op->value) == mode);
6946       if (maybe_legitimize_operand_same_code (icode, opno, op))
6947         return true;
6948
6949       op->value = copy_to_mode_reg (mode, op->value);
6950       break;
6951
6952     case EXPAND_CONVERT_TO:
6953       gcc_assert (mode != VOIDmode);
6954       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
6955       goto input;
6956
6957     case EXPAND_CONVERT_FROM:
6958       if (GET_MODE (op->value) != VOIDmode)
6959         mode = GET_MODE (op->value);
6960       else
6961         /* The caller must tell us what mode this value has.  */
6962         gcc_assert (mode != VOIDmode);
6963
6964       imode = insn_data[(int) icode].operand[opno].mode;
6965       if (imode != VOIDmode && imode != mode)
6966         {
6967           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
6968           mode = imode;
6969         }
6970       goto input;
6971
6972     case EXPAND_ADDRESS:
6973       gcc_assert (mode != VOIDmode);
6974       op->value = convert_memory_address (mode, op->value);
6975       goto input;
6976
6977     case EXPAND_INTEGER:
6978       mode = insn_data[(int) icode].operand[opno].mode;
6979       if (mode != VOIDmode && const_int_operand (op->value, mode))
6980         goto input;
6981       break;
6982     }
6983   return insn_operand_matches (icode, opno, op->value);
6984 }
6985
6986 /* Make OP describe an input operand that should have the same value
6987    as VALUE, after any mode conversion that the target might request.
6988    TYPE is the type of VALUE.  */
6989
6990 void
6991 create_convert_operand_from_type (struct expand_operand *op,
6992                                   rtx value, tree type)
6993 {
6994   create_convert_operand_from (op, value, TYPE_MODE (type),
6995                                TYPE_UNSIGNED (type));
6996 }
6997
6998 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
6999    of instruction ICODE.  Return true on success, leaving the new operand
7000    values in the OPS themselves.  Emit no code on failure.  */
7001
7002 bool
7003 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7004                            unsigned int nops, struct expand_operand *ops)
7005 {
7006   rtx_insn *last;
7007   unsigned int i;
7008
7009   last = get_last_insn ();
7010   for (i = 0; i < nops; i++)
7011     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
7012       {
7013         delete_insns_since (last);
7014         return false;
7015       }
7016   return true;
7017 }
7018
7019 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7020    as its operands.  Return the instruction pattern on success,
7021    and emit any necessary set-up code.  Return null and emit no
7022    code on failure.  */
7023
7024 rtx_insn *
7025 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7026                 struct expand_operand *ops)
7027 {
7028   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7029   if (!maybe_legitimize_operands (icode, 0, nops, ops))
7030     return NULL;
7031
7032   switch (nops)
7033     {
7034     case 1:
7035       return GEN_FCN (icode) (ops[0].value);
7036     case 2:
7037       return GEN_FCN (icode) (ops[0].value, ops[1].value);
7038     case 3:
7039       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7040     case 4:
7041       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7042                               ops[3].value);
7043     case 5:
7044       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7045                               ops[3].value, ops[4].value);
7046     case 6:
7047       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7048                               ops[3].value, ops[4].value, ops[5].value);
7049     case 7:
7050       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7051                               ops[3].value, ops[4].value, ops[5].value,
7052                               ops[6].value);
7053     case 8:
7054       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7055                               ops[3].value, ops[4].value, ops[5].value,
7056                               ops[6].value, ops[7].value);
7057     case 9:
7058       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7059                               ops[3].value, ops[4].value, ops[5].value,
7060                               ops[6].value, ops[7].value, ops[8].value);
7061     }
7062   gcc_unreachable ();
7063 }
7064
7065 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
7066    as its operands.  Return true on success and emit no code on failure.  */
7067
7068 bool
7069 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7070                    struct expand_operand *ops)
7071 {
7072   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7073   if (pat)
7074     {
7075       emit_insn (pat);
7076       return true;
7077     }
7078   return false;
7079 }
7080
7081 /* Like maybe_expand_insn, but for jumps.  */
7082
7083 bool
7084 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7085                         struct expand_operand *ops)
7086 {
7087   rtx_insn *pat = maybe_gen_insn (icode, nops, ops);
7088   if (pat)
7089     {
7090       emit_jump_insn (pat);
7091       return true;
7092     }
7093   return false;
7094 }
7095
7096 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
7097    as its operands.  */
7098
7099 void
7100 expand_insn (enum insn_code icode, unsigned int nops,
7101              struct expand_operand *ops)
7102 {
7103   if (!maybe_expand_insn (icode, nops, ops))
7104     gcc_unreachable ();
7105 }
7106
7107 /* Like expand_insn, but for jumps.  */
7108
7109 void
7110 expand_jump_insn (enum insn_code icode, unsigned int nops,
7111                   struct expand_operand *ops)
7112 {
7113   if (!maybe_expand_jump_insn (icode, nops, ops))
7114     gcc_unreachable ();
7115 }