gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "tree.h"
  32 #include "stor-layout.h"
  33 #include "stringpool.h"
  34 #include "varasm.h"
  35 #include "tm_p.h"
  36 #include "flags.h"
  37 #include "function.h"
  38 #include "except.h"
  39 #include "expr.h"
  40 #include "optabs.h"
  41 #include "libfuncs.h"
  42 #include "recog.h"
  43 #include "reload.h"
  44 #include "ggc.h"
  45 #include "basic-block.h"
  46 #include "target.h"
  47
  48 struct target_optabs default_target_optabs;   /* Default instance; the pointers below start out aimed at it.  */
  49 struct target_libfuncs default_target_libfuncs;   /* Default instance of the libfunc state.  */
  50 struct target_optabs *this_fn_optabs = &default_target_optabs;   /* Initially the default tables.  */
  51 #if SWITCHABLE_TARGET   /* These two pointers are only defined as variables in this configuration.  */
  52 struct target_optabs *this_target_optabs = &default_target_optabs;
  53 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  54 #endif
  55 /* Shorthand for the libfunc hash table reached through this_target_libfuncs.  */
  56 #define libfunc_hash \
  57   (this_target_libfuncs->x_libfunc_hash)
  58 /* Forward declarations of static helpers; their definitions are not in this part of the file.  */
  59 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  60                                    enum machine_mode *);
  61 static rtx expand_unop_direct (enum machine_mode, optab, rtx, rtx, int);
  62 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  63
  64 /* Debug facility for use in GDB.  Declared here; takes no arguments.  */
  65 void debug_optab_libfuncs (void);
  66
  67 /* Prefix for the decimal floating point format in use: "bid_" when
        ENABLE_DECIMAL_BID_FORMAT is nonzero, "dpd_" otherwise.  */
  68 #if ENABLE_DECIMAL_BID_FORMAT
  69 #define DECIMAL_PREFIX "bid_"
  70 #else
  71 #define DECIMAL_PREFIX "dpd_"
  72 #endif
  73 \f
  74 /* Used for libfunc_hash.  */
  75
  76 static hashval_t
  77 hash_libfunc (const void *p)
  78 {
  79   const struct libfunc_entry *const e = (const struct libfunc_entry *) p;
  80   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
  81 }
  82
  83 /* Used for libfunc_hash.  */
  84
  85 static int
  86 eq_libfunc (const void *p, const void *q)
  87 {
  88   const struct libfunc_entry *const e1 = (const struct libfunc_entry *) p;
  89   const struct libfunc_entry *const e2 = (const struct libfunc_entry *) q;
  90   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
  91 }
  92
  93 /* Return libfunc corresponding operation defined by OPTAB converting
  94    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
  95    if no libfunc is available.  */
  96 rtx
  97 convert_optab_libfunc (convert_optab optab, enum machine_mode mode1,
  98                        enum machine_mode mode2)
  99 {
 100   struct libfunc_entry e;
 101   struct libfunc_entry **slot;
 102
 103   /* ??? This ought to be an assert, but not all of the places
 104      that we expand optabs know about the optabs that got moved
 105      to being direct.  */
 106   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 107     return NULL_RTX;
 108
 109   e.op = optab;
 110   e.mode1 = mode1;
 111   e.mode2 = mode2;
 112   slot = (struct libfunc_entry **)
 113     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 114   if (!slot)
 115     {
 116       const struct convert_optab_libcall_d *d
 117         = &convlib_def[optab - FIRST_CONV_OPTAB];
 118
 119       if (d->libcall_gen == NULL)
 120         return NULL;
 121
 122       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 123       slot = (struct libfunc_entry **)
 124         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 125       if (!slot)
 126         return NULL;
 127     }
 128   return (*slot)->libfunc;
 129 }
 130
 131 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 132    Trigger lazy initialization if needed, return NULL if no libfunc is
 133    available.  */
 134 rtx
 135 optab_libfunc (optab optab, enum machine_mode mode)
 136 {
 137   struct libfunc_entry e;
 138   struct libfunc_entry **slot;
 139
 140   /* ??? This ought to be an assert, but not all of the places
 141      that we expand optabs know about the optabs that got moved
 142      to being direct.  */
 143   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 144     return NULL_RTX;
 145
 146   e.op = optab;
 147   e.mode1 = mode;
 148   e.mode2 = VOIDmode;
 149   slot = (struct libfunc_entry **)
 150     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 151   if (!slot)
 152     {
 153       const struct optab_libcall_d *d
 154         = &normlib_def[optab - FIRST_NORM_OPTAB];
 155
 156       if (d->libcall_gen == NULL)
 157         return NULL;
 158
 159       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 160       slot = (struct libfunc_entry **)
 161         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 162       if (!slot)
 163         return NULL;
 164     }
 165   return (*slot)->libfunc;
 166 }
 167
 168 \f
 169 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 170    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 171    operation).
 172
 173    If the last insn does not set TARGET, don't do anything, but return 1.
 174
 175    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 176    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 177    try again, ensuring that TARGET is not one of the operands.  */
 178
 179 static int
 180 add_equal_note (rtx insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 181 {
 182   rtx last_insn, set;
 183   rtx note;
 184
 185   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 186
 187   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 188       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 189       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 190       && GET_RTX_CLASS (code) != RTX_COMPARE
 191       && GET_RTX_CLASS (code) != RTX_UNARY)
 192     return 1;
 193
 194   if (GET_CODE (target) == ZERO_EXTRACT)
 195     return 1;
 196
 197   for (last_insn = insns;
 198        NEXT_INSN (last_insn) != NULL_RTX;
 199        last_insn = NEXT_INSN (last_insn))
 200     ;
 201
 202   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 203      a value changing in the insn, so the note would be invalid for CSE.  */
 204   if (reg_overlap_mentioned_p (target, op0)
 205       || (op1 && reg_overlap_mentioned_p (target, op1)))
 206     {
 207       if (MEM_P (target)
 208           && (rtx_equal_p (target, op0)
 209               || (op1 && rtx_equal_p (target, op1))))
 210         {
 211           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 212              over expanding it as temp = MEM op X, MEM = temp.  If the target
 213              supports MEM = MEM op X instructions, it is sometimes too hard
 214              to reconstruct that form later, especially if X is also a memory,
 215              and due to multiple occurrences of addresses the address might
 216              be forced into register unnecessarily.
 217              Note that not emitting the REG_EQUIV note might inhibit
 218              CSE in some cases.  */
 219           set = single_set (last_insn);
 220           if (set
 221               && GET_CODE (SET_SRC (set)) == code
 222               && MEM_P (SET_DEST (set))
 223               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 224                   || (op1 && rtx_equal_p (SET_DEST (set),
 225                                           XEXP (SET_SRC (set), 1)))))
 226             return 1;
 227         }
 228       return 0;
 229     }
 230
 231   set = set_for_reg_notes (last_insn);
 232   if (set == NULL_RTX)
 233     return 1;
 234
 235   if (! rtx_equal_p (SET_DEST (set), target)
 236       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 237       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 238           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 239     return 1;
 240
 241   if (GET_RTX_CLASS (code) == RTX_UNARY)
 242     switch (code)
 243       {
 244       case FFS:
 245       case CLZ:
 246       case CTZ:
 247       case CLRSB:
 248       case POPCOUNT:
 249       case PARITY:
 250       case BSWAP:
 251         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 252           {
 253             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 254             if (GET_MODE_SIZE (GET_MODE (op0))
 255                 > GET_MODE_SIZE (GET_MODE (target)))
 256               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 257                                          note, GET_MODE (op0));
 258             else
 259               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 260                                          note, GET_MODE (op0));
 261             break;
 262           }
 263         /* FALLTHRU */
 264       default:
 265         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 266         break;
 267       }
 268   else
 269     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 270
 271   set_unique_reg_note (last_insn, REG_EQUAL, note);
 272
 273   return 1;
 274 }
 275 \f
 276 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 277    for a widening operation would be.  In most cases this would be OP0, but if
 278    that's a constant it'll be VOIDmode, which isn't useful.  */
 279
 280 static enum machine_mode
 281 widened_mode (enum machine_mode to_mode, rtx op0, rtx op1)
 282 {
 283   enum machine_mode m0 = GET_MODE (op0);
 284   enum machine_mode m1 = GET_MODE (op1);
 285   enum machine_mode result;
 286
 287   if (m0 == VOIDmode && m1 == VOIDmode)
 288     return to_mode;
 289   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 290     result = m1;
 291   else
 292     result = m0;
 293
 294   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 295     return to_mode;
 296
 297   return result;
 298 }
 299 \f
 300 /* Like optab_handler, but for widening_operations that have a
 301    TO_MODE and a FROM_MODE.  */
 302
 303 enum insn_code
 304 widening_optab_handler (optab op, enum machine_mode to_mode,
 305                         enum machine_mode from_mode)
 306 {
 307   unsigned scode = (op << 16) | to_mode;
 308   if (to_mode != from_mode && from_mode != VOIDmode)
 309     {
 310       /* ??? Why does find_widening_optab_handler_and_mode attempt to
 311          widen things that can't be widened?  E.g. add_optab... */
 312       if (op > LAST_CONV_OPTAB)
 313         return CODE_FOR_nothing;
 314       scode |= from_mode << 8;
 315     }
 316   return raw_optab_handler (scode);
 317 }
 318
 319 /* Find a widening optab even if it doesn't widen as much as we want.
 320    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 321    direct HI->SI insn, then return SI->DI, if that exists.
 322    If PERMIT_NON_WIDENING is non-zero then this can be used with
 323    non-widening optabs also.  */
 324
 325 enum insn_code
 326 find_widening_optab_handler_and_mode (optab op, enum machine_mode to_mode,
 327                                       enum machine_mode from_mode,
 328                                       int permit_non_widening,
 329                                       enum machine_mode *found_mode)
 330 {
 331   for (; (permit_non_widening || from_mode != to_mode)
 332          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 333          && from_mode != VOIDmode;
 334        from_mode = GET_MODE_WIDER_MODE (from_mode))
 335     {
 336       enum insn_code handler = widening_optab_handler (op, to_mode,
 337                                                        from_mode);
 338
 339       if (handler != CODE_FOR_nothing)
 340         {
 341           if (found_mode)
 342             *found_mode = from_mode;
 343           return handler;
 344         }
 345     }
 346
 347   return CODE_FOR_nothing;
 348 }
 349 \f
 350 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 351    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 352    not actually do a sign-extend or zero-extend, but can leave the
 353    higher-order bits of the result rtx undefined, for example, in the case
 354    of logical operations, but not right shifts.  */
 355
 356 static rtx
 357 widen_operand (rtx op, enum machine_mode mode, enum machine_mode oldmode,
 358                int unsignedp, int no_extend)
 359 {
 360   rtx result;
 361
 362   /* If we don't have to extend and this is a constant, return it.  */
 363   if (no_extend && GET_MODE (op) == VOIDmode)
 364     return op;
 365
 366   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 367      extend since it will be more efficient to do so unless the signedness of
 368      a promoted object differs from our extension.  */
 369   if (! no_extend
 370       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 371           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 372     return convert_modes (mode, oldmode, op, unsignedp);
 373
 374   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 375      SUBREG.  */
 376   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 377     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 378
 379   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 380      part to OP.  */
 381
 382   result = gen_reg_rtx (mode);
 383   emit_clobber (result);
 384   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 385   return result;
 386 }
 387 \f
 388 /* Return the optab used for computing the operation given by the tree code,
 389    CODE and the tree EXP.  This function is not always usable (for example, it
 390    cannot give complete results for multiplication or division) but probably
 391    ought to be relied on more widely throughout the expander.  */
 392 optab
 393 optab_for_tree_code (enum tree_code code, const_tree type,
 394                      enum optab_subtype subtype)
 395 {
 396   bool trapv;
 397   switch (code)
 398     {
 399     case BIT_AND_EXPR:
 400       return and_optab;
 401
 402     case BIT_IOR_EXPR:
 403       return ior_optab;
 404
 405     case BIT_NOT_EXPR:
 406       return one_cmpl_optab;
 407
 408     case BIT_XOR_EXPR:
 409       return xor_optab;
 410
 411     case MULT_HIGHPART_EXPR:
 412       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 413
 414     case TRUNC_MOD_EXPR:
 415     case CEIL_MOD_EXPR:
 416     case FLOOR_MOD_EXPR:
 417     case ROUND_MOD_EXPR:
 418       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 419
 420     case RDIV_EXPR:
 421     case TRUNC_DIV_EXPR:
 422     case CEIL_DIV_EXPR:
 423     case FLOOR_DIV_EXPR:
 424     case ROUND_DIV_EXPR:
 425     case EXACT_DIV_EXPR:
 426       if (TYPE_SATURATING (type))
 427         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 428       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 429
 430     case LSHIFT_EXPR:
 431       if (TREE_CODE (type) == VECTOR_TYPE)
 432         {
 433           if (subtype == optab_vector)
 434             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 435
 436           gcc_assert (subtype == optab_scalar);
 437         }
 438       if (TYPE_SATURATING (type))
 439         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 440       return ashl_optab;
 441
 442     case RSHIFT_EXPR:
 443       if (TREE_CODE (type) == VECTOR_TYPE)
 444         {
 445           if (subtype == optab_vector)
 446             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 447
 448           gcc_assert (subtype == optab_scalar);
 449         }
 450       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 451
 452     case LROTATE_EXPR:
 453       if (TREE_CODE (type) == VECTOR_TYPE)
 454         {
 455           if (subtype == optab_vector)
 456             return vrotl_optab;
 457
 458           gcc_assert (subtype == optab_scalar);
 459         }
 460       return rotl_optab;
 461
 462     case RROTATE_EXPR:
 463       if (TREE_CODE (type) == VECTOR_TYPE)
 464         {
 465           if (subtype == optab_vector)
 466             return vrotr_optab;
 467
 468           gcc_assert (subtype == optab_scalar);
 469         }
 470       return rotr_optab;
 471
 472     case MAX_EXPR:
 473       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 474
 475     case MIN_EXPR:
 476       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 477
 478     case REALIGN_LOAD_EXPR:
 479       return vec_realign_load_optab;
 480
 481     case WIDEN_SUM_EXPR:
 482       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 483
 484     case DOT_PROD_EXPR:
 485       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 486
 487     case SAD_EXPR:
 488       return TYPE_UNSIGNED (type) ? usad_optab : ssad_optab;
 489
 490     case WIDEN_MULT_PLUS_EXPR:
 491       return (TYPE_UNSIGNED (type)
 492               ? (TYPE_SATURATING (type)
 493                  ? usmadd_widen_optab : umadd_widen_optab)
 494               : (TYPE_SATURATING (type)
 495                  ? ssmadd_widen_optab : smadd_widen_optab));
 496
 497     case WIDEN_MULT_MINUS_EXPR:
 498       return (TYPE_UNSIGNED (type)
 499               ? (TYPE_SATURATING (type)
 500                  ? usmsub_widen_optab : umsub_widen_optab)
 501               : (TYPE_SATURATING (type)
 502                  ? ssmsub_widen_optab : smsub_widen_optab));
 503
 504     case FMA_EXPR:
 505       return fma_optab;
 506
 507     case REDUC_MAX_EXPR:
 508       return TYPE_UNSIGNED (type) ? reduc_umax_optab : reduc_smax_optab;
 509
 510     case REDUC_MIN_EXPR:
 511       return TYPE_UNSIGNED (type) ? reduc_umin_optab : reduc_smin_optab;
 512
 513     case REDUC_PLUS_EXPR:
 514       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 515
 516     case VEC_LSHIFT_EXPR:
 517       return vec_shl_optab;
 518
 519     case VEC_RSHIFT_EXPR:
 520       return vec_shr_optab;
 521
 522     case VEC_WIDEN_MULT_HI_EXPR:
 523       return TYPE_UNSIGNED (type) ?
 524         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 525
 526     case VEC_WIDEN_MULT_LO_EXPR:
 527       return TYPE_UNSIGNED (type) ?
 528         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 529
 530     case VEC_WIDEN_MULT_EVEN_EXPR:
 531       return TYPE_UNSIGNED (type) ?
 532         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 533
 534     case VEC_WIDEN_MULT_ODD_EXPR:
 535       return TYPE_UNSIGNED (type) ?
 536         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 537
 538     case VEC_WIDEN_LSHIFT_HI_EXPR:
 539       return TYPE_UNSIGNED (type) ?
 540         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 541
 542     case VEC_WIDEN_LSHIFT_LO_EXPR:
 543       return TYPE_UNSIGNED (type) ?
 544         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 545
 546     case VEC_UNPACK_HI_EXPR:
 547       return TYPE_UNSIGNED (type) ?
 548         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 549
 550     case VEC_UNPACK_LO_EXPR:
 551       return TYPE_UNSIGNED (type) ?
 552         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 553
 554     case VEC_UNPACK_FLOAT_HI_EXPR:
 555       /* The signedness is determined from input operand.  */
 556       return TYPE_UNSIGNED (type) ?
 557         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 558
 559     case VEC_UNPACK_FLOAT_LO_EXPR:
 560       /* The signedness is determined from input operand.  */
 561       return TYPE_UNSIGNED (type) ?
 562         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 563
 564     case VEC_PACK_TRUNC_EXPR:
 565       return vec_pack_trunc_optab;
 566
 567     case VEC_PACK_SAT_EXPR:
 568       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 569
 570     case VEC_PACK_FIX_TRUNC_EXPR:
 571       /* The signedness is determined from output operand.  */
 572       return TYPE_UNSIGNED (type) ?
 573         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 574
 575     default:
 576       break;
 577     }
 578
 579   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 580   switch (code)
 581     {
 582     case POINTER_PLUS_EXPR:
 583     case PLUS_EXPR:
 584       if (TYPE_SATURATING (type))
 585         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 586       return trapv ? addv_optab : add_optab;
 587
 588     case MINUS_EXPR:
 589       if (TYPE_SATURATING (type))
 590         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 591       return trapv ? subv_optab : sub_optab;
 592
 593     case MULT_EXPR:
 594       if (TYPE_SATURATING (type))
 595         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 596       return trapv ? smulv_optab : smul_optab;
 597
 598     case NEGATE_EXPR:
 599       if (TYPE_SATURATING (type))
 600         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 601       return trapv ? negv_optab : neg_optab;
 602
 603     case ABS_EXPR:
 604       return trapv ? absv_optab : abs_optab;
 605
 606     default:
 607       return unknown_optab;
 608     }
 609 }
 610 \f
 611
 612 /* Expand vector widening operations.
 613
 614    There are two different classes of operations handled here:
 615    1) Operations whose result is wider than all the arguments to the operation.
 616       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 617       In this case OP0 and optionally OP1 would be initialized,
 618       but WIDE_OP wouldn't (not relevant for this case).
 619    2) Operations whose result is of the same size as the last argument to the
 620       operation, but wider than all the other arguments to the operation.
 621       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 622       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 623
 624    E.g, when called to expand the following operations, this is how
 625    the arguments will be initialized:
 626                                 nops    OP0     OP1     WIDE_OP
 627    widening-sum                 2       oprnd0  -       oprnd1
 628    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 629    widening-mult                2       oprnd0  oprnd1  -
 630    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 631
 632 rtx
 633 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 634                            rtx target, int unsignedp)
 635 {
 636   struct expand_operand eops[4];
 637   tree oprnd0, oprnd1, oprnd2;
 638   enum machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 639   optab widen_pattern_optab;
 640   enum insn_code icode;
 641   int nops = TREE_CODE_LENGTH (ops->code);
 642   int op;
 643
 644   oprnd0 = ops->op0;
 645   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 646   widen_pattern_optab =
 647     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 648   if (ops->code == WIDEN_MULT_PLUS_EXPR
 649       || ops->code == WIDEN_MULT_MINUS_EXPR)
 650     icode = find_widening_optab_handler (widen_pattern_optab,
 651                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 652                                          tmode0, 0);
 653   else
 654     icode = optab_handler (widen_pattern_optab, tmode0);
 655   gcc_assert (icode != CODE_FOR_nothing);
 656
 657   if (nops >= 2)
 658     {
 659       oprnd1 = ops->op1;
 660       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 661     }
 662
 663   /* The last operand is of a wider mode than the rest of the operands.  */
 664   if (nops == 2)
 665     wmode = tmode1;
 666   else if (nops == 3)
 667     {
 668       gcc_assert (tmode1 == tmode0);
 669       gcc_assert (op1);
 670       oprnd2 = ops->op2;
 671       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 672     }
 673
 674   op = 0;
 675   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 676   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 677   if (op1)
 678     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 679   if (wide_op)
 680     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 681   expand_insn (icode, op, eops);
 682   return eops[0].value;
 683 }
 684
 685 /* Generate code to perform an operation specified by TERNARY_OPTAB
 686    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 687
 688    UNSIGNEDP is for the case where we have to widen the operands
 689    to perform the operation.  It says to use zero-extension.
 690
 691    If TARGET is nonzero, the value
 692    is generated there, if it is convenient to do so.
 693    In all cases an rtx is returned for the locus of the value;
 694    this may or may not be TARGET.  */
 695
 696 rtx
 697 expand_ternary_op (enum machine_mode mode, optab ternary_optab, rtx op0,
 698                    rtx op1, rtx op2, rtx target, int unsignedp)
 699 {
 700   struct expand_operand ops[4];
 701   enum insn_code icode = optab_handler (ternary_optab, mode);
 702
 703   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 704
 705   create_output_operand (&ops[0], target, mode);
 706   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 707   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 708   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 709   expand_insn (icode, 4, ops);
 710   return ops[0].value;
 711 }
 712
 713
 714 /* Like expand_binop, but return a constant rtx if the result can be
 715    calculated at compile time.  The arguments and return value are
 716    otherwise the same as for expand_binop.  */
 717
 718 rtx
 719 simplify_expand_binop (enum machine_mode mode, optab binoptab,
 720                        rtx op0, rtx op1, rtx target, int unsignedp,
 721                        enum optab_methods methods)
 722 {
 723   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 724     {
 725       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 726                                          mode, op0, op1);
 727       if (x)
 728         return x;
 729     }
 730
 731   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 732 }
 733
 734 /* Like simplify_expand_binop, but always put the result in TARGET.
 735    Return true if the expansion succeeded.  */
 736
 737 bool
 738 force_expand_binop (enum machine_mode mode, optab binoptab,
 739                     rtx op0, rtx op1, rtx target, int unsignedp,
 740                     enum optab_methods methods)
 741 {
 742   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 743                                  target, unsignedp, methods);
 744   if (x == 0)
 745     return false;
 746   if (x != target)
 747     emit_move_insn (target, x);
 748   return true;
 749 }
 750
 751 /* Generate insns for VEC_LSHIFT_EXPR, VEC_RSHIFT_EXPR.  */
 752
 753 rtx
 754 expand_vec_shift_expr (sepops ops, rtx target)
 755 {
 756   struct expand_operand eops[3];
 757   enum insn_code icode;
 758   rtx rtx_op1, rtx_op2;
 759   enum machine_mode mode = TYPE_MODE (ops->type);
 760   tree vec_oprnd = ops->op0;
 761   tree shift_oprnd = ops->op1;
 762   optab shift_optab;
 763
 764   switch (ops->code)
 765     {
 766       case VEC_RSHIFT_EXPR:
 767         shift_optab = vec_shr_optab;
 768         break;
 769       case VEC_LSHIFT_EXPR:
 770         shift_optab = vec_shl_optab;
 771         break;
 772       default:
 773         gcc_unreachable ();
 774     }
 775
 776   icode = optab_handler (shift_optab, mode);
 777   gcc_assert (icode != CODE_FOR_nothing);
 778
 779   rtx_op1 = expand_normal (vec_oprnd);
 780   rtx_op2 = expand_normal (shift_oprnd);
 781
 782   create_output_operand (&eops[0], target, mode);
 783   create_input_operand (&eops[1], rtx_op1, GET_MODE (rtx_op1));
 784   create_convert_operand_from_type (&eops[2], rtx_op2, TREE_TYPE (shift_oprnd));
 785   expand_insn (icode, 3, eops);
 786
 787   return eops[0].value;
 788 }
 789
 790 /* Create a new vector value in VMODE with all elements set to OP.  The
 791    mode of OP must be the element mode of VMODE.  If OP is a constant,
 792    then the return value will be a constant.  */
 793
 794 static rtx
 795 expand_vector_broadcast (enum machine_mode vmode, rtx op)
 796 {
 797   enum insn_code icode;
 798   rtvec vec;
 799   rtx ret;
 800   int i, n;
 801
 802   gcc_checking_assert (VECTOR_MODE_P (vmode));
 803
 804   n = GET_MODE_NUNITS (vmode);
 805   vec = rtvec_alloc (n);
 806   for (i = 0; i < n; ++i)
 807     RTVEC_ELT (vec, i) = op;
 808
 809   if (CONSTANT_P (op))
 810     return gen_rtx_CONST_VECTOR (vmode, vec);
 811
 812   /* ??? If the target doesn't have a vec_init, then we have no easy way
 813      of performing this operation.  Most of this sort of generic support
 814      is hidden away in the vector lowering support in gimple.  */
 815   icode = optab_handler (vec_init_optab, vmode);
 816   if (icode == CODE_FOR_nothing)
 817     return NULL;
 818
 819   ret = gen_reg_rtx (vmode);
 820   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 821
 822   return ret;
 823 }
 824
 825 /* This subroutine of expand_doubleword_shift handles the cases in which
 826    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 827    value are the same as for the parent routine, except that SUPERWORD_OP1
 828    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 829    INTO_TARGET may be null if the caller has decided to calculate it.  */
 830
 831 static bool
 832 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 833                         rtx outof_target, rtx into_target,
 834                         int unsignedp, enum optab_methods methods)
 835 {
 836   if (into_target != 0)
 837     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 838                              into_target, unsignedp, methods))
 839       return false;
 840
 841   if (outof_target != 0)
 842     {
 843       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 844          of the sign bit, otherwise we must fill it with zeros.  */
 845       if (binoptab != ashr_optab)
 846         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 847       else
 848         if (!force_expand_binop (word_mode, binoptab,
 849                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 850                                  outof_target, unsignedp, methods))
 851           return false;
 852     }
 853   return true;
 854 }
 855
 856 /* This subroutine of expand_doubleword_shift handles the cases in which
 857    the effective shift value is < BITS_PER_WORD.  The arguments and return
 858    value are the same as for the parent routine.  */
 859
 860 static bool
 861 expand_subword_shift (enum machine_mode op1_mode, optab binoptab,
 862                       rtx outof_input, rtx into_input, rtx op1,
 863                       rtx outof_target, rtx into_target,
 864                       int unsignedp, enum optab_methods methods,
 865                       unsigned HOST_WIDE_INT shift_mask)
 866 {
 867   optab reverse_unsigned_shift, unsigned_shift;
 868   rtx tmp, carries;
 869
 870   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 871   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 872
 873   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 874      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 875      the opposite direction to BINOPTAB.  */
 876   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 877     {
 878       carries = outof_input;
 879       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 880                                             op1_mode), op1_mode);
 881       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 882                                    0, true, methods);
 883     }
 884   else
 885     {
 886       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 887          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 888          has unknown behavior.  Do a single shift first, then shift by the
 889          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 890          are truncated to the mode size.  */
 891       carries = expand_binop (word_mode, reverse_unsigned_shift,
 892                               outof_input, const1_rtx, 0, unsignedp, methods);
 893       if (shift_mask == BITS_PER_WORD - 1)
 894         {
 895           tmp = immed_wide_int_const
 896             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 897           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 898                                        0, true, methods);
 899         }
 900       else
 901         {
 902           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 903                                                 op1_mode), op1_mode);
 904           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 905                                        0, true, methods);
 906         }
 907     }
 908   if (tmp == 0 || carries == 0)
 909     return false;
 910   carries = expand_binop (word_mode, reverse_unsigned_shift,
 911                           carries, tmp, 0, unsignedp, methods);
 912   if (carries == 0)
 913     return false;
 914
 915   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 916      so the result can go directly into INTO_TARGET if convenient.  */
 917   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 918                       into_target, unsignedp, methods);
 919   if (tmp == 0)
 920     return false;
 921
 922   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 923   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 924                            into_target, unsignedp, methods))
 925     return false;
 926
 927   /* Use a standard word_mode shift for the out-of half.  */
 928   if (outof_target != 0)
 929     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 930                              outof_target, unsignedp, methods))
 931       return false;
 932
 933   return true;
 934 }
 935
 936
 937 #ifdef HAVE_conditional_move
 938 /* Try implementing expand_doubleword_shift using conditional moves.
 939    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 940    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 941    are the shift counts to use in the former and latter case.  All other
 942    arguments are the same as the parent routine.  */
 943
 944 static bool
 945 expand_doubleword_shift_condmove (enum machine_mode op1_mode, optab binoptab,
 946                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 947                                   rtx outof_input, rtx into_input,
 948                                   rtx subword_op1, rtx superword_op1,
 949                                   rtx outof_target, rtx into_target,
 950                                   int unsignedp, enum optab_methods methods,
 951                                   unsigned HOST_WIDE_INT shift_mask)
 952 {
 953   rtx outof_superword, into_superword;
 954
 955   /* Put the superword version of the output into OUTOF_SUPERWORD and
 956      INTO_SUPERWORD.  */
 957   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 958   if (outof_target != 0 && subword_op1 == superword_op1)
 959     {
 960       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 961          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 962       into_superword = outof_target;
 963       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 964                                    outof_superword, 0, unsignedp, methods))
 965         return false;
 966     }
 967   else
 968     {
 969       into_superword = gen_reg_rtx (word_mode);
 970       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 971                                    outof_superword, into_superword,
 972                                    unsignedp, methods))
 973         return false;
 974     }
 975
 976   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 977   if (!expand_subword_shift (op1_mode, binoptab,
 978                              outof_input, into_input, subword_op1,
 979                              outof_target, into_target,
 980                              unsignedp, methods, shift_mask))
 981     return false;
 982
 983   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 984      might be the current value of OUTOF_TARGET.  */
 985   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 986                               into_target, into_superword, word_mode, false))
 987     return false;
 988
 989   if (outof_target != 0)
 990     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 991                                 outof_target, outof_superword,
 992                                 word_mode, false))
 993       return false;
 994
 995   return true;
 996 }
 997 #endif
 998
 999 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
1000    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
1001    input operand; the shift moves bits in the direction OUTOF_INPUT->
1002    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
1003    of the target.  OP1 is the shift count and OP1_MODE is its mode.
1004    If OP1 is constant, it will have been truncated as appropriate
1005    and is known to be nonzero.
1006
1007    If SHIFT_MASK is zero, the result of word shifts is undefined when the
1008    shift count is outside the range [0, BITS_PER_WORD).  This routine must
1009    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
1010
1011    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
1012    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
1013    fill with zeros or sign bits as appropriate.
1014
1015    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
1016    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
1017    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
1018    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
1019    are undefined.
1020
1021    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1022    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1023    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1024    function wants to calculate it itself.
1025
1026    Return true if the shift could be successfully synthesized.  */
1027
1028 static bool
1029 expand_doubleword_shift (enum machine_mode op1_mode, optab binoptab,
1030                          rtx outof_input, rtx into_input, rtx op1,
1031                          rtx outof_target, rtx into_target,
1032                          int unsignedp, enum optab_methods methods,
1033                          unsigned HOST_WIDE_INT shift_mask)
1034 {
1035   rtx superword_op1, tmp, cmp1, cmp2;
1036   rtx subword_label, done_label;
1037   enum rtx_code cmp_code;
1038
1039   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1040      fill the result with sign or zero bits as appropriate.  If so, the value
1041      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1042      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1043      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1044
1045      This isn't worthwhile for constant shifts since the optimizers will
1046      cope better with in-range shift counts.  */
1047   if (shift_mask >= BITS_PER_WORD
1048       && outof_target != 0
1049       && !CONSTANT_P (op1))
1050     {
1051       if (!expand_doubleword_shift (op1_mode, binoptab,
1052                                     outof_input, into_input, op1,
1053                                     0, into_target,
1054                                     unsignedp, methods, shift_mask))
1055         return false;
1056       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1057                                outof_target, unsignedp, methods))
1058         return false;
1059       return true;
1060     }
1061
1062   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1063      is true when the effective shift value is less than BITS_PER_WORD.
1064      Set SUPERWORD_OP1 to the shift count that should be used to shift
1065      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1066   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
1067   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1068     {
1069       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1070          is a subword shift count.  */
1071       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1072                                     0, true, methods);
1073       cmp2 = CONST0_RTX (op1_mode);
1074       cmp_code = EQ;
1075       superword_op1 = op1;
1076     }
1077   else
1078     {
1079       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
1080       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1081                                     0, true, methods);
1082       cmp2 = CONST0_RTX (op1_mode);
1083       cmp_code = LT;
1084       superword_op1 = cmp1;
1085     }
1086   if (cmp1 == 0)
1087     return false;
1088
1089   /* If we can compute the condition at compile time, pick the
1090      appropriate subroutine.  */
1091   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1092   if (tmp != 0 && CONST_INT_P (tmp))
1093     {
1094       if (tmp == const0_rtx)
1095         return expand_superword_shift (binoptab, outof_input, superword_op1,
1096                                        outof_target, into_target,
1097                                        unsignedp, methods);
1098       else
1099         return expand_subword_shift (op1_mode, binoptab,
1100                                      outof_input, into_input, op1,
1101                                      outof_target, into_target,
1102                                      unsignedp, methods, shift_mask);
1103     }
1104
1105 #ifdef HAVE_conditional_move
1106   /* Try using conditional moves to generate straight-line code.  */
1107   {
1108     rtx_insn *start = get_last_insn ();
1109     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1110                                           cmp_code, cmp1, cmp2,
1111                                           outof_input, into_input,
1112                                           op1, superword_op1,
1113                                           outof_target, into_target,
1114                                           unsignedp, methods, shift_mask))
1115       return true;
1116     delete_insns_since (start);
1117   }
1118 #endif
1119
1120   /* As a last resort, use branches to select the correct alternative.  */
1121   subword_label = gen_label_rtx ();
1122   done_label = gen_label_rtx ();
1123
1124   NO_DEFER_POP;
1125   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1126                            0, 0, subword_label, -1);
1127   OK_DEFER_POP;
1128
1129   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1130                                outof_target, into_target,
1131                                unsignedp, methods))
1132     return false;
1133
1134   emit_jump_insn (gen_jump (done_label));
1135   emit_barrier ();
1136   emit_label (subword_label);
1137
1138   if (!expand_subword_shift (op1_mode, binoptab,
1139                              outof_input, into_input, op1,
1140                              outof_target, into_target,
1141                              unsignedp, methods, shift_mask))
1142     return false;
1143
1144   emit_label (done_label);
1145   return true;
1146 }
1147 \f
1148 /* Subroutine of expand_binop.  Perform a double word multiplication of
1149    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
1150    as the target's word_mode.  This function return NULL_RTX if anything
1151    goes wrong, in which case it may have already emitted instructions
1152    which need to be deleted.
1153
1154    If we want to multiply two two-word values and have normal and widening
1155    multiplies of single-word values, we can do this with three smaller
1156    multiplications.
1157
1158    The multiplication proceeds as follows:
1159                                  _______________________
1160                                 [__op0_high_|__op0_low__]
1161                                  _______________________
1162         *                       [__op1_high_|__op1_low__]
1163         _______________________________________________
1164                                  _______________________
1165     (1)                         [__op0_low__*__op1_low__]
1166                      _______________________
1167     (2a)            [__op0_low__*__op1_high_]
1168                      _______________________
1169     (2b)            [__op0_high_*__op1_low__]
1170          _______________________
1171     (3) [__op0_high_*__op1_high_]
1172
1173
1174   This gives a 4-word result.  Since we are only interested in the
1175   lower 2 words, partial result (3) and the upper words of (2a) and
1176   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1177   calculated using non-widening multiplication.
1178
1179   (1), however, needs to be calculated with an unsigned widening
1180   multiplication.  If this operation is not directly supported we
1181   try using a signed widening multiplication and adjust the result.
1182   This adjustment works as follows:
1183
1184       If both operands are positive then no adjustment is needed.
1185
1186       If the operands have different signs, for example op0_low < 0 and
1187       op1_low >= 0, the instruction treats the most significant bit of
1188       op0_low as a sign bit instead of a bit with significance
1189       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1190       with 2**BITS_PER_WORD - op0_low, and two's complements the
1191       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1192       the result.
1193
1194       Similarly, if both operands are negative, we need to add
1195       (op0_low + op1_low) * 2**BITS_PER_WORD.
1196
1197       We use a trick to adjust quickly.  We logically shift op0_low right
1198       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1199       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1200       logical shift exists, we do an arithmetic right shift and subtract
1201       the 0 or -1.  */
1202
1203 static rtx
1204 expand_doubleword_mult (enum machine_mode mode, rtx op0, rtx op1, rtx target,
1205                        bool umulp, enum optab_methods methods)
1206 {
1207   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1208   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
1209   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1210   rtx product, adjust, product_high, temp;
1211
1212   rtx op0_high = operand_subword_force (op0, high, mode);
1213   rtx op0_low = operand_subword_force (op0, low, mode);
1214   rtx op1_high = operand_subword_force (op1, high, mode);
1215   rtx op1_low = operand_subword_force (op1, low, mode);
1216
1217   /* If we're using an unsigned multiply to directly compute the product
1218      of the low-order words of the operands and perform any required
1219      adjustments of the operands, we begin by trying two more multiplications
1220      and then computing the appropriate sum.
1221
1222      We have checked above that the required addition is provided.
1223      Full-word addition will normally always succeed, especially if
1224      it is provided at all, so we don't worry about its failure.  The
1225      multiplication may well fail, however, so we do handle that.  */
1226
1227   if (!umulp)
1228     {
1229       /* ??? This could be done with emit_store_flag where available.  */
1230       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1231                            NULL_RTX, 1, methods);
1232       if (temp)
1233         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1234                                  NULL_RTX, 0, OPTAB_DIRECT);
1235       else
1236         {
1237           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1238                                NULL_RTX, 0, methods);
1239           if (!temp)
1240             return NULL_RTX;
1241           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1242                                    NULL_RTX, 0, OPTAB_DIRECT);
1243         }
1244
1245       if (!op0_high)
1246         return NULL_RTX;
1247     }
1248
1249   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1250                          NULL_RTX, 0, OPTAB_DIRECT);
1251   if (!adjust)
1252     return NULL_RTX;
1253
1254   /* OP0_HIGH should now be dead.  */
1255
1256   if (!umulp)
1257     {
1258       /* ??? This could be done with emit_store_flag where available.  */
1259       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1260                            NULL_RTX, 1, methods);
1261       if (temp)
1262         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1263                                  NULL_RTX, 0, OPTAB_DIRECT);
1264       else
1265         {
1266           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1267                                NULL_RTX, 0, methods);
1268           if (!temp)
1269             return NULL_RTX;
1270           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1271                                    NULL_RTX, 0, OPTAB_DIRECT);
1272         }
1273
1274       if (!op1_high)
1275         return NULL_RTX;
1276     }
1277
1278   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1279                        NULL_RTX, 0, OPTAB_DIRECT);
1280   if (!temp)
1281     return NULL_RTX;
1282
1283   /* OP1_HIGH should now be dead.  */
1284
1285   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1286                          NULL_RTX, 0, OPTAB_DIRECT);
1287
1288   if (target && !REG_P (target))
1289     target = NULL_RTX;
1290
1291   if (umulp)
1292     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1293                             target, 1, OPTAB_DIRECT);
1294   else
1295     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1296                             target, 1, OPTAB_DIRECT);
1297
1298   if (!product)
1299     return NULL_RTX;
1300
1301   product_high = operand_subword (product, high, 1, mode);
1302   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1303                          NULL_RTX, 0, OPTAB_DIRECT);
1304   emit_move_insn (product_high, adjust);
1305   return product;
1306 }
1307 \f
1308 /* Wrapper around expand_binop which takes an rtx code to specify
1309    the operation to perform, not an optab pointer.  All other
1310    arguments are the same.  */
1311 rtx
1312 expand_simple_binop (enum machine_mode mode, enum rtx_code code, rtx op0,
1313                      rtx op1, rtx target, int unsignedp,
1314                      enum optab_methods methods)
1315 {
1316   optab binop = code_to_optab (code);
1317   gcc_assert (binop);
1318
1319   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1320 }
1321
1322 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1323    binop.  Order them according to commutative_operand_precedence and, if
1324    possible, try to put TARGET or a pseudo first.  */
1325 static bool
1326 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1327 {
1328   int op0_prec = commutative_operand_precedence (op0);
1329   int op1_prec = commutative_operand_precedence (op1);
1330
1331   if (op0_prec < op1_prec)
1332     return true;
1333
1334   if (op0_prec > op1_prec)
1335     return false;
1336
1337   /* With equal precedence, both orders are ok, but it is better if the
1338      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1339   if (target == 0 || REG_P (target))
1340     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1341   else
1342     return rtx_equal_p (op1, target);
1343 }
1344
1345 /* Return true if BINOPTAB implements a shift operation.  */
1346
1347 static bool
1348 shift_optab_p (optab binoptab)
1349 {
1350   switch (optab_to_code (binoptab))
1351     {
1352     case ASHIFT:
1353     case SS_ASHIFT:
1354     case US_ASHIFT:
1355     case ASHIFTRT:
1356     case LSHIFTRT:
1357     case ROTATE:
1358     case ROTATERT:
1359       return true;
1360
1361     default:
1362       return false;
1363     }
1364 }
1365
1366 /* Return true if BINOPTAB implements a commutative binary operation.  */
1367
1368 static bool
1369 commutative_optab_p (optab binoptab)
1370 {
1371   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1372           || binoptab == smul_widen_optab
1373           || binoptab == umul_widen_optab
1374           || binoptab == smul_highpart_optab
1375           || binoptab == umul_highpart_optab);
1376 }
1377
1378 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1379    optimizing, and if the operand is a constant that costs more than
1380    1 instruction, force the constant into a register and return that
1381    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1382
1383 static rtx
1384 avoid_expensive_constant (enum machine_mode mode, optab binoptab,
1385                           int opn, rtx x, bool unsignedp)
1386 {
1387   bool speed = optimize_insn_for_speed_p ();
1388
1389   if (mode != VOIDmode
1390       && optimize
1391       && CONSTANT_P (x)
1392       && (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1393           > set_src_cost (x, speed)))
1394     {
1395       if (CONST_INT_P (x))
1396         {
1397           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1398           if (intval != INTVAL (x))
1399             x = GEN_INT (intval);
1400         }
1401       else
1402         x = convert_modes (mode, VOIDmode, x, unsignedp);
1403       x = force_reg (mode, x);
1404     }
1405   return x;
1406 }
1407
1408 /* Helper function for expand_binop: handle the case where there
1409    is an insn that directly implements the indicated operation.
1410    Returns null if this is not possible.  */
1411 static rtx
1412 expand_binop_directly (enum machine_mode mode, optab binoptab,
1413                        rtx op0, rtx op1,
1414                        rtx target, int unsignedp, enum optab_methods methods,
1415                        rtx_insn *last)
1416 {
1417   enum machine_mode from_mode = widened_mode (mode, op0, op1);
1418   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1419                                                       from_mode, 1);
1420   enum machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1421   enum machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1422   enum machine_mode mode0, mode1, tmp_mode;
1423   struct expand_operand ops[3];
1424   bool commutative_p;
1425   rtx pat;
1426   rtx xop0 = op0, xop1 = op1;
1427   rtx swap;
1428
1429   /* If it is a commutative operator and the modes would match
1430      if we would swap the operands, we can save the conversions.  */
1431   commutative_p = commutative_optab_p (binoptab);
1432   if (commutative_p
1433       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1434       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1435     {
1436       swap = xop0;
1437       xop0 = xop1;
1438       xop1 = swap;
1439     }
1440
1441   /* If we are optimizing, force expensive constants into a register.  */
1442   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1443   if (!shift_optab_p (binoptab))
1444     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1445
1446   /* In case the insn wants input operands in modes different from
1447      those of the actual operands, convert the operands.  It would
1448      seem that we don't need to convert CONST_INTs, but we do, so
1449      that they're properly zero-extended, sign-extended or truncated
1450      for their mode.  */
1451
1452   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1453   if (xmode0 != VOIDmode && xmode0 != mode0)
1454     {
1455       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1456       mode0 = xmode0;
1457     }
1458
1459   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1460   if (xmode1 != VOIDmode && xmode1 != mode1)
1461     {
1462       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1463       mode1 = xmode1;
1464     }
1465
1466   /* If operation is commutative,
1467      try to make the first operand a register.
1468      Even better, try to make it the same as the target.
1469      Also try to make the last operand a constant.  */
1470   if (commutative_p
1471       && swap_commutative_operands_with_target (target, xop0, xop1))
1472     {
1473       swap = xop1;
1474       xop1 = xop0;
1475       xop0 = swap;
1476     }
1477
1478   /* Now, if insn's predicates don't allow our operands, put them into
1479      pseudo regs.  */
1480
1481   if (binoptab == vec_pack_trunc_optab
1482       || binoptab == vec_pack_usat_optab
1483       || binoptab == vec_pack_ssat_optab
1484       || binoptab == vec_pack_ufix_trunc_optab
1485       || binoptab == vec_pack_sfix_trunc_optab)
1486     {
1487       /* The mode of the result is different then the mode of the
1488          arguments.  */
1489       tmp_mode = insn_data[(int) icode].operand[0].mode;
1490       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1491         {
1492           delete_insns_since (last);
1493           return NULL_RTX;
1494         }
1495     }
1496   else
1497     tmp_mode = mode;
1498
1499   create_output_operand (&ops[0], target, tmp_mode);
1500   create_input_operand (&ops[1], xop0, mode0);
1501   create_input_operand (&ops[2], xop1, mode1);
1502   pat = maybe_gen_insn (icode, 3, ops);
1503   if (pat)
1504     {
1505       /* If PAT is composed of more than one insn, try to add an appropriate
1506          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1507          operand, call expand_binop again, this time without a target.  */
1508       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1509           && ! add_equal_note (pat, ops[0].value, optab_to_code (binoptab),
1510                                ops[1].value, ops[2].value))
1511         {
1512           delete_insns_since (last);
1513           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1514                                unsignedp, methods);
1515         }
1516
1517       emit_insn (pat);
1518       return ops[0].value;
1519     }
1520   delete_insns_since (last);
1521   return NULL_RTX;
1522 }
1523
1524 /* Generate code to perform an operation specified by BINOPTAB
1525    on operands OP0 and OP1, with result having machine-mode MODE.
1526
1527    UNSIGNEDP is for the case where we have to widen the operands
1528    to perform the operation.  It says to use zero-extension.
1529
1530    If TARGET is nonzero, the value
1531    is generated there, if it is convenient to do so.
1532    In all cases an rtx is returned for the locus of the value;
1533    this may or may not be TARGET.  */
1534
1535 rtx
1536 expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
1537               rtx target, int unsignedp, enum optab_methods methods)
1538 {
1539   enum optab_methods next_methods
1540     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1541        ? OPTAB_WIDEN : methods);
1542   enum mode_class mclass;
1543   enum machine_mode wider_mode;
1544   rtx libfunc;
1545   rtx temp;
1546   rtx_insn *entry_last = get_last_insn ();
1547   rtx_insn *last;
1548
1549   mclass = GET_MODE_CLASS (mode);
1550
1551   /* If subtracting an integer constant, convert this into an addition of
1552      the negated constant.  */
1553
1554   if (binoptab == sub_optab && CONST_INT_P (op1))
1555     {
1556       op1 = negate_rtx (mode, op1);
1557       binoptab = add_optab;
1558     }
1559
1560   /* Record where to delete back to if we backtrack.  */
1561   last = get_last_insn ();
1562
1563   /* If we can do it with a three-operand insn, do so.  */
1564
1565   if (methods != OPTAB_MUST_WIDEN
1566       && find_widening_optab_handler (binoptab, mode,
1567                                       widened_mode (mode, op0, op1), 1)
1568             != CODE_FOR_nothing)
1569     {
1570       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1571                                     unsignedp, methods, last);
1572       if (temp)
1573         return temp;
1574     }
1575
1576   /* If we were trying to rotate, and that didn't work, try rotating
1577      the other direction before falling back to shifts and bitwise-or.  */
1578   if (((binoptab == rotl_optab
1579         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1580        || (binoptab == rotr_optab
1581            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1582       && mclass == MODE_INT)
1583     {
1584       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1585       rtx newop1;
1586       unsigned int bits = GET_MODE_PRECISION (mode);
1587
1588       if (CONST_INT_P (op1))
1589         newop1 = GEN_INT (bits - INTVAL (op1));
1590       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1591         newop1 = negate_rtx (GET_MODE (op1), op1);
1592       else
1593         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1594                                gen_int_mode (bits, GET_MODE (op1)), op1,
1595                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1596
1597       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1598                                     target, unsignedp, methods, last);
1599       if (temp)
1600         return temp;
1601     }
1602
1603   /* If this is a multiply, see if we can do a widening operation that
1604      takes operands of this mode and makes a wider mode.  */
1605
1606   if (binoptab == smul_optab
1607       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1608       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1609                                              : smul_widen_optab),
1610                                   GET_MODE_2XWIDER_MODE (mode), mode)
1611           != CODE_FOR_nothing))
1612     {
1613       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1614                            unsignedp ? umul_widen_optab : smul_widen_optab,
1615                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1616
1617       if (temp != 0)
1618         {
1619           if (GET_MODE_CLASS (mode) == MODE_INT
1620               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1621             return gen_lowpart (mode, temp);
1622           else
1623             return convert_to_mode (mode, temp, unsignedp);
1624         }
1625     }
1626
1627   /* If this is a vector shift by a scalar, see if we can do a vector
1628      shift by a vector.  If so, broadcast the scalar into a vector.  */
1629   if (mclass == MODE_VECTOR_INT)
1630     {
1631       optab otheroptab = unknown_optab;
1632
1633       if (binoptab == ashl_optab)
1634         otheroptab = vashl_optab;
1635       else if (binoptab == ashr_optab)
1636         otheroptab = vashr_optab;
1637       else if (binoptab == lshr_optab)
1638         otheroptab = vlshr_optab;
1639       else if (binoptab == rotl_optab)
1640         otheroptab = vrotl_optab;
1641       else if (binoptab == rotr_optab)
1642         otheroptab = vrotr_optab;
1643
1644       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1645         {
1646           rtx vop1 = expand_vector_broadcast (mode, op1);
1647           if (vop1)
1648             {
1649               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1650                                             target, unsignedp, methods, last);
1651               if (temp)
1652                 return temp;
1653             }
1654         }
1655     }
1656
1657   /* Look for a wider mode of the same class for which we think we
1658      can open-code the operation.  Check for a widening multiply at the
1659      wider mode as well.  */
1660
1661   if (CLASS_HAS_WIDER_MODES_P (mclass)
1662       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1663     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1664          wider_mode != VOIDmode;
1665          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1666       {
1667         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1668             || (binoptab == smul_optab
1669                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1670                 && (find_widening_optab_handler ((unsignedp
1671                                                   ? umul_widen_optab
1672                                                   : smul_widen_optab),
1673                                                  GET_MODE_WIDER_MODE (wider_mode),
1674                                                  mode, 0)
1675                     != CODE_FOR_nothing)))
1676           {
1677             rtx xop0 = op0, xop1 = op1;
1678             int no_extend = 0;
1679
1680             /* For certain integer operations, we need not actually extend
1681                the narrow operands, as long as we will truncate
1682                the results to the same narrowness.  */
1683
1684             if ((binoptab == ior_optab || binoptab == and_optab
1685                  || binoptab == xor_optab
1686                  || binoptab == add_optab || binoptab == sub_optab
1687                  || binoptab == smul_optab || binoptab == ashl_optab)
1688                 && mclass == MODE_INT)
1689               {
1690                 no_extend = 1;
1691                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1692                                                  xop0, unsignedp);
1693                 if (binoptab != ashl_optab)
1694                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1695                                                    xop1, unsignedp);
1696               }
1697
1698             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1699
1700             /* The second operand of a shift must always be extended.  */
1701             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1702                                   no_extend && binoptab != ashl_optab);
1703
1704             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1705                                  unsignedp, OPTAB_DIRECT);
1706             if (temp)
1707               {
1708                 if (mclass != MODE_INT
1709                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1710                   {
1711                     if (target == 0)
1712                       target = gen_reg_rtx (mode);
1713                     convert_move (target, temp, 0);
1714                     return target;
1715                   }
1716                 else
1717                   return gen_lowpart (mode, temp);
1718               }
1719             else
1720               delete_insns_since (last);
1721           }
1722       }
1723
1724   /* If operation is commutative,
1725      try to make the first operand a register.
1726      Even better, try to make it the same as the target.
1727      Also try to make the last operand a constant.  */
1728   if (commutative_optab_p (binoptab)
1729       && swap_commutative_operands_with_target (target, op0, op1))
1730     {
1731       temp = op1;
1732       op1 = op0;
1733       op0 = temp;
1734     }
1735
1736   /* These can be done a word at a time.  */
1737   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1738       && mclass == MODE_INT
1739       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1740       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1741     {
1742       int i;
1743       rtx_insn *insns;
1744
1745       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1746          won't be accurate, so use a new target.  */
1747       if (target == 0
1748           || target == op0
1749           || target == op1
1750           || !valid_multiword_target_p (target))
1751         target = gen_reg_rtx (mode);
1752
1753       start_sequence ();
1754
1755       /* Do the actual arithmetic.  */
1756       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1757         {
1758           rtx target_piece = operand_subword (target, i, 1, mode);
1759           rtx x = expand_binop (word_mode, binoptab,
1760                                 operand_subword_force (op0, i, mode),
1761                                 operand_subword_force (op1, i, mode),
1762                                 target_piece, unsignedp, next_methods);
1763
1764           if (x == 0)
1765             break;
1766
1767           if (target_piece != x)
1768             emit_move_insn (target_piece, x);
1769         }
1770
1771       insns = get_insns ();
1772       end_sequence ();
1773
1774       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1775         {
1776           emit_insn (insns);
1777           return target;
1778         }
1779     }
1780
1781   /* Synthesize double word shifts from single word shifts.  */
1782   if ((binoptab == lshr_optab || binoptab == ashl_optab
1783        || binoptab == ashr_optab)
1784       && mclass == MODE_INT
1785       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1786       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1787       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1788       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1789       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1790       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1791     {
1792       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1793       enum machine_mode op1_mode;
1794
1795       double_shift_mask = targetm.shift_truncation_mask (mode);
1796       shift_mask = targetm.shift_truncation_mask (word_mode);
1797       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1798
1799       /* Apply the truncation to constant shifts.  */
1800       if (double_shift_mask > 0 && CONST_INT_P (op1))
1801         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1802
1803       if (op1 == CONST0_RTX (op1_mode))
1804         return op0;
1805
1806       /* Make sure that this is a combination that expand_doubleword_shift
1807          can handle.  See the comments there for details.  */
1808       if (double_shift_mask == 0
1809           || (shift_mask == BITS_PER_WORD - 1
1810               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1811         {
1812           rtx_insn *insns;
1813           rtx into_target, outof_target;
1814           rtx into_input, outof_input;
1815           int left_shift, outof_word;
1816
1817           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1818              won't be accurate, so use a new target.  */
1819           if (target == 0
1820               || target == op0
1821               || target == op1
1822               || !valid_multiword_target_p (target))
1823             target = gen_reg_rtx (mode);
1824
1825           start_sequence ();
1826
1827           /* OUTOF_* is the word we are shifting bits away from, and
1828              INTO_* is the word that we are shifting bits towards, thus
1829              they differ depending on the direction of the shift and
1830              WORDS_BIG_ENDIAN.  */
1831
1832           left_shift = binoptab == ashl_optab;
1833           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1834
1835           outof_target = operand_subword (target, outof_word, 1, mode);
1836           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1837
1838           outof_input = operand_subword_force (op0, outof_word, mode);
1839           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1840
1841           if (expand_doubleword_shift (op1_mode, binoptab,
1842                                        outof_input, into_input, op1,
1843                                        outof_target, into_target,
1844                                        unsignedp, next_methods, shift_mask))
1845             {
1846               insns = get_insns ();
1847               end_sequence ();
1848
1849               emit_insn (insns);
1850               return target;
1851             }
1852           end_sequence ();
1853         }
1854     }
1855
1856   /* Synthesize double word rotates from single word shifts.  */
1857   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1858       && mclass == MODE_INT
1859       && CONST_INT_P (op1)
1860       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1861       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1862       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1863     {
1864       rtx_insn *insns;
1865       rtx into_target, outof_target;
1866       rtx into_input, outof_input;
1867       rtx inter;
1868       int shift_count, left_shift, outof_word;
1869
1870       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1871          won't be accurate, so use a new target. Do this also if target is not
1872          a REG, first because having a register instead may open optimization
1873          opportunities, and second because if target and op0 happen to be MEMs
1874          designating the same location, we would risk clobbering it too early
1875          in the code sequence we generate below.  */
1876       if (target == 0
1877           || target == op0
1878           || target == op1
1879           || !REG_P (target)
1880           || !valid_multiword_target_p (target))
1881         target = gen_reg_rtx (mode);
1882
1883       start_sequence ();
1884
1885       shift_count = INTVAL (op1);
1886
1887       /* OUTOF_* is the word we are shifting bits away from, and
1888          INTO_* is the word that we are shifting bits towards, thus
1889          they differ depending on the direction of the shift and
1890          WORDS_BIG_ENDIAN.  */
1891
1892       left_shift = (binoptab == rotl_optab);
1893       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1894
1895       outof_target = operand_subword (target, outof_word, 1, mode);
1896       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1897
1898       outof_input = operand_subword_force (op0, outof_word, mode);
1899       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1900
1901       if (shift_count == BITS_PER_WORD)
1902         {
1903           /* This is just a word swap.  */
1904           emit_move_insn (outof_target, into_input);
1905           emit_move_insn (into_target, outof_input);
1906           inter = const0_rtx;
1907         }
1908       else
1909         {
1910           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1911           rtx first_shift_count, second_shift_count;
1912           optab reverse_unsigned_shift, unsigned_shift;
1913
1914           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1915                                     ? lshr_optab : ashl_optab);
1916
1917           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1918                             ? ashl_optab : lshr_optab);
1919
1920           if (shift_count > BITS_PER_WORD)
1921             {
1922               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1923               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1924             }
1925           else
1926             {
1927               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1928               second_shift_count = GEN_INT (shift_count);
1929             }
1930
1931           into_temp1 = expand_binop (word_mode, unsigned_shift,
1932                                      outof_input, first_shift_count,
1933                                      NULL_RTX, unsignedp, next_methods);
1934           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1935                                      into_input, second_shift_count,
1936                                      NULL_RTX, unsignedp, next_methods);
1937
1938           if (into_temp1 != 0 && into_temp2 != 0)
1939             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1940                                   into_target, unsignedp, next_methods);
1941           else
1942             inter = 0;
1943
1944           if (inter != 0 && inter != into_target)
1945             emit_move_insn (into_target, inter);
1946
1947           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1948                                       into_input, first_shift_count,
1949                                       NULL_RTX, unsignedp, next_methods);
1950           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1951                                       outof_input, second_shift_count,
1952                                       NULL_RTX, unsignedp, next_methods);
1953
1954           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1955             inter = expand_binop (word_mode, ior_optab,
1956                                   outof_temp1, outof_temp2,
1957                                   outof_target, unsignedp, next_methods);
1958
1959           if (inter != 0 && inter != outof_target)
1960             emit_move_insn (outof_target, inter);
1961         }
1962
1963       insns = get_insns ();
1964       end_sequence ();
1965
1966       if (inter != 0)
1967         {
1968           emit_insn (insns);
1969           return target;
1970         }
1971     }
1972
1973   /* These can be done a word at a time by propagating carries.  */
1974   if ((binoptab == add_optab || binoptab == sub_optab)
1975       && mclass == MODE_INT
1976       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1977       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1978     {
1979       unsigned int i;
1980       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1981       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1982       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1983       rtx xop0, xop1, xtarget;
1984
1985       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1986          value is one of those, use it.  Otherwise, use 1 since it is the
1987          one easiest to get.  */
1988 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1989       int normalizep = STORE_FLAG_VALUE;
1990 #else
1991       int normalizep = 1;
1992 #endif
1993
1994       /* Prepare the operands.  */
1995       xop0 = force_reg (mode, op0);
1996       xop1 = force_reg (mode, op1);
1997
1998       xtarget = gen_reg_rtx (mode);
1999
2000       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
2001         target = xtarget;
2002
2003       /* Indicate for flow that the entire target reg is being set.  */
2004       if (REG_P (target))
2005         emit_clobber (xtarget);
2006
2007       /* Do the actual arithmetic.  */
2008       for (i = 0; i < nwords; i++)
2009         {
2010           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
2011           rtx target_piece = operand_subword (xtarget, index, 1, mode);
2012           rtx op0_piece = operand_subword_force (xop0, index, mode);
2013           rtx op1_piece = operand_subword_force (xop1, index, mode);
2014           rtx x;
2015
2016           /* Main add/subtract of the input operands.  */
2017           x = expand_binop (word_mode, binoptab,
2018                             op0_piece, op1_piece,
2019                             target_piece, unsignedp, next_methods);
2020           if (x == 0)
2021             break;
2022
2023           if (i + 1 < nwords)
2024             {
2025               /* Store carry from main add/subtract.  */
2026               carry_out = gen_reg_rtx (word_mode);
2027               carry_out = emit_store_flag_force (carry_out,
2028                                                  (binoptab == add_optab
2029                                                   ? LT : GT),
2030                                                  x, op0_piece,
2031                                                  word_mode, 1, normalizep);
2032             }
2033
2034           if (i > 0)
2035             {
2036               rtx newx;
2037
2038               /* Add/subtract previous carry to main result.  */
2039               newx = expand_binop (word_mode,
2040                                    normalizep == 1 ? binoptab : otheroptab,
2041                                    x, carry_in,
2042                                    NULL_RTX, 1, next_methods);
2043
2044               if (i + 1 < nwords)
2045                 {
2046                   /* Get out carry from adding/subtracting carry in.  */
2047                   rtx carry_tmp = gen_reg_rtx (word_mode);
2048                   carry_tmp = emit_store_flag_force (carry_tmp,
2049                                                      (binoptab == add_optab
2050                                                       ? LT : GT),
2051                                                      newx, x,
2052                                                      word_mode, 1, normalizep);
2053
2054                   /* Logical-ior the two poss. carry together.  */
2055                   carry_out = expand_binop (word_mode, ior_optab,
2056                                             carry_out, carry_tmp,
2057                                             carry_out, 0, next_methods);
2058                   if (carry_out == 0)
2059                     break;
2060                 }
2061               emit_move_insn (target_piece, newx);
2062             }
2063           else
2064             {
2065               if (x != target_piece)
2066                 emit_move_insn (target_piece, x);
2067             }
2068
2069           carry_in = carry_out;
2070         }
2071
2072       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2073         {
2074           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2075               || ! rtx_equal_p (target, xtarget))
2076             {
2077               rtx temp = emit_move_insn (target, xtarget);
2078
2079               set_dst_reg_note (temp, REG_EQUAL,
2080                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2081                                                 mode, copy_rtx (xop0),
2082                                                 copy_rtx (xop1)),
2083                                 target);
2084             }
2085           else
2086             target = xtarget;
2087
2088           return target;
2089         }
2090
2091       else
2092         delete_insns_since (last);
2093     }
2094
2095   /* Attempt to synthesize double word multiplies using a sequence of word
2096      mode multiplications.  We first attempt to generate a sequence using a
2097      more efficient unsigned widening multiply, and if that fails we then
2098      try using a signed widening multiply.  */
2099
2100   if (binoptab == smul_optab
2101       && mclass == MODE_INT
2102       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2103       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2104       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2105     {
2106       rtx product = NULL_RTX;
2107       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2108             != CODE_FOR_nothing)
2109         {
2110           product = expand_doubleword_mult (mode, op0, op1, target,
2111                                             true, methods);
2112           if (!product)
2113             delete_insns_since (last);
2114         }
2115
2116       if (product == NULL_RTX
2117           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2118                 != CODE_FOR_nothing)
2119         {
2120           product = expand_doubleword_mult (mode, op0, op1, target,
2121                                             false, methods);
2122           if (!product)
2123             delete_insns_since (last);
2124         }
2125
2126       if (product != NULL_RTX)
2127         {
2128           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2129             {
2130               temp = emit_move_insn (target ? target : product, product);
2131               set_dst_reg_note (temp,
2132                                 REG_EQUAL,
2133                                 gen_rtx_fmt_ee (MULT, mode,
2134                                                 copy_rtx (op0),
2135                                                 copy_rtx (op1)),
2136                                 target ? target : product);
2137             }
2138           return product;
2139         }
2140     }
2141
2142   /* It can't be open-coded in this mode.
2143      Use a library call if one is available and caller says that's ok.  */
2144
2145   libfunc = optab_libfunc (binoptab, mode);
2146   if (libfunc
2147       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2148     {
2149       rtx_insn *insns;
2150       rtx op1x = op1;
2151       enum machine_mode op1_mode = mode;
2152       rtx value;
2153
2154       start_sequence ();
2155
2156       if (shift_optab_p (binoptab))
2157         {
2158           op1_mode = targetm.libgcc_shift_count_mode ();
2159           /* Specify unsigned here,
2160              since negative shift counts are meaningless.  */
2161           op1x = convert_to_mode (op1_mode, op1, 1);
2162         }
2163
2164       if (GET_MODE (op0) != VOIDmode
2165           && GET_MODE (op0) != mode)
2166         op0 = convert_to_mode (mode, op0, unsignedp);
2167
2168       /* Pass 1 for NO_QUEUE so we don't lose any increments
2169          if the libcall is cse'd or moved.  */
2170       value = emit_library_call_value (libfunc,
2171                                        NULL_RTX, LCT_CONST, mode, 2,
2172                                        op0, mode, op1x, op1_mode);
2173
2174       insns = get_insns ();
2175       end_sequence ();
2176
2177       target = gen_reg_rtx (mode);
2178       emit_libcall_block_1 (insns, target, value,
2179                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2180                                             mode, op0, op1),
2181                             trapv_binoptab_p (binoptab));
2182
2183       return target;
2184     }
2185
2186   delete_insns_since (last);
2187
2188   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2189
2190   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2191          || methods == OPTAB_MUST_WIDEN))
2192     {
2193       /* Caller says, don't even try.  */
2194       delete_insns_since (entry_last);
2195       return 0;
2196     }
2197
2198   /* Compute the value of METHODS to pass to recursive calls.
2199      Don't allow widening to be tried recursively.  */
2200
2201   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2202
2203   /* Look for a wider mode of the same class for which it appears we can do
2204      the operation.  */
2205
2206   if (CLASS_HAS_WIDER_MODES_P (mclass))
2207     {
2208       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2209            wider_mode != VOIDmode;
2210            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2211         {
2212           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2213                   != CODE_FOR_nothing
2214               || (methods == OPTAB_LIB
2215                   && optab_libfunc (binoptab, wider_mode)))
2216             {
2217               rtx xop0 = op0, xop1 = op1;
2218               int no_extend = 0;
2219
2220               /* For certain integer operations, we need not actually extend
2221                  the narrow operands, as long as we will truncate
2222                  the results to the same narrowness.  */
2223
2224               if ((binoptab == ior_optab || binoptab == and_optab
2225                    || binoptab == xor_optab
2226                    || binoptab == add_optab || binoptab == sub_optab
2227                    || binoptab == smul_optab || binoptab == ashl_optab)
2228                   && mclass == MODE_INT)
2229                 no_extend = 1;
2230
2231               xop0 = widen_operand (xop0, wider_mode, mode,
2232                                     unsignedp, no_extend);
2233
2234               /* The second operand of a shift must always be extended.  */
2235               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2236                                     no_extend && binoptab != ashl_optab);
2237
2238               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2239                                    unsignedp, methods);
2240               if (temp)
2241                 {
2242                   if (mclass != MODE_INT
2243                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2244                     {
2245                       if (target == 0)
2246                         target = gen_reg_rtx (mode);
2247                       convert_move (target, temp, 0);
2248                       return target;
2249                     }
2250                   else
2251                     return gen_lowpart (mode, temp);
2252                 }
2253               else
2254                 delete_insns_since (last);
2255             }
2256         }
2257     }
2258
2259   delete_insns_since (entry_last);
2260   return 0;
2261 }
2262 \f
2263 /* Expand a binary operator which has both signed and unsigned forms.
2264    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2265    signed operations.
2266
2267    If we widen unsigned operands, we may use a signed wider operation instead
2268    of an unsigned wider operation, since the result would be the same.  */
2269
2270 rtx
2271 sign_expand_binop (enum machine_mode mode, optab uoptab, optab soptab,
2272                    rtx op0, rtx op1, rtx target, int unsignedp,
2273                    enum optab_methods methods)
2274 {
2275   rtx temp;
2276   optab direct_optab = unsignedp ? uoptab : soptab;
2277   bool save_enable;
2278
2279   /* Do it without widening, if possible.  */
2280   temp = expand_binop (mode, direct_optab, op0, op1, target,
2281                        unsignedp, OPTAB_DIRECT);
2282   if (temp || methods == OPTAB_DIRECT)
2283     return temp;
2284
2285   /* Try widening to a signed int.  Disable any direct use of any
2286      signed insn in the current mode.  */
2287   save_enable = swap_optab_enable (soptab, mode, false);
2288
2289   temp = expand_binop (mode, soptab, op0, op1, target,
2290                        unsignedp, OPTAB_WIDEN);
2291
2292   /* For unsigned operands, try widening to an unsigned int.  */
2293   if (!temp && unsignedp)
2294     temp = expand_binop (mode, uoptab, op0, op1, target,
2295                          unsignedp, OPTAB_WIDEN);
2296   if (temp || methods == OPTAB_WIDEN)
2297     goto egress;
2298
2299   /* Use the right width libcall if that exists.  */
2300   temp = expand_binop (mode, direct_optab, op0, op1, target,
2301                        unsignedp, OPTAB_LIB);
2302   if (temp || methods == OPTAB_LIB)
2303     goto egress;
2304
2305   /* Must widen and use a libcall, use either signed or unsigned.  */
2306   temp = expand_binop (mode, soptab, op0, op1, target,
2307                        unsignedp, methods);
2308   if (!temp && unsignedp)
2309     temp = expand_binop (mode, uoptab, op0, op1, target,
2310                          unsignedp, methods);
2311
2312  egress:
2313   /* Undo the fiddling above.  */
2314   if (save_enable)
2315     swap_optab_enable (soptab, mode, true);
2316   return temp;
2317 }
2318 \f
2319 /* Generate code to perform an operation specified by UNOPPTAB
2320    on operand OP0, with two results to TARG0 and TARG1.
2321    We assume that the order of the operands for the instruction
2322    is TARG0, TARG1, OP0.
2323
2324    Either TARG0 or TARG1 may be zero, but what that means is that
2325    the result is not actually wanted.  We will generate it into
2326    a dummy pseudo-reg and discard it.  They may not both be zero.
2327
2328    Returns 1 if this operation can be performed; 0 if not.  */
2329
2330 int
2331 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2332                     int unsignedp)
2333 {
2334   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2335   enum mode_class mclass;
2336   enum machine_mode wider_mode;
2337   rtx_insn *entry_last = get_last_insn ();
2338   rtx_insn *last;
2339
2340   mclass = GET_MODE_CLASS (mode);
2341
2342   if (!targ0)
2343     targ0 = gen_reg_rtx (mode);
2344   if (!targ1)
2345     targ1 = gen_reg_rtx (mode);
2346
2347   /* Record where to go back to if we fail.  */
2348   last = get_last_insn ();
2349
2350   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2351     {
2352       struct expand_operand ops[3];
2353       enum insn_code icode = optab_handler (unoptab, mode);
2354
2355       create_fixed_operand (&ops[0], targ0);
2356       create_fixed_operand (&ops[1], targ1);
2357       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2358       if (maybe_expand_insn (icode, 3, ops))
2359         return 1;
2360     }
2361
2362   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2363
2364   if (CLASS_HAS_WIDER_MODES_P (mclass))
2365     {
2366       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2367            wider_mode != VOIDmode;
2368            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2369         {
2370           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2371             {
2372               rtx t0 = gen_reg_rtx (wider_mode);
2373               rtx t1 = gen_reg_rtx (wider_mode);
2374               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2375
2376               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2377                 {
2378                   convert_move (targ0, t0, unsignedp);
2379                   convert_move (targ1, t1, unsignedp);
2380                   return 1;
2381                 }
2382               else
2383                 delete_insns_since (last);
2384             }
2385         }
2386     }
2387
2388   delete_insns_since (entry_last);
2389   return 0;
2390 }
2391 \f
2392 /* Generate code to perform an operation specified by BINOPTAB
2393    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2394    We assume that the order of the operands for the instruction
2395    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2396    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2397
2398    Either TARG0 or TARG1 may be zero, but what that means is that
2399    the result is not actually wanted.  We will generate it into
2400    a dummy pseudo-reg and discard it.  They may not both be zero.
2401
2402    Returns 1 if this operation can be performed; 0 if not.  */
2403
2404 int
2405 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2406                      int unsignedp)
2407 {
2408   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2409   enum mode_class mclass;
2410   enum machine_mode wider_mode;
2411   rtx_insn *entry_last = get_last_insn ();
2412   rtx_insn *last;
2413
2414   mclass = GET_MODE_CLASS (mode);
2415
2416   if (!targ0)
2417     targ0 = gen_reg_rtx (mode);
2418   if (!targ1)
2419     targ1 = gen_reg_rtx (mode);
2420
2421   /* Record where to go back to if we fail.  */
2422   last = get_last_insn ();
2423
2424   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2425     {
2426       struct expand_operand ops[4];
2427       enum insn_code icode = optab_handler (binoptab, mode);
2428       enum machine_mode mode0 = insn_data[icode].operand[1].mode;
2429       enum machine_mode mode1 = insn_data[icode].operand[2].mode;
2430       rtx xop0 = op0, xop1 = op1;
2431
2432       /* If we are optimizing, force expensive constants into a register.  */
2433       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2434       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2435
2436       create_fixed_operand (&ops[0], targ0);
2437       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2438       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2439       create_fixed_operand (&ops[3], targ1);
2440       if (maybe_expand_insn (icode, 4, ops))
2441         return 1;
2442       delete_insns_since (last);
2443     }
2444
2445   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2446
2447   if (CLASS_HAS_WIDER_MODES_P (mclass))
2448     {
2449       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2450            wider_mode != VOIDmode;
2451            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2452         {
2453           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2454             {
2455               rtx t0 = gen_reg_rtx (wider_mode);
2456               rtx t1 = gen_reg_rtx (wider_mode);
2457               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2458               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2459
2460               if (expand_twoval_binop (binoptab, cop0, cop1,
2461                                        t0, t1, unsignedp))
2462                 {
2463                   convert_move (targ0, t0, unsignedp);
2464                   convert_move (targ1, t1, unsignedp);
2465                   return 1;
2466                 }
2467               else
2468                 delete_insns_since (last);
2469             }
2470         }
2471     }
2472
2473   delete_insns_since (entry_last);
2474   return 0;
2475 }
2476
2477 /* Expand the two-valued library call indicated by BINOPTAB, but
2478    preserve only one of the values.  If TARG0 is non-NULL, the first
2479    value is placed into TARG0; otherwise the second value is placed
2480    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2481    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2482    This routine assumes that the value returned by the library call is
2483    as if the return value was of an integral mode twice as wide as the
2484    mode of OP0.  Returns 1 if the call was successful.  */
2485
2486 bool
2487 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2488                              rtx targ0, rtx targ1, enum rtx_code code)
2489 {
2490   enum machine_mode mode;
2491   enum machine_mode libval_mode;
2492   rtx libval;
2493   rtx_insn *insns;
2494   rtx libfunc;
2495
2496   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2497   gcc_assert (!targ0 != !targ1);
2498
2499   mode = GET_MODE (op0);
2500   libfunc = optab_libfunc (binoptab, mode);
2501   if (!libfunc)
2502     return false;
2503
2504   /* The value returned by the library function will have twice as
2505      many bits as the nominal MODE.  */
2506   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2507                                         MODE_INT);
2508   start_sequence ();
2509   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2510                                     libval_mode, 2,
2511                                     op0, mode,
2512                                     op1, mode);
2513   /* Get the part of VAL containing the value that we want.  */
2514   libval = simplify_gen_subreg (mode, libval, libval_mode,
2515                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2516   insns = get_insns ();
2517   end_sequence ();
2518   /* Move the into the desired location.  */
2519   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2520                       gen_rtx_fmt_ee (code, mode, op0, op1));
2521
2522   return true;
2523 }
2524
2525 \f
2526 /* Wrapper around expand_unop which takes an rtx code to specify
2527    the operation to perform, not an optab pointer.  All other
2528    arguments are the same.  */
2529 rtx
2530 expand_simple_unop (enum machine_mode mode, enum rtx_code code, rtx op0,
2531                     rtx target, int unsignedp)
2532 {
2533   optab unop = code_to_optab (code);
2534   gcc_assert (unop);
2535
2536   return expand_unop (mode, unop, op0, target, unsignedp);
2537 }
2538
2539 /* Try calculating
2540         (clz:narrow x)
2541    as
2542         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2543
2544    A similar operation can be used for clrsb.  UNOPTAB says which operation
2545    we are trying to expand.  */
2546 static rtx
2547 widen_leading (enum machine_mode mode, rtx op0, rtx target, optab unoptab)
2548 {
2549   enum mode_class mclass = GET_MODE_CLASS (mode);
2550   if (CLASS_HAS_WIDER_MODES_P (mclass))
2551     {
2552       enum machine_mode wider_mode;
2553       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2554            wider_mode != VOIDmode;
2555            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2556         {
2557           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2558             {
2559               rtx xop0, temp;
2560               rtx_insn *last;
2561
2562               last = get_last_insn ();
2563
2564               if (target == 0)
2565                 target = gen_reg_rtx (mode);
2566               xop0 = widen_operand (op0, wider_mode, mode,
2567                                     unoptab != clrsb_optab, false);
2568               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2569                                   unoptab != clrsb_optab);
2570               if (temp != 0)
2571                 temp = expand_binop
2572                   (wider_mode, sub_optab, temp,
2573                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2574                                  - GET_MODE_PRECISION (mode),
2575                                  wider_mode),
2576                    target, true, OPTAB_DIRECT);
2577               if (temp == 0)
2578                 delete_insns_since (last);
2579
2580               return temp;
2581             }
2582         }
2583     }
2584   return 0;
2585 }
2586
2587 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2588    quantities, choosing which based on whether the high word is nonzero.  */
2589 static rtx
2590 expand_doubleword_clz (enum machine_mode mode, rtx op0, rtx target)
2591 {
2592   rtx xop0 = force_reg (mode, op0);
2593   rtx subhi = gen_highpart (word_mode, xop0);
2594   rtx sublo = gen_lowpart (word_mode, xop0);
2595   rtx_code_label *hi0_label = gen_label_rtx ();
2596   rtx_code_label *after_label = gen_label_rtx ();
2597   rtx_insn *seq;
2598   rtx temp, result;
2599
2600   /* If we were not given a target, use a word_mode register, not a
2601      'mode' register.  The result will fit, and nobody is expecting
2602      anything bigger (the return type of __builtin_clz* is int).  */
2603   if (!target)
2604     target = gen_reg_rtx (word_mode);
2605
2606   /* In any case, write to a word_mode scratch in both branches of the
2607      conditional, so we can ensure there is a single move insn setting
2608      'target' to tag a REG_EQUAL note on.  */
2609   result = gen_reg_rtx (word_mode);
2610
2611   start_sequence ();
2612
2613   /* If the high word is not equal to zero,
2614      then clz of the full value is clz of the high word.  */
2615   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2616                            word_mode, true, hi0_label);
2617
2618   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2619   if (!temp)
2620     goto fail;
2621
2622   if (temp != result)
2623     convert_move (result, temp, true);
2624
2625   emit_jump_insn (gen_jump (after_label));
2626   emit_barrier ();
2627
2628   /* Else clz of the full value is clz of the low word plus the number
2629      of bits in the high word.  */
2630   emit_label (hi0_label);
2631
2632   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2633   if (!temp)
2634     goto fail;
2635   temp = expand_binop (word_mode, add_optab, temp,
2636                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2637                        result, true, OPTAB_DIRECT);
2638   if (!temp)
2639     goto fail;
2640   if (temp != result)
2641     convert_move (result, temp, true);
2642
2643   emit_label (after_label);
2644   convert_move (target, result, true);
2645
2646   seq = get_insns ();
2647   end_sequence ();
2648
2649   add_equal_note (seq, target, CLZ, xop0, 0);
2650   emit_insn (seq);
2651   return target;
2652
2653  fail:
2654   end_sequence ();
2655   return 0;
2656 }
2657
2658 /* Try calculating
2659         (bswap:narrow x)
2660    as
2661         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2662 static rtx
2663 widen_bswap (enum machine_mode mode, rtx op0, rtx target)
2664 {
2665   enum mode_class mclass = GET_MODE_CLASS (mode);
2666   enum machine_mode wider_mode;
2667   rtx x;
2668   rtx_insn *last;
2669
2670   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2671     return NULL_RTX;
2672
2673   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2674        wider_mode != VOIDmode;
2675        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2676     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2677       goto found;
2678   return NULL_RTX;
2679
2680  found:
2681   last = get_last_insn ();
2682
2683   x = widen_operand (op0, wider_mode, mode, true, true);
2684   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2685
2686   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2687               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2688   if (x != 0)
2689     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2690                       GET_MODE_BITSIZE (wider_mode)
2691                       - GET_MODE_BITSIZE (mode),
2692                       NULL_RTX, true);
2693
2694   if (x != 0)
2695     {
2696       if (target == 0)
2697         target = gen_reg_rtx (mode);
2698       emit_move_insn (target, gen_lowpart (mode, x));
2699     }
2700   else
2701     delete_insns_since (last);
2702
2703   return target;
2704 }
2705
2706 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2707
2708 static rtx
2709 expand_doubleword_bswap (enum machine_mode mode, rtx op, rtx target)
2710 {
2711   rtx t0, t1;
2712
2713   t1 = expand_unop (word_mode, bswap_optab,
2714                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2715   t0 = expand_unop (word_mode, bswap_optab,
2716                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2717
2718   if (target == 0 || !valid_multiword_target_p (target))
2719     target = gen_reg_rtx (mode);
2720   if (REG_P (target))
2721     emit_clobber (target);
2722   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2723   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2724
2725   return target;
2726 }
2727
2728 /* Try calculating (parity x) as (and (popcount x) 1), where
2729    popcount can also be done in a wider mode.  */
2730 static rtx
2731 expand_parity (enum machine_mode mode, rtx op0, rtx target)
2732 {
2733   enum mode_class mclass = GET_MODE_CLASS (mode);
2734   if (CLASS_HAS_WIDER_MODES_P (mclass))
2735     {
2736       enum machine_mode wider_mode;
2737       for (wider_mode = mode; wider_mode != VOIDmode;
2738            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2739         {
2740           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2741             {
2742               rtx xop0, temp;
2743               rtx_insn *last;
2744
2745               last = get_last_insn ();
2746
2747               if (target == 0)
2748                 target = gen_reg_rtx (mode);
2749               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2750               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2751                                   true);
2752               if (temp != 0)
2753                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2754                                      target, true, OPTAB_DIRECT);
2755               if (temp == 0)
2756                 delete_insns_since (last);
2757
2758               return temp;
2759             }
2760         }
2761     }
2762   return 0;
2763 }
2764
2765 /* Try calculating ctz(x) as K - clz(x & -x) ,
2766    where K is GET_MODE_PRECISION(mode) - 1.
2767
2768    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2769    don't have to worry about what the hardware does in that case.  (If
2770    the clz instruction produces the usual value at 0, which is K, the
2771    result of this code sequence will be -1; expand_ffs, below, relies
2772    on this.  It might be nice to have it be K instead, for consistency
2773    with the (very few) processors that provide a ctz with a defined
2774    value, but that would take one more instruction, and it would be
2775    less convenient for expand_ffs anyway.  */
2776
2777 static rtx
2778 expand_ctz (enum machine_mode mode, rtx op0, rtx target)
2779 {
2780   rtx_insn *seq;
2781   rtx temp;
2782
2783   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2784     return 0;
2785
2786   start_sequence ();
2787
2788   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2789   if (temp)
2790     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2791                          true, OPTAB_DIRECT);
2792   if (temp)
2793     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2794   if (temp)
2795     temp = expand_binop (mode, sub_optab,
2796                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2797                          temp, target,
2798                          true, OPTAB_DIRECT);
2799   if (temp == 0)
2800     {
2801       end_sequence ();
2802       return 0;
2803     }
2804
2805   seq = get_insns ();
2806   end_sequence ();
2807
2808   add_equal_note (seq, temp, CTZ, op0, 0);
2809   emit_insn (seq);
2810   return temp;
2811 }
2812
2813
2814 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2815    else with the sequence used by expand_clz.
2816
2817    The ffs builtin promises to return zero for a zero value and ctz/clz
2818    may have an undefined value in that case.  If they do not give us a
2819    convenient value, we have to generate a test and branch.  */
2820 static rtx
2821 expand_ffs (enum machine_mode mode, rtx op0, rtx target)
2822 {
2823   HOST_WIDE_INT val = 0;
2824   bool defined_at_zero = false;
2825   rtx temp;
2826   rtx_insn *seq;
2827
2828   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2829     {
2830       start_sequence ();
2831
2832       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2833       if (!temp)
2834         goto fail;
2835
2836       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2837     }
2838   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2839     {
2840       start_sequence ();
2841       temp = expand_ctz (mode, op0, 0);
2842       if (!temp)
2843         goto fail;
2844
2845       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2846         {
2847           defined_at_zero = true;
2848           val = (GET_MODE_PRECISION (mode) - 1) - val;
2849         }
2850     }
2851   else
2852     return 0;
2853
2854   if (defined_at_zero && val == -1)
2855     /* No correction needed at zero.  */;
2856   else
2857     {
2858       /* We don't try to do anything clever with the situation found
2859          on some processors (eg Alpha) where ctz(0:mode) ==
2860          bitsize(mode).  If someone can think of a way to send N to -1
2861          and leave alone all values in the range 0..N-1 (where N is a
2862          power of two), cheaper than this test-and-branch, please add it.
2863
2864          The test-and-branch is done after the operation itself, in case
2865          the operation sets condition codes that can be recycled for this.
2866          (This is true on i386, for instance.)  */
2867
2868       rtx_code_label *nonzero_label = gen_label_rtx ();
2869       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2870                                mode, true, nonzero_label);
2871
2872       convert_move (temp, GEN_INT (-1), false);
2873       emit_label (nonzero_label);
2874     }
2875
2876   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2877      to produce a value in the range 0..bitsize.  */
2878   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2879                        target, false, OPTAB_DIRECT);
2880   if (!temp)
2881     goto fail;
2882
2883   seq = get_insns ();
2884   end_sequence ();
2885
2886   add_equal_note (seq, temp, FFS, op0, 0);
2887   emit_insn (seq);
2888   return temp;
2889
2890  fail:
2891   end_sequence ();
2892   return 0;
2893 }
2894
2895 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2896    conditions, VAL may already be a SUBREG against which we cannot generate
2897    a further SUBREG.  In this case, we expect forcing the value into a
2898    register will work around the situation.  */
2899
2900 static rtx
2901 lowpart_subreg_maybe_copy (enum machine_mode omode, rtx val,
2902                            enum machine_mode imode)
2903 {
2904   rtx ret;
2905   ret = lowpart_subreg (omode, val, imode);
2906   if (ret == NULL)
2907     {
2908       val = force_reg (imode, val);
2909       ret = lowpart_subreg (omode, val, imode);
2910       gcc_assert (ret != NULL);
2911     }
2912   return ret;
2913 }
2914
2915 /* Expand a floating point absolute value or negation operation via a
2916    logical operation on the sign bit.  */
2917
2918 static rtx
2919 expand_absneg_bit (enum rtx_code code, enum machine_mode mode,
2920                    rtx op0, rtx target)
2921 {
2922   const struct real_format *fmt;
2923   int bitpos, word, nwords, i;
2924   enum machine_mode imode;
2925   rtx temp;
2926   rtx_insn *insns;
2927
2928   /* The format has to have a simple sign bit.  */
2929   fmt = REAL_MODE_FORMAT (mode);
2930   if (fmt == NULL)
2931     return NULL_RTX;
2932
2933   bitpos = fmt->signbit_rw;
2934   if (bitpos < 0)
2935     return NULL_RTX;
2936
2937   /* Don't create negative zeros if the format doesn't support them.  */
2938   if (code == NEG && !fmt->has_signed_zero)
2939     return NULL_RTX;
2940
2941   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2942     {
2943       imode = int_mode_for_mode (mode);
2944       if (imode == BLKmode)
2945         return NULL_RTX;
2946       word = 0;
2947       nwords = 1;
2948     }
2949   else
2950     {
2951       imode = word_mode;
2952
2953       if (FLOAT_WORDS_BIG_ENDIAN)
2954         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2955       else
2956         word = bitpos / BITS_PER_WORD;
2957       bitpos = bitpos % BITS_PER_WORD;
2958       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2959     }
2960
2961   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2962   if (code == ABS)
2963     mask = ~mask;
2964
2965   if (target == 0
2966       || target == op0
2967       || (nwords > 1 && !valid_multiword_target_p (target)))
2968     target = gen_reg_rtx (mode);
2969
2970   if (nwords > 1)
2971     {
2972       start_sequence ();
2973
2974       for (i = 0; i < nwords; ++i)
2975         {
2976           rtx targ_piece = operand_subword (target, i, 1, mode);
2977           rtx op0_piece = operand_subword_force (op0, i, mode);
2978
2979           if (i == word)
2980             {
2981               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2982                                    op0_piece,
2983                                    immed_wide_int_const (mask, imode),
2984                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2985               if (temp != targ_piece)
2986                 emit_move_insn (targ_piece, temp);
2987             }
2988           else
2989             emit_move_insn (targ_piece, op0_piece);
2990         }
2991
2992       insns = get_insns ();
2993       end_sequence ();
2994
2995       emit_insn (insns);
2996     }
2997   else
2998     {
2999       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
3000                            gen_lowpart (imode, op0),
3001                            immed_wide_int_const (mask, imode),
3002                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3003       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3004
3005       set_dst_reg_note (get_last_insn (), REG_EQUAL,
3006                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
3007                         target);
3008     }
3009
3010   return target;
3011 }
3012
3013 /* As expand_unop, but will fail rather than attempt the operation in a
3014    different mode or with a libcall.  */
3015 static rtx
3016 expand_unop_direct (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3017              int unsignedp)
3018 {
3019   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
3020     {
3021       struct expand_operand ops[2];
3022       enum insn_code icode = optab_handler (unoptab, mode);
3023       rtx_insn *last = get_last_insn ();
3024       rtx pat;
3025
3026       create_output_operand (&ops[0], target, mode);
3027       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3028       pat = maybe_gen_insn (icode, 2, ops);
3029       if (pat)
3030         {
3031           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3032               && ! add_equal_note (pat, ops[0].value, optab_to_code (unoptab),
3033                                    ops[1].value, NULL_RTX))
3034             {
3035               delete_insns_since (last);
3036               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3037             }
3038
3039           emit_insn (pat);
3040
3041           return ops[0].value;
3042         }
3043     }
3044   return 0;
3045 }
3046
3047 /* Generate code to perform an operation specified by UNOPTAB
3048    on operand OP0, with result having machine-mode MODE.
3049
3050    UNSIGNEDP is for the case where we have to widen the operands
3051    to perform the operation.  It says to use zero-extension.
3052
3053    If TARGET is nonzero, the value
3054    is generated there, if it is convenient to do so.
3055    In all cases an rtx is returned for the locus of the value;
3056    this may or may not be TARGET.  */
3057
3058 rtx
3059 expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3060              int unsignedp)
3061 {
3062   enum mode_class mclass = GET_MODE_CLASS (mode);
3063   enum machine_mode wider_mode;
3064   rtx temp;
3065   rtx libfunc;
3066
3067   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3068   if (temp)
3069     return temp;
3070
3071   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3072
3073   /* Widening (or narrowing) clz needs special treatment.  */
3074   if (unoptab == clz_optab)
3075     {
3076       temp = widen_leading (mode, op0, target, unoptab);
3077       if (temp)
3078         return temp;
3079
3080       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3081           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3082         {
3083           temp = expand_doubleword_clz (mode, op0, target);
3084           if (temp)
3085             return temp;
3086         }
3087
3088       goto try_libcall;
3089     }
3090
3091   if (unoptab == clrsb_optab)
3092     {
3093       temp = widen_leading (mode, op0, target, unoptab);
3094       if (temp)
3095         return temp;
3096       goto try_libcall;
3097     }
3098
3099   /* Widening (or narrowing) bswap needs special treatment.  */
3100   if (unoptab == bswap_optab)
3101     {
3102       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3103          or ROTATERT.  First try these directly; if this fails, then try the
3104          obvious pair of shifts with allowed widening, as this will probably
3105          be always more efficient than the other fallback methods.  */
3106       if (mode == HImode)
3107         {
3108           rtx_insn *last;
3109           rtx temp1, temp2;
3110
3111           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3112             {
3113               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3114                                    unsignedp, OPTAB_DIRECT);
3115               if (temp)
3116                 return temp;
3117              }
3118
3119           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3120             {
3121               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3122                                    unsignedp, OPTAB_DIRECT);
3123               if (temp)
3124                 return temp;
3125             }
3126
3127           last = get_last_insn ();
3128
3129           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3130                                 unsignedp, OPTAB_WIDEN);
3131           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3132                                 unsignedp, OPTAB_WIDEN);
3133           if (temp1 && temp2)
3134             {
3135               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3136                                    unsignedp, OPTAB_WIDEN);
3137               if (temp)
3138                 return temp;
3139             }
3140
3141           delete_insns_since (last);
3142         }
3143
3144       temp = widen_bswap (mode, op0, target);
3145       if (temp)
3146         return temp;
3147
3148       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3149           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3150         {
3151           temp = expand_doubleword_bswap (mode, op0, target);
3152           if (temp)
3153             return temp;
3154         }
3155
3156       goto try_libcall;
3157     }
3158
3159   if (CLASS_HAS_WIDER_MODES_P (mclass))
3160     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3161          wider_mode != VOIDmode;
3162          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3163       {
3164         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3165           {
3166             rtx xop0 = op0;
3167             rtx_insn *last = get_last_insn ();
3168
3169             /* For certain operations, we need not actually extend
3170                the narrow operand, as long as we will truncate the
3171                results to the same narrowness.  */
3172
3173             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3174                                   (unoptab == neg_optab
3175                                    || unoptab == one_cmpl_optab)
3176                                   && mclass == MODE_INT);
3177
3178             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3179                                 unsignedp);
3180
3181             if (temp)
3182               {
3183                 if (mclass != MODE_INT
3184                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3185                   {
3186                     if (target == 0)
3187                       target = gen_reg_rtx (mode);
3188                     convert_move (target, temp, 0);
3189                     return target;
3190                   }
3191                 else
3192                   return gen_lowpart (mode, temp);
3193               }
3194             else
3195               delete_insns_since (last);
3196           }
3197       }
3198
3199   /* These can be done a word at a time.  */
3200   if (unoptab == one_cmpl_optab
3201       && mclass == MODE_INT
3202       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3203       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3204     {
3205       int i;
3206       rtx_insn *insns;
3207
3208       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3209         target = gen_reg_rtx (mode);
3210
3211       start_sequence ();
3212
3213       /* Do the actual arithmetic.  */
3214       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3215         {
3216           rtx target_piece = operand_subword (target, i, 1, mode);
3217           rtx x = expand_unop (word_mode, unoptab,
3218                                operand_subword_force (op0, i, mode),
3219                                target_piece, unsignedp);
3220
3221           if (target_piece != x)
3222             emit_move_insn (target_piece, x);
3223         }
3224
3225       insns = get_insns ();
3226       end_sequence ();
3227
3228       emit_insn (insns);
3229       return target;
3230     }
3231
3232   if (optab_to_code (unoptab) == NEG)
3233     {
3234       /* Try negating floating point values by flipping the sign bit.  */
3235       if (SCALAR_FLOAT_MODE_P (mode))
3236         {
3237           temp = expand_absneg_bit (NEG, mode, op0, target);
3238           if (temp)
3239             return temp;
3240         }
3241
3242       /* If there is no negation pattern, and we have no negative zero,
3243          try subtracting from zero.  */
3244       if (!HONOR_SIGNED_ZEROS (mode))
3245         {
3246           temp = expand_binop (mode, (unoptab == negv_optab
3247                                       ? subv_optab : sub_optab),
3248                                CONST0_RTX (mode), op0, target,
3249                                unsignedp, OPTAB_DIRECT);
3250           if (temp)
3251             return temp;
3252         }
3253     }
3254
3255   /* Try calculating parity (x) as popcount (x) % 2.  */
3256   if (unoptab == parity_optab)
3257     {
3258       temp = expand_parity (mode, op0, target);
3259       if (temp)
3260         return temp;
3261     }
3262
3263   /* Try implementing ffs (x) in terms of clz (x).  */
3264   if (unoptab == ffs_optab)
3265     {
3266       temp = expand_ffs (mode, op0, target);
3267       if (temp)
3268         return temp;
3269     }
3270
3271   /* Try implementing ctz (x) in terms of clz (x).  */
3272   if (unoptab == ctz_optab)
3273     {
3274       temp = expand_ctz (mode, op0, target);
3275       if (temp)
3276         return temp;
3277     }
3278
3279  try_libcall:
3280   /* Now try a library call in this mode.  */
3281   libfunc = optab_libfunc (unoptab, mode);
3282   if (libfunc)
3283     {
3284       rtx_insn *insns;
3285       rtx value;
3286       rtx eq_value;
3287       enum machine_mode outmode = mode;
3288
3289       /* All of these functions return small values.  Thus we choose to
3290          have them return something that isn't a double-word.  */
3291       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3292           || unoptab == clrsb_optab || unoptab == popcount_optab
3293           || unoptab == parity_optab)
3294         outmode
3295           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3296                                           optab_libfunc (unoptab, mode)));
3297
3298       start_sequence ();
3299
3300       /* Pass 1 for NO_QUEUE so we don't lose any increments
3301          if the libcall is cse'd or moved.  */
3302       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3303                                        1, op0, mode);
3304       insns = get_insns ();
3305       end_sequence ();
3306
3307       target = gen_reg_rtx (outmode);
3308       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3309       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3310         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3311       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3312         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3313       emit_libcall_block_1 (insns, target, value, eq_value,
3314                             trapv_unoptab_p (unoptab));
3315
3316       return target;
3317     }
3318
3319   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3320
3321   if (CLASS_HAS_WIDER_MODES_P (mclass))
3322     {
3323       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3324            wider_mode != VOIDmode;
3325            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3326         {
3327           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3328               || optab_libfunc (unoptab, wider_mode))
3329             {
3330               rtx xop0 = op0;
3331               rtx_insn *last = get_last_insn ();
3332
3333               /* For certain operations, we need not actually extend
3334                  the narrow operand, as long as we will truncate the
3335                  results to the same narrowness.  */
3336               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3337                                     (unoptab == neg_optab
3338                                      || unoptab == one_cmpl_optab
3339                                      || unoptab == bswap_optab)
3340                                     && mclass == MODE_INT);
3341
3342               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3343                                   unsignedp);
3344
3345               /* If we are generating clz using wider mode, adjust the
3346                  result.  Similarly for clrsb.  */
3347               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3348                   && temp != 0)
3349                 temp = expand_binop
3350                   (wider_mode, sub_optab, temp,
3351                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3352                                  - GET_MODE_PRECISION (mode),
3353                                  wider_mode),
3354                    target, true, OPTAB_DIRECT);
3355
3356               /* Likewise for bswap.  */
3357               if (unoptab == bswap_optab && temp != 0)
3358                 {
3359                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3360                               == GET_MODE_BITSIZE (wider_mode)
3361                               && GET_MODE_PRECISION (mode)
3362                                  == GET_MODE_BITSIZE (mode));
3363
3364                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3365                                        GET_MODE_BITSIZE (wider_mode)
3366                                        - GET_MODE_BITSIZE (mode),
3367                                        NULL_RTX, true);
3368                 }
3369
3370               if (temp)
3371                 {
3372                   if (mclass != MODE_INT)
3373                     {
3374                       if (target == 0)
3375                         target = gen_reg_rtx (mode);
3376                       convert_move (target, temp, 0);
3377                       return target;
3378                     }
3379                   else
3380                     return gen_lowpart (mode, temp);
3381                 }
3382               else
3383                 delete_insns_since (last);
3384             }
3385         }
3386     }
3387
3388   /* One final attempt at implementing negation via subtraction,
3389      this time allowing widening of the operand.  */
3390   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3391     {
3392       rtx temp;
3393       temp = expand_binop (mode,
3394                            unoptab == negv_optab ? subv_optab : sub_optab,
3395                            CONST0_RTX (mode), op0,
3396                            target, unsignedp, OPTAB_LIB_WIDEN);
3397       if (temp)
3398         return temp;
3399     }
3400
3401   return 0;
3402 }
3403 \f
3404 /* Emit code to compute the absolute value of OP0, with result to
3405    TARGET if convenient.  (TARGET may be 0.)  The return value says
3406    where the result actually is to be found.
3407
3408    MODE is the mode of the operand; the mode of the result is
3409    different but can be deduced from MODE.
3410
        RESULT_UNSIGNEDP is forced to 1 unless MODE is of class MODE_INT
        and flag_trapv is set.  When it is zero the "v" optabs (absv_optab,
        negv_optab, subv_optab) are used in place of abs_optab, neg_optab
        and sub_optab.

        The strategies below are tried in order: an abs instruction,
        clearing the sign bit (scalar float modes only), MAX (x, -x), and
        a shift/xor/subtract sequence.  NULL_RTX is returned if none of
        them succeeds; expand_abs then falls back to a conditional jump.
3411  */
3412
3413 rtx
3414 expand_abs_nojump (enum machine_mode mode, rtx op0, rtx target,
3415                    int result_unsignedp)
3416 {
3417   rtx temp;
3418
       /* The "v" optabs are only selected for integer modes when
          flag_trapv is set; in every other case behave as if the caller
          had asked for the plain variants.  */
3419   if (GET_MODE_CLASS (mode) != MODE_INT
3420       || ! flag_trapv)
3421     result_unsignedp = 1;
3422
3423   /* First try to do it with a special abs instruction.  */
3424   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3425                       op0, target, 0);
3426   if (temp != 0)
3427     return temp;
3428
3429   /* For floating point modes, try clearing the sign bit.  */
3430   if (SCALAR_FLOAT_MODE_P (mode))
3431     {
3432       temp = expand_absneg_bit (ABS, mode, op0, target);
3433       if (temp)
3434         return temp;
3435     }
3436
3437   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3438   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3439       && !HONOR_SIGNED_ZEROS (mode))
3440     {
           /* Remember where we are so that a partially emitted sequence
              can be discarded if either step fails.  */
3441       rtx_insn *last = get_last_insn ();
3442
3443       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3444                           op0, NULL_RTX, 0);
3445       if (temp != 0)
3446         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3447                              OPTAB_WIDEN);
3448
3449       if (temp != 0)
3450         return temp;
3451
3452       delete_insns_since (last);
3453     }
3454
3455   /* If this machine has expensive jumps, we can do integer absolute
3456      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3457      where W is the width of MODE.  */
3458
3459   if (GET_MODE_CLASS (mode) == MODE_INT
3460       && BRANCH_COST (optimize_insn_for_speed_p (),
3461                       false) >= 2)
3462     {
           /* EXTENDED is OP0 shifted right by W-1 with UNSIGNEDP == 0.
              NOTE(review): unlike the MAX path above, insns emitted here
              are not removed with delete_insns_since if a later
              expand_binop fails -- confirm that this is intended.  */
3463       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3464                                    GET_MODE_PRECISION (mode) - 1,
3465                                    NULL_RTX, 0);
3466
3467       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3468                            OPTAB_LIB_WIDEN);
3469       if (temp != 0)
3470         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3471                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3472
3473       if (temp != 0)
3474         return temp;
3475     }
3476
3477   return NULL_RTX;
3478 }
3479
     /* Emit code to compute the absolute value of OP0 in mode MODE, with
        result to TARGET if convenient, and return where the result is.
        expand_abs_nojump is tried first; if it fails, OP0 is copied to the
        result, compared against zero and negated under a conditional jump.

        RESULT_UNSIGNEDP is forced to 1 unless MODE is of class MODE_INT
        and flag_trapv is set; when it is zero, negv_optab is used for the
        negation instead of neg_optab.

        SAFE nonzero says TARGET may be used to hold the intermediate copy
        of OP0.  It is also treated as set when TARGET is OP0 itself and is
        a pseudo register.  A fresh pseudo is used instead when TARGET is 0,
        SAFE is zero, TARGET's mode is not MODE, TARGET is a volatile MEM,
        or TARGET is a hard register.  */
3480 rtx
3481 expand_abs (enum machine_mode mode, rtx op0, rtx target,
3482             int result_unsignedp, int safe)
3483 {
3484   rtx temp;
3485   rtx_code_label *op1;
3486
3487   if (GET_MODE_CLASS (mode) != MODE_INT
3488       || ! flag_trapv)
3489     result_unsignedp = 1;
3490
3491   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3492   if (temp != 0)
3493     return temp;
3494
3495   /* If that does not win, use conditional jump and negate.  */
3496
3497   /* It is safe to use the target if it is the same
3498      as the source if this is also a pseudo register */
3499   if (op0 == target && REG_P (op0)
3500       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3501     safe = 1;
3502
       /* OP1 is the label placed after the negation.  */
3503   op1 = gen_label_rtx ();
3504   if (target == 0 || ! safe
3505       || GET_MODE (target) != mode
3506       || (MEM_P (target) && MEM_VOLATILE_P (target))
3507       || (REG_P (target)
3508           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3509     target = gen_reg_rtx (mode);
3510
3511   emit_move_insn (target, op0);
3512   NO_DEFER_POP;
3513
       /* Compare TARGET against zero with GE and branch to OP1, so that the
          negation below is skipped for values that are already
          non-negative.  */
3514   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3515                            NULL_RTX, NULL_RTX, op1, -1);
3516
       /* Negate in place; if expand_unop put the result elsewhere, copy it
          back into TARGET.  */
3517   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3518                      target, target, 0);
3519   if (op0 != target)
3520     emit_move_insn (target, op0);
3521   emit_label (op1);
3522   OK_DEFER_POP;
3523   return target;
3524 }
3525
3526 /* Emit code to compute the one's complement absolute value of OP0
3527    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3528    (TARGET may be NULL_RTX.)  The return value says where the result
3529    actually is to be found.
3530
3531    MODE is the mode of the operand; the mode of the result is
3532    different but can be deduced from MODE.

        NULL_RTX is returned when MODE is a floating point mode, or when
        neither the MAX (x, ~x) nor the shift/xor strategy below could be
        expanded.  */
3533
3534 rtx
3535 expand_one_cmpl_abs_nojump (enum machine_mode mode, rtx op0, rtx target)
3536 {
3537   rtx temp;
3538
3539   /* Not applicable for floating point modes.  */
3540   if (FLOAT_MODE_P (mode))
3541     return NULL_RTX;
3542
3543   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3544   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3545     {
           /* Remember where we are so that a partially emitted sequence
              can be discarded if either step fails.  */
3546       rtx_insn *last = get_last_insn ();
3547
3548       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3549       if (temp != 0)
3550         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3551                              OPTAB_WIDEN);
3552
3553       if (temp != 0)
3554         return temp;
3555
3556       delete_insns_since (last);
3557     }
3558
3559   /* If this machine has expensive jumps, we can do one's complement
3560      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3561
3562   if (GET_MODE_CLASS (mode) == MODE_INT
3563       && BRANCH_COST (optimize_insn_for_speed_p (),
3564                      false) >= 2)
3565     {
           /* EXTENDED is OP0 shifted right by W-1 with UNSIGNEDP == 0.
              NOTE(review): the shift is not removed with
              delete_insns_since if the xor below fails -- confirm that
              this is intended.  */
3566       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3567                                    GET_MODE_PRECISION (mode) - 1,
3568                                    NULL_RTX, 0);
3569
3570       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3571                            OPTAB_LIB_WIDEN);
3572
3573       if (temp != 0)
3574         return temp;
3575     }
3576
3577   return NULL_RTX;
3578 }
3579
3580 /* A subroutine of expand_copysign, perform the copysign operation using the
3581    abs and neg primitives advertised to exist on the target.  The assumption
3582    is that we have a split register file, and leaving op0 in fp registers,
3583    and not playing with subregs so much, will help the register allocator.

        MODE is the mode of OP0 and OP1.  BITPOS is the position of the sign
        bit; it is only used when the target has no signbit pattern for MODE.
        OP0_IS_ABS is true if OP0 is known to have its sign bit clear, in
        which case no abs is emitted.

        The emitted code computes |OP0| into the result, tests the sign bit
        of OP1, and negates the result when that bit is set.  Returns the
        rtx holding the result, or NULL_RTX if MODE has no corresponding
        integer mode or the abs could not be expanded.  */
3584
3585 static rtx
3586 expand_copysign_absneg (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3587                         int bitpos, bool op0_is_abs)
3588 {
3589   enum machine_mode imode;
3590   enum insn_code icode;
3591   rtx sign;
3592   rtx_code_label *label;
3593
       /* Do not reuse OP1 as the destination.  */
3594   if (target == op1)
3595     target = NULL_RTX;
3596
3597   /* Check if the back end provides an insn that handles signbit for the
3598      argument's mode. */
3599   icode = optab_handler (signbit_optab, mode);
3600   if (icode != CODE_FOR_nothing)
3601     {
           /* The signbit pattern's output operand determines IMODE.  */
3602       imode = insn_data[(int) icode].operand[0].mode;
3603       sign = gen_reg_rtx (imode);
3604       emit_unop_insn (icode, sign, op1, UNKNOWN);
3605     }
3606   else
3607     {
           /* No signbit insn: view OP1 (or the word of it that holds the
              sign bit) as an integer and mask out everything but that
              bit.  */
3608       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3609         {
3610           imode = int_mode_for_mode (mode);
3611           if (imode == BLKmode)
3612             return NULL_RTX;
3613           op1 = gen_lowpart (imode, op1);
3614         }
3615       else
3616         {
3617           int word;
3618
               /* Pick the word containing the sign bit and reduce BITPOS
                  to a position within that word.  */
3619           imode = word_mode;
3620           if (FLOAT_WORDS_BIG_ENDIAN)
3621             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3622           else
3623             word = bitpos / BITS_PER_WORD;
3624           bitpos = bitpos % BITS_PER_WORD;
3625           op1 = operand_subword_force (op1, word, mode);
3626         }
3627
3628       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3629       sign = expand_binop (imode, and_optab, op1,
3630                            immed_wide_int_const (mask, imode),
3631                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3632     }
3633
       /* Arrange for TARGET to hold OP0 with its sign bit clear.  */
3634   if (!op0_is_abs)
3635     {
3636       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3637       if (op0 == NULL)
3638         return NULL_RTX;
3639       target = op0;
3640     }
3641   else
3642     {
3643       if (target == NULL_RTX)
3644         target = copy_to_reg (op0);
3645       else
3646         emit_move_insn (target, op0);
3647     }
3648
       /* Branch to LABEL, skipping the negation, when SIGN equals zero.  */
3649   label = gen_label_rtx ();
3650   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3651
       /* A floating-point constant is negated at compile time; anything
          else is negated with the target's neg pattern.  */
3652   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3653     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3654   else
3655     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3656   if (op0 != target)
3657     emit_move_insn (target, op0);
3658
3659   emit_label (label);
3660
3661   return target;
3662 }
3663
3664
3665 /* A subroutine of expand_copysign, perform the entire copysign operation
3666    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3667    is true if op0 is known to have its sign bit clear.

        MODE is the mode of OP0 and OP1.  With MASK having only the sign bit
        set, the value computed is (OP0 & ~MASK) | (OP1 & MASK); the masking
        of OP0 is omitted when OP0_IS_ABS.  Values wider than a word are
        processed a word at a time, and only the word holding the sign bit
        is combined -- the others are copied from OP0.

        Returns the rtx holding the result, or NULL_RTX if MODE fits in a
        word but has no corresponding integer mode.  */
3668
3669 static rtx
3670 expand_copysign_bit (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3671                      int bitpos, bool op0_is_abs)
3672 {
3673   enum machine_mode imode;
3674   int word, nwords, i;
3675   rtx temp;
3676   rtx_insn *insns;
3677
3678   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3679     {
           /* Single-word case: operate on the whole value in the integer
              mode corresponding to MODE.  */
3680       imode = int_mode_for_mode (mode);
3681       if (imode == BLKmode)
3682         return NULL_RTX;
3683       word = 0;
3684       nwords = 1;
3685     }
3686   else
3687     {
           /* Multiword case: WORD is the index of the word containing the
              sign bit, and BITPOS becomes the position within that
              word.  */
3688       imode = word_mode;
3689
3690       if (FLOAT_WORDS_BIG_ENDIAN)
3691         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3692       else
3693         word = bitpos / BITS_PER_WORD;
3694       bitpos = bitpos % BITS_PER_WORD;
3695       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3696     }
3697
3698   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3699
       /* Use a fresh pseudo rather than a TARGET that is missing, is one
          of the inputs, or is not a valid multiword target.  */
3700   if (target == 0
3701       || target == op0
3702       || target == op1
3703       || (nwords > 1 && !valid_multiword_target_p (target)))
3704     target = gen_reg_rtx (mode);
3705
3706   if (nwords > 1)
3707     {
           /* Collect the per-word insns in their own sequence and emit
              them together afterwards.  */
3708       start_sequence ();
3709
3710       for (i = 0; i < nwords; ++i)
3711         {
3712           rtx targ_piece = operand_subword (target, i, 1, mode);
3713           rtx op0_piece = operand_subword_force (op0, i, mode);
3714
3715           if (i == word)
3716             {
                   /* This word holds the sign bit: clear it in OP0's word
                      (unless already known clear), isolate it in OP1's
                      word, and IOR the two.  */
3717               if (!op0_is_abs)
3718                 op0_piece
3719                   = expand_binop (imode, and_optab, op0_piece,
3720                                   immed_wide_int_const (~mask, imode),
3721                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3722               op1 = expand_binop (imode, and_optab,
3723                                   operand_subword_force (op1, i, mode),
3724                                   immed_wide_int_const (mask, imode),
3725                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3726
3727               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3728                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3729               if (temp != targ_piece)
3730                 emit_move_insn (targ_piece, temp);
3731             }
3732           else
                 /* Every other word is taken unchanged from OP0.  */
3733             emit_move_insn (targ_piece, op0_piece);
3734         }
3735
3736       insns = get_insns ();
3737       end_sequence ();
3738
3739       emit_insn (insns);
3740     }
3741   else
3742     {
           /* Single word: (OP0 & ~MASK) | (OP1 & MASK), computed in IMODE
              and then viewed again in MODE.  */
3743       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3744                           immed_wide_int_const (mask, imode),
3745                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3746
3747       op0 = gen_lowpart (imode, op0);
3748       if (!op0_is_abs)
3749         op0 = expand_binop (imode, and_optab, op0,
3750                             immed_wide_int_const (~mask, imode),
3751                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3752
3753       temp = expand_binop (imode, ior_optab, op0, op1,
3754                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3755       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3756     }
3757
3758   return target;
3759 }
3760
3761 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3762    scalar floating point mode.  Return NULL if we do not know how to
3763    expand the operation inline.

        TARGET is a suggested place for the result and is passed on to
        whichever strategy is used.  The strategies, in order, are: a
        direct copysign_optab pattern, expand_copysign_absneg (abs plus a
        conditional neg), and expand_copysign_bit (integer bit masking).
        Nothing beyond the direct pattern is attempted when MODE has no
        real format or that format has no signed zero.  */
3764
3765 rtx
3766 expand_copysign (rtx op0, rtx op1, rtx target)
3767 {
3768   enum machine_mode mode = GET_MODE (op0);
3769   const struct real_format *fmt;
3770   bool op0_is_abs;
3771   rtx temp;
3772
3773   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3774   gcc_assert (GET_MODE (op1) == mode);
3775
3776   /* First try to do it with a special instruction.  */
3777   temp = expand_binop (mode, copysign_optab, op0, op1,
3778                        target, 0, OPTAB_DIRECT);
3779   if (temp)
3780     return temp;
3781
3782   fmt = REAL_MODE_FORMAT (mode);
3783   if (fmt == NULL || !fmt->has_signed_zero)
3784     return NULL_RTX;
3785
       /* A floating-point constant OP0 is made non-negative at compile
          time, so the helpers need not clear its sign bit at run time.  */
3786   op0_is_abs = false;
3787   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3788     {
3789       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3790         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3791       op0_is_abs = true;
3792     }
3793
       /* Try abs/neg when the format gives a sign bit position for
          reading (signbit_ro >= 0) and either OP0 is a constant or the
          target has both neg and abs patterns for MODE.  */
3794   if (fmt->signbit_ro >= 0
3795       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3796           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3797               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3798     {
3799       temp = expand_copysign_absneg (mode, op0, op1, target,
3800                                      fmt->signbit_ro, op0_is_abs);
3801       if (temp)
3802         return temp;
3803     }
3804
       /* The bit-mask fallback uses signbit_rw as the sign bit position;
          give up if the format does not provide one.  */
3805   if (fmt->signbit_rw < 0)
3806     return NULL_RTX;
3807   return expand_copysign_bit (mode, op0, op1, target,
3808                               fmt->signbit_rw, op0_is_abs);
3809 }
3810 \f
3811 /* Generate an instruction whose insn-code is ICODE,
3812    with two operands: an output TARGET and an input OP0.
3813    TARGET *must* be nonzero, and the output is always stored there.
3814    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3815    the value that is stored into TARGET.
3816
3817    Return false if expansion failed.  */
3818
3819 bool
3820 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3821                       enum rtx_code code)
3822 {
3823   struct expand_operand ops[2];
3824   rtx pat;
3825
       /* Operand 0 is the output and operand 1 the input, each described
          with the mode of the rtx supplied by the caller.  */
3826   create_output_operand (&ops[0], target, GET_MODE (target));
3827   create_input_operand (&ops[1], op0, GET_MODE (op0));
3828   pat = maybe_gen_insn (icode, 2, ops);
3829   if (!pat)
3830     return false;
3831
       /* When the generated pattern consists of more than one insn and
          CODE is not UNKNOWN, call add_equal_note so that (CODE OP0) is
          recorded as the value being computed.  */
3832   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX && code != UNKNOWN)
3833     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3834
3835   emit_insn (pat);
3836
       /* The output operand that was actually used may differ from TARGET;
          if so, copy the result into TARGET.  */
3837   if (ops[0].value != target)
3838     emit_move_insn (target, ops[0].value);
3839   return true;
3840 }
3841 /* Generate an instruction whose insn-code is ICODE,
3842    with two operands: an output TARGET and an input OP0.
3843    TARGET *must* be nonzero, and the output is always stored there.
3844    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3845    the value that is stored into TARGET.

        This is maybe_emit_unop_insn followed by an assertion that the
        expansion succeeded.  */
3846
3847 void
3848 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3849 {
       /* The call is kept outside gcc_assert and its result stored in OK,
          so the insn is emitted regardless of how the assertion is
          compiled.  */
3850   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3851   gcc_assert (ok);
3852 }
3853 \f
3854 struct no_conflict_data
3855 {
       /* State handed to no_conflict_move_test through the note_stores
          callback argument.  */

       /* The rtx whose overlap with a store destination forces the insn
          to stay in the libcall block.  */
3856   rtx target;
       /* FIRST is the head of the insn list being examined; INSN is the
          insn whose stores are currently being checked.  */
3857   rtx_insn *first, *insn;
       /* Result: set to true by no_conflict_move_test when INSN must
          remain in the list.  */
3858   bool must_stay;
3859 };
3860
3861 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3862    the currently examined clobber / store has to stay in the list of
3863    insns that constitute the actual libcall block.

        DEST is the location being stored to or clobbered, SET is the
        expression doing so, and P0 points to a struct no_conflict_data.
        P->must_stay is only ever set here, never cleared, so the caller
        must initialize it.  */
3864 static void
3865 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3866 {
3867   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3868
3869   /* If this insn directly contributes to setting the target, it must stay.  */
3870   if (reg_overlap_mentioned_p (p->target, dest))
3871     p->must_stay = true;
3872   /* If we haven't committed to keeping any other insns in the list yet,
3873      there is nothing more to check.  */
3874   else if (p->insn == p->first)
3875     return;
3876   /* If this insn sets / clobbers a register that feeds one of the insns
3877      already in the list, this insn has to stay too.  */
3878   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3879            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3880            || reg_used_between_p (dest, p->first, p->insn)
3881            /* Likewise if this insn depends on a register set by a previous
3882               insn in the list, or if it sets a result (presumably a hard
3883               register) that is set or clobbered by a previous insn.
3884               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3885               SET_DEST perform the former check on the address, and the latter
3886               check on the MEM.  */
3887            || (GET_CODE (set) == SET
3888                && (modified_in_p (SET_SRC (set), p->first)
3889                    || modified_in_p (SET_DEST (set), p->first)
3890                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3891                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3892     p->must_stay = true;
3893 }
3894
3895 \f
3896 /* Emit code to make a call to a constant function or a library call.
3897
3898    INSNS is a list containing all insns emitted in the call.
3899    These insns leave the result in RESULT.  Our block is to copy RESULT
3900    to TARGET, which is logically equivalent to EQUIV.
3901
3902    We first emit any insns that set a pseudo on the assumption that these are
3903    loading constants into registers; doing so allows them to be safely cse'ed
3904    between blocks.  Then we emit all the other insns in the block, followed by
3905    an insn to move RESULT to TARGET.  This last insn will have a REG_EQUAL
3906    note with an operand of EQUIV.

        EQUIV_MAY_TRAP true says the operation should be treated as possibly
        trapping even if may_trap_p (EQUIV) does not say so.  It only
        matters when cfun->can_throw_non_call_exceptions is set.  */
3907
3908 static void
3909 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3910                       bool equiv_may_trap)
3911 {
3912   rtx final_dest = target;
3913   rtx_insn *next, *last, *insn;
3914
3915   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3916      into a MEM later.  Protect the libcall block from this change.  */
3917   if (! REG_P (target) || REG_USERVAR_P (target))
3918     target = gen_reg_rtx (GET_MODE (target));
3919
3920   /* If we're using non-call exceptions, a libcall corresponding to an
3921      operation that may trap may also trap.  */
3922   /* ??? See the comment in front of make_reg_eh_region_note.  */
3923   if (cfun->can_throw_non_call_exceptions
3924       && (equiv_may_trap || may_trap_p (equiv)))
3925     {
           /* On each call insn, remove a REG_EH_REGION note whose value is
              0 or INT_MIN; notes with other values are left alone.  */
3926       for (insn = insns; insn; insn = NEXT_INSN (insn))
3927         if (CALL_P (insn))
3928           {
3929             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3930             if (note)
3931               {
3932                 int lp_nr = INTVAL (XEXP (note, 0));
3933                 if (lp_nr == 0 || lp_nr == INT_MIN)
3934                   remove_note (insn, note);
3935               }
3936           }
3937     }
3938   else
3939     {
3940       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3941          reg note to indicate that this call cannot throw or execute a nonlocal
3942          goto (unless there is already a REG_EH_REGION note, in which case
3943          we update it).  */
3944       for (insn = insns; insn; insn = NEXT_INSN (insn))
3945         if (CALL_P (insn))
3946           make_reg_eh_region_note_nothrow_nononlocal (insn);
3947     }
3948
3949   /* First emit all insns that set pseudos.  Remove them from the list as
3950      we go.  Avoid insns that set pseudos which were referenced in previous
3951      insns.  These can be generated by move_by_pieces, for example,
3952      to update an address.  Similarly, avoid insns that reference things
3953      set in previous insns.  */
3954
3955   for (insn = insns; insn; insn = next)
3956     {
3957       rtx set = single_set (insn);
3958
           /* Fetch the successor now; INSN may be unlinked below.  */
3959       next = NEXT_INSN (insn);
3960
3961       if (set != 0 && REG_P (SET_DEST (set))
3962           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3963         {
3964           struct no_conflict_data data;
3965
               /* NOTE(review): with const0_rtx as the target, the
                  reg_overlap_mentioned_p (p->target, dest) test in
                  no_conflict_move_test presumably never fires, leaving
                  only the dependency checks -- confirm.  */
3966           data.target = const0_rtx;
3967           data.first = insns;
3968           data.insn = insn;
3969           data.must_stay = 0;
3970           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3971           if (! data.must_stay)
3972             {
                   /* Unlink INSN from the pending list (updating the list
                      head if INSN was first) and emit it right away.  */
3973               if (PREV_INSN (insn))
3974                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3975               else
3976                 insns = next;
3977
3978               if (next)
3979                 SET_PREV_INSN (next) = PREV_INSN (insn);
3980
3981               add_insn (insn);
3982             }
3983         }
3984
3985       /* Some ports use a loop to copy large arguments onto the stack.
3986          Don't move anything outside such a loop.  */
3987       if (LABEL_P (insn))
3988         break;
3989     }
3990
3991   /* Write the remaining insns followed by the final copy.  */
3992   for (insn = insns; insn; insn = next)
3993     {
3994       next = NEXT_INSN (insn);
3995
3996       add_insn (insn);
3997     }
3998
3999   last = emit_move_insn (target, result);
4000   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
4001
       /* If a temporary pseudo was substituted for the caller's TARGET at
          the top of the function, copy the value to the real destination
          now.  */
4002   if (final_dest != target)
4003     emit_move_insn (final_dest, target);
4004 }
4005
     /* Public entry point for emit_libcall_block_1: INSNS, TARGET, RESULT
        and EQUIV are passed through, with EQUIV_MAY_TRAP false.  INSNS is
        converted to rtx_insn * with safe_as_a.  */
4006 void
4007 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
4008 {
4009   emit_libcall_block_1 (safe_as_a <rtx_insn *> (insns),
4010                         target, result, equiv, false);
4011 }
4012 \f
4013 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
4014    PURPOSE describes how this comparison will be used.  CODE is the rtx
4015    comparison code we will be using.
4016
4017    ??? Actually, CODE is slightly weaker than that.  A target is still
4018    required to implement all of the normal bcc operations, but not
4019    required to implement all (or any) of the unordered bcc operations.

        MODE and each successively wider mode are tried in turn.  For
        ccp_jump the cbranch pattern must exist and accept the comparison
        as operand 0; for ccp_store_flag the cstore pattern must exist and
        accept it as operand 1; for ccp_cmov only the existence of a cmov
        pattern is checked.  Returns 1 on the first match and 0 if no mode
        qualifies.  */
4020
4021 int
4022 can_compare_p (enum rtx_code code, enum machine_mode mode,
4023                enum can_compare_purpose purpose)
4024 {
4025   rtx test;
       /* A dummy (CODE 0 0) comparison used only to probe the operand
          predicates; its mode is updated as wider modes are tried.  */
4026   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4027   do
4028     {
4029       enum insn_code icode;
4030
4031       if (purpose == ccp_jump
4032           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4033           && insn_operand_matches (icode, 0, test))
4034         return 1;
4035       if (purpose == ccp_store_flag
4036           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4037           && insn_operand_matches (icode, 1, test))
4038         return 1;
4039       if (purpose == ccp_cmov
4040           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4041         return 1;
4042
           /* Move on to the next wider mode; the loop ends when
              GET_MODE_WIDER_MODE yields VOIDmode.  */
4043       mode = GET_MODE_WIDER_MODE (mode);
4044       PUT_MODE (test, mode);
4045     }
4046   while (mode != VOIDmode);
4047
4048   return 0;
4049 }
4050
4051 /* This function is called when we are going to emit a compare instruction that
4052    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4053
4054    *PMODE is the mode of the inputs (in case they are const_int).
4055    *PUNSIGNEDP nonzero says that the operands are unsigned;
4056    this matters if they need to be widened (as given by METHODS).
4057
4058    If they have mode BLKmode, then SIZE specifies the size of both operands.
4059
4060    This function performs all the setup necessary so that the caller only has
4061    to emit a single comparison insn.  This setup can involve doing a BLKmode
4062    comparison or emitting a library call to perform the comparison if no insn
4063    is available to handle it.
4064    The values which are passed in through pointers can be modified; the caller
4065    should perform the comparison on the modified values.  Constant
4066    comparisons must have already been folded.  */
4067
4068 static void
4069 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4070                   int unsignedp, enum optab_methods methods,
4071                   rtx *ptest, enum machine_mode *pmode)
4072 {
4073   enum machine_mode mode = *pmode;
4074   rtx libfunc, test;
4075   enum machine_mode cmp_mode;
4076   enum mode_class mclass;
4077
4078   /* The other methods are not needed.  */
4079   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4080               || methods == OPTAB_LIB_WIDEN);
4081
4082   /* If we are optimizing, force expensive constants into a register.  */
4083   if (CONSTANT_P (x) && optimize
4084       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4085           > COSTS_N_INSNS (1)))
4086     x = force_reg (mode, x);
4087
4088   if (CONSTANT_P (y) && optimize
4089       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4090           > COSTS_N_INSNS (1)))
4091     y = force_reg (mode, y);
4092
4093 #ifdef HAVE_cc0
4094   /* Make sure that we have a canonical comparison.  The RTL
4095      documentation states that canonical comparisons are required only
4096      for targets which have cc0.  */
4097   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4098 #endif
4099
4100   /* Don't let both operands fail to indicate the mode.  */
4101   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4102     x = force_reg (mode, x);
4103   if (mode == VOIDmode)
4104     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4105
4106   /* Handle all BLKmode compares.  */
4107
4108   if (mode == BLKmode)
4109     {
4110       enum machine_mode result_mode;
4111       enum insn_code cmp_code;
4112       tree length_type;
4113       rtx libfunc;
4114       rtx result;
4115       rtx opalign
4116         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4117
4118       gcc_assert (size);
4119
4120       /* Try to use a memory block compare insn - either cmpstr
4121          or cmpmem will do.  */
4122       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4123            cmp_mode != VOIDmode;
4124            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4125         {
4126           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4127           if (cmp_code == CODE_FOR_nothing)
4128             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4129           if (cmp_code == CODE_FOR_nothing)
4130             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4131           if (cmp_code == CODE_FOR_nothing)
4132             continue;
4133
4134           /* Must make sure the size fits the insn's mode.  */
4135           if ((CONST_INT_P (size)
4136                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4137               || (GET_MODE_BITSIZE (GET_MODE (size))
4138                   > GET_MODE_BITSIZE (cmp_mode)))
4139             continue;
4140
4141           result_mode = insn_data[cmp_code].operand[0].mode;
4142           result = gen_reg_rtx (result_mode);
4143           size = convert_to_mode (cmp_mode, size, 1);
4144           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4145
4146           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4147           *pmode = result_mode;
4148           return;
4149         }
4150
4151       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4152         goto fail;
4153
4154       /* Otherwise call a library function, memcmp.  */
4155       libfunc = memcmp_libfunc;
4156       length_type = sizetype;
4157       result_mode = TYPE_MODE (integer_type_node);
4158       cmp_mode = TYPE_MODE (length_type);
4159       size = convert_to_mode (TYPE_MODE (length_type), size,
4160                               TYPE_UNSIGNED (length_type));
4161
4162       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4163                                         result_mode, 3,
4164                                         XEXP (x, 0), Pmode,
4165                                         XEXP (y, 0), Pmode,
4166                                         size, cmp_mode);
4167       x = result;
4168       y = const0_rtx;
4169       mode = result_mode;
4170       methods = OPTAB_LIB_WIDEN;
4171       unsignedp = false;
4172     }
4173
4174   /* Don't allow operands to the compare to trap, as that can put the
4175      compare and branch in different basic blocks.  */
4176   if (cfun->can_throw_non_call_exceptions)
4177     {
4178       if (may_trap_p (x))
4179         x = force_reg (mode, x);
4180       if (may_trap_p (y))
4181         y = force_reg (mode, y);
4182     }
4183
4184   if (GET_MODE_CLASS (mode) == MODE_CC)
4185     {
4186       gcc_assert (can_compare_p (comparison, CCmode, ccp_jump));
4187       *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4188       return;
4189     }
4190
4191   mclass = GET_MODE_CLASS (mode);
4192   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4193   cmp_mode = mode;
4194   do
4195    {
4196       enum insn_code icode;
4197       icode = optab_handler (cbranch_optab, cmp_mode);
4198       if (icode != CODE_FOR_nothing
4199           && insn_operand_matches (icode, 0, test))
4200         {
4201           rtx_insn *last = get_last_insn ();
4202           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4203           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4204           if (op0 && op1
4205               && insn_operand_matches (icode, 1, op0)
4206               && insn_operand_matches (icode, 2, op1))
4207             {
4208               XEXP (test, 0) = op0;
4209               XEXP (test, 1) = op1;
4210               *ptest = test;
4211               *pmode = cmp_mode;
4212               return;
4213             }
4214           delete_insns_since (last);
4215         }
4216
4217       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4218         break;
4219       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4220     }
4221   while (cmp_mode != VOIDmode);
4222
4223   if (methods != OPTAB_LIB_WIDEN)
4224     goto fail;
4225
4226   if (!SCALAR_FLOAT_MODE_P (mode))
4227     {
4228       rtx result;
4229       enum machine_mode ret_mode;
4230
4231       /* Handle a libcall just for the mode we are using.  */
4232       libfunc = optab_libfunc (cmp_optab, mode);
4233       gcc_assert (libfunc);
4234
4235       /* If we want unsigned, and this mode has a distinct unsigned
4236          comparison routine, use that.  */
4237       if (unsignedp)
4238         {
4239           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4240           if (ulibfunc)
4241             libfunc = ulibfunc;
4242         }
4243
4244       ret_mode = targetm.libgcc_cmp_return_mode ();
4245       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4246                                         ret_mode, 2, x, mode, y, mode);
4247
4248       /* There are two kinds of comparison routines. Biased routines
4249          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4250          of gcc expect that the comparison operation is equivalent
4251          to the modified comparison. For signed comparisons compare the
4252          result against 1 in the biased case, and zero in the unbiased
4253          case. For unsigned comparisons always compare against 1 after
4254          biasing the unbiased result by adding 1. This gives us a way to
4255          represent LTU.
4256          The comparisons in the fixed-point helper library are always
4257          biased.  */
4258       x = result;
4259       y = const1_rtx;
4260
4261       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4262         {
4263           if (unsignedp)
4264             x = plus_constant (ret_mode, result, 1);
4265           else
4266             y = const0_rtx;
4267         }
4268
4269       *pmode = word_mode;
4270       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4271                         ptest, pmode);
4272     }
4273   else
4274     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4275
4276   return;
4277
4278  fail:
4279   *ptest = NULL_RTX;
4280 }
4281
4282 /* Before emitting an insn with code ICODE, make sure that X, which is going
4283    to be used for operand OPNUM of the insn, is converted from mode MODE to
4284    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4285    that it is accepted by the operand predicate.  Return the new value.  */
4286
4287 rtx
4288 prepare_operand (enum insn_code icode, rtx x, int opnum, enum machine_mode mode,
4289                  enum machine_mode wider_mode, int unsignedp)
4290 {
4291   if (mode != wider_mode)
4292     x = convert_modes (wider_mode, mode, x, unsignedp);
4293
4294   if (!insn_operand_matches (icode, opnum, x))
4295     {
4296       if (reload_completed)
4297         return NULL_RTX;
4298       x = copy_to_mode_reg (insn_data[(int) icode].operand[opnum].mode, x);
4299     }
4300
4301   return x;
4302 }
4303
4304 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4305    we can do the branch.  */
4306
4307 static void
4308 emit_cmp_and_jump_insn_1 (rtx test, enum machine_mode mode, rtx label, int prob)
4309 {
4310   enum machine_mode optab_mode;
4311   enum mode_class mclass;
4312   enum insn_code icode;
4313   rtx_insn *insn;
4314
4315   mclass = GET_MODE_CLASS (mode);
4316   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4317   icode = optab_handler (cbranch_optab, optab_mode);
4318
4319   gcc_assert (icode != CODE_FOR_nothing);
4320   gcc_assert (insn_operand_matches (icode, 0, test));
4321   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4322                                           XEXP (test, 1), label));
4323   if (prob != -1
4324       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4325       && insn
4326       && JUMP_P (insn)
4327       && any_condjump_p (insn)
4328       && !find_reg_note (insn, REG_BR_PROB, 0))
4329     add_int_reg_note (insn, REG_BR_PROB, prob);
4330 }
4331
4332 /* Generate code to compare X with Y so that the condition codes are
4333    set and to jump to LABEL if the condition is true.  If X is a
4334    constant and Y is not a constant, then the comparison is swapped to
4335    ensure that the comparison RTL has the canonical form.
4336
4337    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4338    need to be widened.  UNSIGNEDP is also used to select the proper
4339    branch condition code.
4340
4341    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4342
4343    MODE is the mode of the inputs (in case they are const_int).
4344
4345    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4346    It will be potentially converted into an unsigned variant based on
4347    UNSIGNEDP to select a proper jump instruction.
4348
4349    PROB is the probability of jumping to LABEL.  */
4350
4351 void
4352 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4353                          enum machine_mode mode, int unsignedp, rtx label,
4354                          int prob)
4355 {
4356   rtx op0 = x, op1 = y;
4357   rtx test;
4358
4359   /* Swap operands and condition to ensure canonical RTL.  */
4360   if (swap_commutative_operands_p (x, y)
4361       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4362     {
4363       op0 = y, op1 = x;
4364       comparison = swap_condition (comparison);
4365     }
4366
4367   /* If OP0 is still a constant, then both X and Y must be constants
4368      or the opposite comparison is not supported.  Force X into a register
4369      to create canonical RTL.  */
4370   if (CONSTANT_P (op0))
4371     op0 = force_reg (mode, op0);
4372
4373   if (unsignedp)
4374     comparison = unsigned_condition (comparison);
4375
4376   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4377                     &test, &mode);
4378   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4379 }
4380
4381 \f
4382 /* Emit a library call comparison between floating point X and Y.
4383    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4384
4385 static void
4386 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4387                        rtx *ptest, enum machine_mode *pmode)
4388 {
4389   enum rtx_code swapped = swap_condition (comparison);
4390   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4391   enum machine_mode orig_mode = GET_MODE (x);
4392   enum machine_mode mode, cmp_mode;
4393   rtx true_rtx, false_rtx;
4394   rtx value, target, equiv;
4395   rtx_insn *insns;
4396   rtx libfunc = 0;
4397   bool reversed_p = false;
4398   cmp_mode = targetm.libgcc_cmp_return_mode ();
4399
4400   for (mode = orig_mode;
4401        mode != VOIDmode;
4402        mode = GET_MODE_WIDER_MODE (mode))
4403     {
4404       if (code_to_optab (comparison)
4405           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4406         break;
4407
4408       if (code_to_optab (swapped)
4409           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4410         {
4411           rtx tmp;
4412           tmp = x; x = y; y = tmp;
4413           comparison = swapped;
4414           break;
4415         }
4416
4417       if (code_to_optab (reversed)
4418           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4419         {
4420           comparison = reversed;
4421           reversed_p = true;
4422           break;
4423         }
4424     }
4425
4426   gcc_assert (mode != VOIDmode);
4427
4428   if (mode != orig_mode)
4429     {
4430       x = convert_to_mode (mode, x, 0);
4431       y = convert_to_mode (mode, y, 0);
4432     }
4433
4434   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4435      the RTL.  The allows the RTL optimizers to delete the libcall if the
4436      condition can be determined at compile-time.  */
4437   if (comparison == UNORDERED
4438       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4439     {
4440       true_rtx = const_true_rtx;
4441       false_rtx = const0_rtx;
4442     }
4443   else
4444     {
4445       switch (comparison)
4446         {
4447         case EQ:
4448           true_rtx = const0_rtx;
4449           false_rtx = const_true_rtx;
4450           break;
4451
4452         case NE:
4453           true_rtx = const_true_rtx;
4454           false_rtx = const0_rtx;
4455           break;
4456
4457         case GT:
4458           true_rtx = const1_rtx;
4459           false_rtx = const0_rtx;
4460           break;
4461
4462         case GE:
4463           true_rtx = const0_rtx;
4464           false_rtx = constm1_rtx;
4465           break;
4466
4467         case LT:
4468           true_rtx = constm1_rtx;
4469           false_rtx = const0_rtx;
4470           break;
4471
4472         case LE:
4473           true_rtx = const0_rtx;
4474           false_rtx = const1_rtx;
4475           break;
4476
4477         default:
4478           gcc_unreachable ();
4479         }
4480     }
4481
4482   if (comparison == UNORDERED)
4483     {
4484       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4485       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4486       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4487                                     temp, const_true_rtx, equiv);
4488     }
4489   else
4490     {
4491       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4492       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4493         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4494                                       equiv, true_rtx, false_rtx);
4495     }
4496
4497   start_sequence ();
4498   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4499                                    cmp_mode, 2, x, mode, y, mode);
4500   insns = get_insns ();
4501   end_sequence ();
4502
4503   target = gen_reg_rtx (cmp_mode);
4504   emit_libcall_block (insns, target, value, equiv);
4505
4506   if (comparison == UNORDERED
4507       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4508       || reversed_p)
4509     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4510   else
4511     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4512
4513   *pmode = cmp_mode;
4514 }
4515 \f
4516 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4517
4518 void
4519 emit_indirect_jump (rtx loc)
4520 {
4521   struct expand_operand ops[1];
4522
4523   create_address_operand (&ops[0], loc);
4524   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4525   emit_barrier ();
4526 }
4527 \f
4528 #ifdef HAVE_conditional_move
4529
4530 /* Emit a conditional move instruction if the machine supports one for that
4531    condition and machine mode.
4532
4533    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4534    the mode to use should they be constants.  If it is VOIDmode, they cannot
4535    both be constants.
4536
4537    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4538    should be stored there.  MODE is the mode to use should they be constants.
4539    If it is VOIDmode, they cannot both be constants.
4540
4541    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4542    is not supported.  */
4543
4544 rtx
4545 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4546                        enum machine_mode cmode, rtx op2, rtx op3,
4547                        enum machine_mode mode, int unsignedp)
4548 {
4549   rtx tem, comparison;
4550   rtx_insn *last;
4551   enum insn_code icode;
4552   enum rtx_code reversed;
4553
4554   /* If one operand is constant, make it the second one.  Only do this
4555      if the other operand is not constant as well.  */
4556
4557   if (swap_commutative_operands_p (op0, op1))
4558     {
4559       tem = op0;
4560       op0 = op1;
4561       op1 = tem;
4562       code = swap_condition (code);
4563     }
4564
4565   /* get_condition will prefer to generate LT and GT even if the old
4566      comparison was against zero, so undo that canonicalization here since
4567      comparisons against zero are cheaper.  */
4568   if (code == LT && op1 == const1_rtx)
4569     code = LE, op1 = const0_rtx;
4570   else if (code == GT && op1 == constm1_rtx)
4571     code = GE, op1 = const0_rtx;
4572
4573   if (cmode == VOIDmode)
4574     cmode = GET_MODE (op0);
4575
4576   if (swap_commutative_operands_p (op2, op3)
4577       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4578           != UNKNOWN))
4579     {
4580       tem = op2;
4581       op2 = op3;
4582       op3 = tem;
4583       code = reversed;
4584     }
4585
4586   if (mode == VOIDmode)
4587     mode = GET_MODE (op2);
4588
4589   icode = direct_optab_handler (movcc_optab, mode);
4590
4591   if (icode == CODE_FOR_nothing)
4592     return 0;
4593
4594   if (!target)
4595     target = gen_reg_rtx (mode);
4596
4597   code = unsignedp ? unsigned_condition (code) : code;
4598   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4599
4600   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4601      return NULL and let the caller figure out how best to deal with this
4602      situation.  */
4603   if (!COMPARISON_P (comparison))
4604     return NULL_RTX;
4605
4606   saved_pending_stack_adjust save;
4607   save_pending_stack_adjust (&save);
4608   last = get_last_insn ();
4609   do_pending_stack_adjust ();
4610   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4611                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4612                     &comparison, &cmode);
4613   if (comparison)
4614     {
4615       struct expand_operand ops[4];
4616
4617       create_output_operand (&ops[0], target, mode);
4618       create_fixed_operand (&ops[1], comparison);
4619       create_input_operand (&ops[2], op2, mode);
4620       create_input_operand (&ops[3], op3, mode);
4621       if (maybe_expand_insn (icode, 4, ops))
4622         {
4623           if (ops[0].value != target)
4624             convert_move (target, ops[0].value, false);
4625           return target;
4626         }
4627     }
4628   delete_insns_since (last);
4629   restore_pending_stack_adjust (&save);
4630   return NULL_RTX;
4631 }
4632
4633 /* Return nonzero if a conditional move of mode MODE is supported.
4634
4635    This function is for combine so it can tell whether an insn that looks
4636    like a conditional move is actually supported by the hardware.  If we
4637    guess wrong we lose a bit on optimization, but that's it.  */
4638 /* ??? sparc64 supports conditionally moving integers values based on fp
4639    comparisons, and vice versa.  How do we handle them?  */
4640
4641 int
4642 can_conditionally_move_p (enum machine_mode mode)
4643 {
4644   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4645     return 1;
4646
4647   return 0;
4648 }
4649
4650 #endif /* HAVE_conditional_move */
4651
4652 /* Emit a conditional addition instruction if the machine supports one for that
4653    condition and machine mode.
4654
4655    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4656    the mode to use should they be constants.  If it is VOIDmode, they cannot
4657    both be constants.
4658
4659    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4660    should be stored there.  MODE is the mode to use should they be constants.
4661    If it is VOIDmode, they cannot both be constants.
4662
4663    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4664    is not supported.  */
4665
4666 rtx
4667 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4668                       enum machine_mode cmode, rtx op2, rtx op3,
4669                       enum machine_mode mode, int unsignedp)
4670 {
4671   rtx tem, comparison;
4672   rtx_insn *last;
4673   enum insn_code icode;
4674
4675   /* If one operand is constant, make it the second one.  Only do this
4676      if the other operand is not constant as well.  */
4677
4678   if (swap_commutative_operands_p (op0, op1))
4679     {
4680       tem = op0;
4681       op0 = op1;
4682       op1 = tem;
4683       code = swap_condition (code);
4684     }
4685
4686   /* get_condition will prefer to generate LT and GT even if the old
4687      comparison was against zero, so undo that canonicalization here since
4688      comparisons against zero are cheaper.  */
4689   if (code == LT && op1 == const1_rtx)
4690     code = LE, op1 = const0_rtx;
4691   else if (code == GT && op1 == constm1_rtx)
4692     code = GE, op1 = const0_rtx;
4693
4694   if (cmode == VOIDmode)
4695     cmode = GET_MODE (op0);
4696
4697   if (mode == VOIDmode)
4698     mode = GET_MODE (op2);
4699
4700   icode = optab_handler (addcc_optab, mode);
4701
4702   if (icode == CODE_FOR_nothing)
4703     return 0;
4704
4705   if (!target)
4706     target = gen_reg_rtx (mode);
4707
4708   code = unsignedp ? unsigned_condition (code) : code;
4709   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4710
4711   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4712      return NULL and let the caller figure out how best to deal with this
4713      situation.  */
4714   if (!COMPARISON_P (comparison))
4715     return NULL_RTX;
4716
4717   do_pending_stack_adjust ();
4718   last = get_last_insn ();
4719   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4720                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4721                     &comparison, &cmode);
4722   if (comparison)
4723     {
4724       struct expand_operand ops[4];
4725
4726       create_output_operand (&ops[0], target, mode);
4727       create_fixed_operand (&ops[1], comparison);
4728       create_input_operand (&ops[2], op2, mode);
4729       create_input_operand (&ops[3], op3, mode);
4730       if (maybe_expand_insn (icode, 4, ops))
4731         {
4732           if (ops[0].value != target)
4733             convert_move (target, ops[0].value, false);
4734           return target;
4735         }
4736     }
4737   delete_insns_since (last);
4738   return NULL_RTX;
4739 }
4740 \f
4741 /* These functions attempt to generate an insn body, rather than
4742    emitting the insn, but if the gen function already emits them, we
4743    make no attempt to turn them back into naked patterns.  */
4744
4745 /* Generate and return an insn body to add Y to X.  */
4746
4747 rtx
4748 gen_add2_insn (rtx x, rtx y)
4749 {
4750   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4751
4752   gcc_assert (insn_operand_matches (icode, 0, x));
4753   gcc_assert (insn_operand_matches (icode, 1, x));
4754   gcc_assert (insn_operand_matches (icode, 2, y));
4755
4756   return GEN_FCN (icode) (x, x, y);
4757 }
4758
4759 /* Generate and return an insn body to add r1 and c,
4760    storing the result in r0.  */
4761
4762 rtx
4763 gen_add3_insn (rtx r0, rtx r1, rtx c)
4764 {
4765   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4766
4767   if (icode == CODE_FOR_nothing
4768       || !insn_operand_matches (icode, 0, r0)
4769       || !insn_operand_matches (icode, 1, r1)
4770       || !insn_operand_matches (icode, 2, c))
4771     return NULL_RTX;
4772
4773   return GEN_FCN (icode) (r0, r1, c);
4774 }
4775
4776 int
4777 have_add2_insn (rtx x, rtx y)
4778 {
4779   enum insn_code icode;
4780
4781   gcc_assert (GET_MODE (x) != VOIDmode);
4782
4783   icode = optab_handler (add_optab, GET_MODE (x));
4784
4785   if (icode == CODE_FOR_nothing)
4786     return 0;
4787
4788   if (!insn_operand_matches (icode, 0, x)
4789       || !insn_operand_matches (icode, 1, x)
4790       || !insn_operand_matches (icode, 2, y))
4791     return 0;
4792
4793   return 1;
4794 }
4795
4796 /* Generate and return an insn body to add Y to X.  */
4797
4798 rtx
4799 gen_addptr3_insn (rtx x, rtx y, rtx z)
4800 {
4801   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4802
4803   gcc_assert (insn_operand_matches (icode, 0, x));
4804   gcc_assert (insn_operand_matches (icode, 1, y));
4805   gcc_assert (insn_operand_matches (icode, 2, z));
4806
4807   return GEN_FCN (icode) (x, y, z);
4808 }
4809
4810 /* Return true if the target implements an addptr pattern and X, Y,
4811    and Z are valid for the pattern predicates.  */
4812
4813 int
4814 have_addptr3_insn (rtx x, rtx y, rtx z)
4815 {
4816   enum insn_code icode;
4817
4818   gcc_assert (GET_MODE (x) != VOIDmode);
4819
4820   icode = optab_handler (addptr3_optab, GET_MODE (x));
4821
4822   if (icode == CODE_FOR_nothing)
4823     return 0;
4824
4825   if (!insn_operand_matches (icode, 0, x)
4826       || !insn_operand_matches (icode, 1, y)
4827       || !insn_operand_matches (icode, 2, z))
4828     return 0;
4829
4830   return 1;
4831 }
4832
4833 /* Generate and return an insn body to subtract Y from X.  */
4834
4835 rtx
4836 gen_sub2_insn (rtx x, rtx y)
4837 {
4838   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4839
4840   gcc_assert (insn_operand_matches (icode, 0, x));
4841   gcc_assert (insn_operand_matches (icode, 1, x));
4842   gcc_assert (insn_operand_matches (icode, 2, y));
4843
4844   return GEN_FCN (icode) (x, x, y);
4845 }
4846
4847 /* Generate and return an insn body to subtract r1 and c,
4848    storing the result in r0.  */
4849
4850 rtx
4851 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4852 {
4853   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4854
4855   if (icode == CODE_FOR_nothing
4856       || !insn_operand_matches (icode, 0, r0)
4857       || !insn_operand_matches (icode, 1, r1)
4858       || !insn_operand_matches (icode, 2, c))
4859     return NULL_RTX;
4860
4861   return GEN_FCN (icode) (r0, r1, c);
4862 }
4863
4864 int
4865 have_sub2_insn (rtx x, rtx y)
4866 {
4867   enum insn_code icode;
4868
4869   gcc_assert (GET_MODE (x) != VOIDmode);
4870
4871   icode = optab_handler (sub_optab, GET_MODE (x));
4872
4873   if (icode == CODE_FOR_nothing)
4874     return 0;
4875
4876   if (!insn_operand_matches (icode, 0, x)
4877       || !insn_operand_matches (icode, 1, x)
4878       || !insn_operand_matches (icode, 2, y))
4879     return 0;
4880
4881   return 1;
4882 }
4883
4884 /* Generate the body of an instruction to copy Y into X.
4885    It may be a list of insns, if one insn isn't enough.  */
4886
4887 rtx
4888 gen_move_insn (rtx x, rtx y)
4889 {
4890   rtx_insn *seq;
4891
4892   start_sequence ();
4893   emit_move_insn_1 (x, y);
4894   seq = get_insns ();
4895   end_sequence ();
4896   return seq;
4897 }
4898 \f
4899 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4900    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4901    no such operation exists, CODE_FOR_nothing will be returned.  */
4902
4903 enum insn_code
4904 can_extend_p (enum machine_mode to_mode, enum machine_mode from_mode,
4905               int unsignedp)
4906 {
4907   convert_optab tab;
4908 #ifdef HAVE_ptr_extend
4909   if (unsignedp < 0)
4910     return CODE_FOR_ptr_extend;
4911 #endif
4912
4913   tab = unsignedp ? zext_optab : sext_optab;
4914   return convert_optab_handler (tab, to_mode, from_mode);
4915 }
4916
4917 /* Generate the body of an insn to extend Y (with mode MFROM)
4918    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4919
4920 rtx
4921 gen_extend_insn (rtx x, rtx y, enum machine_mode mto,
4922                  enum machine_mode mfrom, int unsignedp)
4923 {
4924   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4925   return GEN_FCN (icode) (x, y);
4926 }
4927 \f
4928 /* can_fix_p and can_float_p say whether the target machine
4929    can directly convert a given fixed point type to
4930    a given floating point type, or vice versa.
4931    The returned value is the CODE_FOR_... value to use,
4932    or CODE_FOR_nothing if these modes cannot be directly converted.
4933
4934    *TRUNCP_PTR is set to 1 if it is necessary to output
4935    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4936
4937 static enum insn_code
4938 can_fix_p (enum machine_mode fixmode, enum machine_mode fltmode,
4939            int unsignedp, int *truncp_ptr)
4940 {
4941   convert_optab tab;
4942   enum insn_code icode;
4943
4944   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4945   icode = convert_optab_handler (tab, fixmode, fltmode);
4946   if (icode != CODE_FOR_nothing)
4947     {
4948       *truncp_ptr = 0;
4949       return icode;
4950     }
4951
4952   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4953      for this to work. We need to rework the fix* and ftrunc* patterns
4954      and documentation.  */
4955   tab = unsignedp ? ufix_optab : sfix_optab;
4956   icode = convert_optab_handler (tab, fixmode, fltmode);
4957   if (icode != CODE_FOR_nothing
4958       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4959     {
4960       *truncp_ptr = 1;
4961       return icode;
4962     }
4963
4964   *truncp_ptr = 0;
4965   return CODE_FOR_nothing;
4966 }
4967
4968 enum insn_code
4969 can_float_p (enum machine_mode fltmode, enum machine_mode fixmode,
4970              int unsignedp)
4971 {
4972   convert_optab tab;
4973
4974   tab = unsignedp ? ufloat_optab : sfloat_optab;
4975   return convert_optab_handler (tab, fltmode, fixmode);
4976 }
4977
4978 /* Function supportable_convert_operation
4979
4980    Check whether an operation represented by the code CODE is a
4981    convert operation that is supported by the target platform in
4982    vector form (i.e., when operating on arguments of type VECTYPE_IN
4983    producing a result of type VECTYPE_OUT).
4984
4985    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4986    This function checks if these operations are supported
4987    by the target platform either directly (via vector tree-codes), or via
4988    target builtins.
4989
4990    Output:
4991    - CODE1 is code of vector operation to be used when
4992    vectorizing the operation, if available.
4993    - DECL is decl of target builtin functions to be used
4994    when vectorizing the operation, if available.  In this case,
4995    CODE1 is CALL_EXPR.  */
4996
4997 bool
4998 supportable_convert_operation (enum tree_code code,
4999                                     tree vectype_out, tree vectype_in,
5000                                     tree *decl, enum tree_code *code1)
5001 {
5002   enum machine_mode m1,m2;
5003   int truncp;
5004
5005   m1 = TYPE_MODE (vectype_out);
5006   m2 = TYPE_MODE (vectype_in);
5007
5008   /* First check if we can done conversion directly.  */
5009   if ((code == FIX_TRUNC_EXPR
5010        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
5011           != CODE_FOR_nothing)
5012       || (code == FLOAT_EXPR
5013           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
5014              != CODE_FOR_nothing))
5015     {
5016       *code1 = code;
5017       return true;
5018     }
5019
5020   /* Now check for builtin.  */
5021   if (targetm.vectorize.builtin_conversion
5022       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
5023     {
5024       *code1 = CALL_EXPR;
5025       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
5026       return true;
5027     }
5028   return false;
5029 }
5030
5031 \f
/* Generate code to convert FROM to floating point
   and store in TO.  FROM must be fixed point and not VOIDmode.
   UNSIGNEDP nonzero means regard FROM as unsigned.

   Three strategies are tried in order:
   1. A direct conversion insn, searching the mode of TO and wider
      floating modes against the mode of FROM and wider integer modes.
   2. For an unsigned FROM, if a signed conversion insn was seen during
      that search: convert as signed and correct the result when the
      sign bit of FROM is set.
   3. A library call.  */

void
expand_float (rtx to, rtx from, int unsignedp)
{
  enum insn_code icode;
  /* Where the result is computed; replaced by a fresh pseudo when TO
     itself cannot be used, and copied into TO at the end.  */
  rtx target = to;
  enum machine_mode fmode, imode;
  /* Set when some signed conversion insn exists although the unsigned
     one does not; enables the fix-up strategy below.  */
  bool can_do_signed = false;

  /* Crash now, because we won't be able to decide which mode to use.  */
  gcc_assert (GET_MODE (from) != VOIDmode);

  /* Look for an insn to do the conversion.  Do it in the specified
     modes if possible; otherwise convert either input, output or both to
     wider mode.  If the integer mode is wider than the mode of FROM,
     we can do the conversion signed even if the input is unsigned.  */

  for (fmode = GET_MODE (to); fmode != VOIDmode;
       fmode = GET_MODE_WIDER_MODE (fmode))
    for (imode = GET_MODE (from); imode != VOIDmode;
         imode = GET_MODE_WIDER_MODE (imode))
      {
        int doing_unsigned = unsignedp;

        /* Skip a wider floating mode whose significand has fewer bits
           than FROM has precision (presumably because converting through
           it and then narrowing to TO would round twice).  */
        if (fmode != GET_MODE (to)
            && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
          continue;

        icode = can_float_p (fmode, imode, unsignedp);
        if (icode == CODE_FOR_nothing && unsignedp)
          {
            /* No unsigned insn for this pair of modes; see whether a
               signed one exists.  It is only used directly when IMODE is
               wider than the mode of FROM.  */
            enum insn_code scode = can_float_p (fmode, imode, 0);
            if (scode != CODE_FOR_nothing)
              can_do_signed = true;
            if (imode != GET_MODE (from))
              icode = scode, doing_unsigned = 0;
          }

        if (icode != CODE_FOR_nothing)
          {
            if (imode != GET_MODE (from))
              from = convert_to_mode (imode, from, unsignedp);

            if (fmode != GET_MODE (to))
              target = gen_reg_rtx (fmode);

            emit_unop_insn (icode, target, from,
                            doing_unsigned ? UNSIGNED_FLOAT : FLOAT);

            if (target != to)
              convert_move (to, target, 0);
            return;
          }
      }

  /* Unsigned integer, and no way to convert directly.  Convert as signed,
     then conditionally adjust the result (only when FROM, read as a
     signed value, is negative).  */
  if (unsignedp && can_do_signed)
    {
      /* LABEL marks the join point after the correction code.  */
      rtx_code_label *label = gen_label_rtx ();
      rtx temp;
      REAL_VALUE_TYPE offset;

      /* Look for a usable floating mode FMODE wider than the source and at
         least as wide as the target.  Using FMODE will avoid rounding woes
         with unsigned values greater than the signed maximum value.  */

      for (fmode = GET_MODE (to);  fmode != VOIDmode;
           fmode = GET_MODE_WIDER_MODE (fmode))
        if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
            && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
          break;

      if (fmode == VOIDmode)
        {
          /* There is no such mode.  Pretend the target is wide enough.  */
          fmode = GET_MODE (to);

          /* Avoid double-rounding when TO is narrower than FROM.  */
          if ((significand_size (fmode) + 1)
              < GET_MODE_PRECISION (GET_MODE (from)))
            {
              rtx temp1;
              rtx_code_label *neglabel = gen_label_rtx ();

              /* Don't use TARGET if it isn't a register, is a hard register,
                 or is the wrong mode.  */
              if (!REG_P (target)
                  || REGNO (target) < FIRST_PSEUDO_REGISTER
                  || GET_MODE (target) != fmode)
                target = gen_reg_rtx (fmode);

              imode = GET_MODE (from);
              do_pending_stack_adjust ();

              /* Test whether the sign bit is set.  */
              emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
                                       0, neglabel);

              /* The sign bit is not set.  Convert as signed.  */
              expand_float (target, from, 0);
              emit_jump_insn (gen_jump (label));
              emit_barrier ();

              /* The sign bit is set.
                 Convert to a usable (positive signed) value by shifting right
                 one bit, while remembering if a nonzero bit was shifted
                 out; i.e., compute  (from & 1) | (from >> 1).  */

              emit_label (neglabel);
              temp = expand_binop (imode, and_optab, from, const1_rtx,
                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
              temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
              temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
                                   OPTAB_LIB_WIDEN);
              expand_float (target, temp, 0);

              /* Multiply by 2 to undo the shift above.  */
              temp = expand_binop (fmode, add_optab, target, target,
                                   target, 0, OPTAB_LIB_WIDEN);
              if (temp != target)
                emit_move_insn (target, temp);

              do_pending_stack_adjust ();
              emit_label (label);
              goto done;
            }
        }

      /* If we are about to do some arithmetic to correct for an
         unsigned operand, do it in a pseudo-register.  */

      if (GET_MODE (to) != fmode
          || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
        target = gen_reg_rtx (fmode);

      /* Convert as signed integer to floating.  */
      expand_float (target, from, 0);

      /* If FROM is negative (and therefore TO is negative),
         correct its value by 2**bitwidth.  The jump below skips the
         correction when FROM is nonnegative.  */

      do_pending_stack_adjust ();
      emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
                               0, label);


      /* OFFSET is 2**precision of FROM's mode, expressed in FMODE.  */
      real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
      temp = expand_binop (fmode, add_optab, target,
                           CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
                           target, 0, OPTAB_LIB_WIDEN);
      if (temp != target)
        emit_move_insn (target, temp);

      do_pending_stack_adjust ();
      emit_label (label);
      goto done;
    }

  /* No hardware instruction available; call a library routine.  */
    {
      rtx libfunc;
      rtx_insn *insns;
      rtx value;
      convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;

      /* Widen a source narrower than SImode to SImode before looking up
         the library function.  */
      if (GET_MODE_SIZE (GET_MODE (from)) < GET_MODE_SIZE (SImode))
        from = convert_to_mode (SImode, from, unsignedp);

      libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
      gcc_assert (libfunc);

      /* Collect the call in its own sequence so that it can be emitted
         as one libcall block.  */
      start_sequence ();

      value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
                                       GET_MODE (to), 1, from,
                                       GET_MODE (from));
      insns = get_insns ();
      end_sequence ();

      emit_libcall_block (insns, target, value,
                          gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
                                         GET_MODE (to), from));
    }

 done:

  /* Copy result to requested destination
     if we have been computing in a temp location.  */

  if (target != to)
    {
      if (GET_MODE (target) == GET_MODE (to))
        emit_move_insn (to, target);
      else
        convert_move (to, target, 0);
    }
}
5235 \f
/* Generate code to convert FROM to fixed point and store in TO.  FROM
   must be floating point.  UNSIGNEDP nonzero requests an unsigned
   result.

   Three strategies are tried in order:
   1. A conversion insn found by searching the mode of FROM and wider
      floating modes against the mode of TO and wider integer modes.
   2. For an unsigned conversion whose result fits in a HOST_WIDE_INT:
      a signed conversion wrapped in a compare/subtract/xor sequence.
   3. A library call, going through SImode when TO is narrower.  */

void
expand_fix (rtx to, rtx from, int unsignedp)
{
  enum insn_code icode;
  /* Where the result is computed; copied into TO at the end when it is
     a different rtx.  */
  rtx target = to;
  enum machine_mode fmode, imode;
  /* Filled in by can_fix_p; nonzero means FROM must first go through
     ftrunc_optab before the conversion insn is used.  */
  int must_trunc = 0;

  /* We first try to find a pair of modes, one real and one integer, at
     least as wide as FROM and TO, respectively, in which we can open-code
     this conversion.  If the integer mode is wider than the mode of TO,
     we can do the conversion either signed or unsigned.  */

  for (fmode = GET_MODE (from); fmode != VOIDmode;
       fmode = GET_MODE_WIDER_MODE (fmode))
    for (imode = GET_MODE (to); imode != VOIDmode;
         imode = GET_MODE_WIDER_MODE (imode))
      {
        int doing_unsigned = unsignedp;

        icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
        /* With a wider integer mode, fall back to the signed insn for an
           unsigned request.  */
        if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
          icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;

        if (icode != CODE_FOR_nothing)
          {
            /* Remember where we are so that everything emitted for this
               attempt can be removed if the insn cannot be generated.  */
            rtx_insn *last = get_last_insn ();
            if (fmode != GET_MODE (from))
              from = convert_to_mode (fmode, from, 0);

            if (must_trunc)
              {
                rtx temp = gen_reg_rtx (GET_MODE (from));
                from = expand_unop (GET_MODE (from), ftrunc_optab, from,
                                    temp, 0);
              }

            if (imode != GET_MODE (to))
              target = gen_reg_rtx (imode);

            if (maybe_emit_unop_insn (icode, target, from,
                                      doing_unsigned ? UNSIGNED_FIX : FIX))
              {
                if (target != to)
                  convert_move (to, target, unsignedp);
                return;
              }
            delete_insns_since (last);
          }
      }

  /* For an unsigned conversion, there is one more way to do it.
     If we have a signed conversion, we generate code that compares
     the real value to the largest representable positive number.  If it
     is smaller, the conversion is done normally.  Otherwise, subtract
     one plus the highest signed number, convert, and add it back.

     We only need to check all real modes, since we know we didn't find
     anything with a wider integer mode.

     This code used to extend FP value into mode wider than the destination.
     This is needed for decimal float modes which cannot accurately
     represent one plus the highest signed number of the same size, but
     not for binary modes.  Consider, for instance conversion from SFmode
     into DImode.

     The hot path through the code is dealing with inputs smaller than 2^63
     and doing just the conversion, so there are no bits to lose.

     In the other path we know the value is positive in the range 2^63..2^64-1
     inclusive.  (as for other input overflow happens and result is undefined)
     So we know that the most important bit set in mantissa corresponds to
     2^63.  The subtraction of 2^63 should not generate any rounding as it
     simply clears out that bit.  The rest is trivial.  */

  if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
    for (fmode = GET_MODE (from); fmode != VOIDmode;
         fmode = GET_MODE_WIDER_MODE (fmode))
      if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
          && (!DECIMAL_FLOAT_MODE_P (fmode)
              || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
        {
          int bitsize;
          REAL_VALUE_TYPE offset;
          rtx limit;
          rtx_code_label *lab1, *lab2;
          rtx_insn *insn;

          /* LIMIT is 2**(N-1) in FMODE, where N is the precision of the
             mode of TO.  */
          bitsize = GET_MODE_PRECISION (GET_MODE (to));
          real_2expN (&offset, bitsize - 1, fmode);
          limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
          lab1 = gen_label_rtx ();
          lab2 = gen_label_rtx ();

          if (fmode != GET_MODE (from))
            from = convert_to_mode (fmode, from, 0);

          /* See if we need to do the subtraction.  */
          do_pending_stack_adjust ();
          emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
                                   0, lab1);

          /* If not, do the signed "fix" and branch around fixup code.  */
          expand_fix (to, from, 0);
          emit_jump_insn (gen_jump (lab2));
          emit_barrier ();

          /* Otherwise, subtract 2**(N-1), convert to signed number,
             then add 2**(N-1).  Do the addition using XOR since this
             will often generate better code.  */
          emit_label (lab1);
          target = expand_binop (GET_MODE (from), sub_optab, from, limit,
                                 NULL_RTX, 0, OPTAB_LIB_WIDEN);
          expand_fix (to, target, 0);
          target = expand_binop (GET_MODE (to), xor_optab, to,
                                 gen_int_mode
                                 ((HOST_WIDE_INT) 1 << (bitsize - 1),
                                  GET_MODE (to)),
                                 to, 1, OPTAB_LIB_WIDEN);

          if (target != to)
            emit_move_insn (to, target);

          emit_label (lab2);

          if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
            {
              /* Make a place for a REG_NOTE and add it.  The self-move of
                 TO exists only to carry the REG_EQUAL note describing the
                 whole unsigned conversion.  */
              insn = emit_move_insn (to, to);
              set_dst_reg_note (insn, REG_EQUAL,
                                gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
                                               copy_rtx (from)),
                                to);
            }

          return;
        }

  /* We can't do it with an insn, so use a library call.  But first ensure
     that the mode of TO is at least as wide as SImode, since those are the
     only library calls we know about.  */

  if (GET_MODE_SIZE (GET_MODE (to)) < GET_MODE_SIZE (SImode))
    {
      /* Convert into an SImode pseudo by recursion; the final copy below
         narrows it into TO.  */
      target = gen_reg_rtx (SImode);

      expand_fix (target, from, unsignedp);
    }
  else
    {
      rtx_insn *insns;
      rtx value;
      rtx libfunc;

      convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
      libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
      gcc_assert (libfunc);

      /* Collect the call in its own sequence so that it can be emitted
         as one libcall block.  */
      start_sequence ();

      value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
                                       GET_MODE (to), 1, from,
                                       GET_MODE (from));
      insns = get_insns ();
      end_sequence ();

      emit_libcall_block (insns, target, value,
                          gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
                                         GET_MODE (to), from));
    }

  /* Copy the result into TO if it was computed elsewhere.  */
  if (target != to)
    {
      if (GET_MODE (to) == GET_MODE (target))
        emit_move_insn (to, target);
      else
        convert_move (to, target, 0);
    }
}
5418
5419 /* Generate code to convert FROM or TO a fixed-point.
5420    If UINTP is true, either TO or FROM is an unsigned integer.
5421    If SATP is true, we need to saturate the result.  */
5422
5423 void
5424 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5425 {
5426   enum machine_mode to_mode = GET_MODE (to);
5427   enum machine_mode from_mode = GET_MODE (from);
5428   convert_optab tab;
5429   enum rtx_code this_code;
5430   enum insn_code code;
5431   rtx_insn *insns;
5432   rtx value;
5433   rtx libfunc;
5434
5435   if (to_mode == from_mode)
5436     {
5437       emit_move_insn (to, from);
5438       return;
5439     }
5440
5441   if (uintp)
5442     {
5443       tab = satp ? satfractuns_optab : fractuns_optab;
5444       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5445     }
5446   else
5447     {
5448       tab = satp ? satfract_optab : fract_optab;
5449       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5450     }
5451   code = convert_optab_handler (tab, to_mode, from_mode);
5452   if (code != CODE_FOR_nothing)
5453     {
5454       emit_unop_insn (code, to, from, this_code);
5455       return;
5456     }
5457
5458   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5459   gcc_assert (libfunc);
5460
5461   start_sequence ();
5462   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5463                                    1, from, from_mode);
5464   insns = get_insns ();
5465   end_sequence ();
5466
5467   emit_libcall_block (insns, to, value,
5468                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5469 }
5470
5471 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5472    must be floating point, TO must be signed.  Use the conversion optab
5473    TAB to do the conversion.  */
5474
5475 bool
5476 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5477 {
5478   enum insn_code icode;
5479   rtx target = to;
5480   enum machine_mode fmode, imode;
5481
5482   /* We first try to find a pair of modes, one real and one integer, at
5483      least as wide as FROM and TO, respectively, in which we can open-code
5484      this conversion.  If the integer mode is wider than the mode of TO,
5485      we can do the conversion either signed or unsigned.  */
5486
5487   for (fmode = GET_MODE (from); fmode != VOIDmode;
5488        fmode = GET_MODE_WIDER_MODE (fmode))
5489     for (imode = GET_MODE (to); imode != VOIDmode;
5490          imode = GET_MODE_WIDER_MODE (imode))
5491       {
5492         icode = convert_optab_handler (tab, imode, fmode);
5493         if (icode != CODE_FOR_nothing)
5494           {
5495             rtx_insn *last = get_last_insn ();
5496             if (fmode != GET_MODE (from))
5497               from = convert_to_mode (fmode, from, 0);
5498
5499             if (imode != GET_MODE (to))
5500               target = gen_reg_rtx (imode);
5501
5502             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5503               {
5504                 delete_insns_since (last);
5505                 continue;
5506               }
5507             if (target != to)
5508               convert_move (to, target, 0);
5509             return true;
5510           }
5511       }
5512
5513   return false;
5514 }
5515 \f
5516 /* Report whether we have an instruction to perform the operation
5517    specified by CODE on operands of mode MODE.  */
5518 int
5519 have_insn_for (enum rtx_code code, enum machine_mode mode)
5520 {
5521   return (code_to_optab (code)
5522           && (optab_handler (code_to_optab (code), mode)
5523               != CODE_FOR_nothing));
5524 }
5525
5526 /* Initialize the libfunc fields of an entire group of entries in some
5527    optab.  Each entry is set equal to a string consisting of a leading
5528    pair of underscores followed by a generic operation name followed by
5529    a mode name (downshifted to lowercase) followed by a single character
5530    representing the number of operands for the given operation (which is
5531    usually one of the characters '2', '3', or '4').
5532
5533    OPTABLE is the table in which libfunc fields are to be initialized.
5534    OPNAME is the generic (string) name of the operation.
5535    SUFFIX is the character which specifies the number of operands for
5536      the given generic operation.
5537    MODE is the mode to generate for.
5538 */
5539
5540 static void
5541 gen_libfunc (optab optable, const char *opname, int suffix,
5542              enum machine_mode mode)
5543 {
5544   unsigned opname_len = strlen (opname);
5545   const char *mname = GET_MODE_NAME (mode);
5546   unsigned mname_len = strlen (mname);
5547   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5548   int len = prefix_len + opname_len + mname_len + 1 + 1;
5549   char *libfunc_name = XALLOCAVEC (char, len);
5550   char *p;
5551   const char *q;
5552
5553   p = libfunc_name;
5554   *p++ = '_';
5555   *p++ = '_';
5556   if (targetm.libfunc_gnu_prefix)
5557     {
5558       *p++ = 'g';
5559       *p++ = 'n';
5560       *p++ = 'u';
5561       *p++ = '_';
5562     }
5563   for (q = opname; *q; )
5564     *p++ = *q++;
5565   for (q = mname; *q; q++)
5566     *p++ = TOLOWER (*q);
5567   *p++ = suffix;
5568   *p = '\0';
5569
5570   set_optab_libfunc (optable, mode,
5571                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5572 }
5573
5574 /* Like gen_libfunc, but verify that integer operation is involved.  */
5575
5576 void
5577 gen_int_libfunc (optab optable, const char *opname, char suffix,
5578                  enum machine_mode mode)
5579 {
5580   int maxsize = 2 * BITS_PER_WORD;
5581   int minsize = BITS_PER_WORD;
5582
5583   if (GET_MODE_CLASS (mode) != MODE_INT)
5584     return;
5585   if (maxsize < LONG_LONG_TYPE_SIZE)
5586     maxsize = LONG_LONG_TYPE_SIZE;
5587   if (minsize > INT_TYPE_SIZE
5588       && (trapv_binoptab_p (optable)
5589           || trapv_unoptab_p (optable)))
5590     minsize = INT_TYPE_SIZE;
5591   if (GET_MODE_BITSIZE (mode) < minsize
5592       || GET_MODE_BITSIZE (mode) > maxsize)
5593     return;
5594   gen_libfunc (optable, opname, suffix, mode);
5595 }
5596
5597 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5598
5599 void
5600 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5601                 enum machine_mode mode)
5602 {
5603   char *dec_opname;
5604
5605   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5606     gen_libfunc (optable, opname, suffix, mode);
5607   if (DECIMAL_FLOAT_MODE_P (mode))
5608     {
5609       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5610       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5611          depending on the low level floating format used.  */
5612       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5613       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5614       gen_libfunc (optable, dec_opname, suffix, mode);
5615     }
5616 }
5617
5618 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5619
5620 void
5621 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5622                    enum machine_mode mode)
5623 {
5624   if (!ALL_FIXED_POINT_MODE_P (mode))
5625     return;
5626   gen_libfunc (optable, opname, suffix, mode);
5627 }
5628
5629 /* Like gen_libfunc, but verify that signed fixed-point operation is
5630    involved.  */
5631
5632 void
5633 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5634                           enum machine_mode mode)
5635 {
5636   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5637     return;
5638   gen_libfunc (optable, opname, suffix, mode);
5639 }
5640
5641 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5642    involved.  */
5643
5644 void
5645 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5646                             enum machine_mode mode)
5647 {
5648   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5649     return;
5650   gen_libfunc (optable, opname, suffix, mode);
5651 }
5652
5653 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5654
5655 void
5656 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5657                     enum machine_mode mode)
5658 {
5659   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5660     gen_fp_libfunc (optable, name, suffix, mode);
5661   if (INTEGRAL_MODE_P (mode))
5662     gen_int_libfunc (optable, name, suffix, mode);
5663 }
5664
5665 /* Like gen_libfunc, but verify that FP or INT operation is involved
5666    and add 'v' suffix for integer operation.  */
5667
5668 void
5669 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5670                      enum machine_mode mode)
5671 {
5672   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5673     gen_fp_libfunc (optable, name, suffix, mode);
5674   if (GET_MODE_CLASS (mode) == MODE_INT)
5675     {
5676       int len = strlen (name);
5677       char *v_name = XALLOCAVEC (char, len + 2);
5678       strcpy (v_name, name);
5679       v_name[len] = 'v';
5680       v_name[len + 1] = 0;
5681       gen_int_libfunc (optable, v_name, suffix, mode);
5682     }
5683 }
5684
5685 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5686    involved.  */
5687
5688 void
5689 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5690                           enum machine_mode mode)
5691 {
5692   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5693     gen_fp_libfunc (optable, name, suffix, mode);
5694   if (INTEGRAL_MODE_P (mode))
5695     gen_int_libfunc (optable, name, suffix, mode);
5696   if (ALL_FIXED_POINT_MODE_P (mode))
5697     gen_fixed_libfunc (optable, name, suffix, mode);
5698 }
5699
5700 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5701    involved.  */
5702
5703 void
5704 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5705                                  enum machine_mode mode)
5706 {
5707   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5708     gen_fp_libfunc (optable, name, suffix, mode);
5709   if (INTEGRAL_MODE_P (mode))
5710     gen_int_libfunc (optable, name, suffix, mode);
5711   if (SIGNED_FIXED_POINT_MODE_P (mode))
5712     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5713 }
5714
5715 /* Like gen_libfunc, but verify that INT or FIXED operation is
5716    involved.  */
5717
5718 void
5719 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5720                        enum machine_mode mode)
5721 {
5722   if (INTEGRAL_MODE_P (mode))
5723     gen_int_libfunc (optable, name, suffix, mode);
5724   if (ALL_FIXED_POINT_MODE_P (mode))
5725     gen_fixed_libfunc (optable, name, suffix, mode);
5726 }
5727
5728 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5729    involved.  */
5730
5731 void
5732 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5733                               enum machine_mode mode)
5734 {
5735   if (INTEGRAL_MODE_P (mode))
5736     gen_int_libfunc (optable, name, suffix, mode);
5737   if (SIGNED_FIXED_POINT_MODE_P (mode))
5738     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5739 }
5740
5741 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5742    involved.  */
5743
5744 void
5745 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5746                                 enum machine_mode mode)
5747 {
5748   if (INTEGRAL_MODE_P (mode))
5749     gen_int_libfunc (optable, name, suffix, mode);
5750   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5751     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5752 }
5753
5754 /* Initialize the libfunc fields of an entire group of entries of an
5755    inter-mode-class conversion optab.  The string formation rules are
5756    similar to the ones for init_libfuncs, above, but instead of having
5757    a mode name and an operand count these functions have two mode names
5758    and no operand count.  */
5759
5760 void
5761 gen_interclass_conv_libfunc (convert_optab tab,
5762                              const char *opname,
5763                              enum machine_mode tmode,
5764                              enum machine_mode fmode)
5765 {
5766   size_t opname_len = strlen (opname);
5767   size_t mname_len = 0;
5768
5769   const char *fname, *tname;
5770   const char *q;
5771   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5772   char *libfunc_name, *suffix;
5773   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5774   char *p;
5775
5776   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5777      depends on which underlying decimal floating point format is used.  */
5778   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5779
5780   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5781
5782   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5783   nondec_name[0] = '_';
5784   nondec_name[1] = '_';
5785   if (targetm.libfunc_gnu_prefix)
5786     {
5787       nondec_name[2] = 'g';
5788       nondec_name[3] = 'n';
5789       nondec_name[4] = 'u';
5790       nondec_name[5] = '_';
5791     }
5792
5793   memcpy (&nondec_name[prefix_len], opname, opname_len);
5794   nondec_suffix = nondec_name + opname_len + prefix_len;
5795
5796   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5797   dec_name[0] = '_';
5798   dec_name[1] = '_';
5799   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5800   memcpy (&dec_name[2+dec_len], opname, opname_len);
5801   dec_suffix = dec_name + dec_len + opname_len + 2;
5802
5803   fname = GET_MODE_NAME (fmode);
5804   tname = GET_MODE_NAME (tmode);
5805
5806   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5807     {
5808       libfunc_name = dec_name;
5809       suffix = dec_suffix;
5810     }
5811   else
5812     {
5813       libfunc_name = nondec_name;
5814       suffix = nondec_suffix;
5815     }
5816
5817   p = suffix;
5818   for (q = fname; *q; p++, q++)
5819     *p = TOLOWER (*q);
5820   for (q = tname; *q; p++, q++)
5821     *p = TOLOWER (*q);
5822
5823   *p = '\0';
5824
5825   set_conv_libfunc (tab, tmode, fmode,
5826                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5827 }
5828
5829 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5830    int->fp conversion.  */
5831
5832 void
5833 gen_int_to_fp_conv_libfunc (convert_optab tab,
5834                             const char *opname,
5835                             enum machine_mode tmode,
5836                             enum machine_mode fmode)
5837 {
5838   if (GET_MODE_CLASS (fmode) != MODE_INT)
5839     return;
5840   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5841     return;
5842   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5843 }
5844
5845 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5846    naming scheme.  */
5847
5848 void
5849 gen_ufloat_conv_libfunc (convert_optab tab,
5850                          const char *opname ATTRIBUTE_UNUSED,
5851                          enum machine_mode tmode,
5852                          enum machine_mode fmode)
5853 {
5854   if (DECIMAL_FLOAT_MODE_P (tmode))
5855     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5856   else
5857     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5858 }
5859
5860 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5861    fp->int conversion.  */
5862
5863 void
5864 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5865                                        const char *opname,
5866                                        enum machine_mode tmode,
5867                                        enum machine_mode fmode)
5868 {
5869   if (GET_MODE_CLASS (fmode) != MODE_INT)
5870     return;
5871   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5872     return;
5873   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5874 }
5875
5876 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5877    fp->int conversion with no decimal floating point involved.  */
5878
5879 void
5880 gen_fp_to_int_conv_libfunc (convert_optab tab,
5881                             const char *opname,
5882                             enum machine_mode tmode,
5883                             enum machine_mode fmode)
5884 {
5885   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5886     return;
5887   if (GET_MODE_CLASS (tmode) != MODE_INT)
5888     return;
5889   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5890 }
5891
5892 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5893    The string formation rules are
5894    similar to the ones for init_libfunc, above.  */
5895
5896 void
5897 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5898                              enum machine_mode tmode, enum machine_mode fmode)
5899 {
5900   size_t opname_len = strlen (opname);
5901   size_t mname_len = 0;
5902
5903   const char *fname, *tname;
5904   const char *q;
5905   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5906   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5907   char *libfunc_name, *suffix;
5908   char *p;
5909
5910   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5911      depends on which underlying decimal floating point format is used.  */
5912   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5913
5914   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5915
5916   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5917   nondec_name[0] = '_';
5918   nondec_name[1] = '_';
5919   if (targetm.libfunc_gnu_prefix)
5920     {
5921       nondec_name[2] = 'g';
5922       nondec_name[3] = 'n';
5923       nondec_name[4] = 'u';
5924       nondec_name[5] = '_';
5925     }
5926   memcpy (&nondec_name[prefix_len], opname, opname_len);
5927   nondec_suffix = nondec_name + opname_len + prefix_len;
5928
5929   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5930   dec_name[0] = '_';
5931   dec_name[1] = '_';
5932   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5933   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5934   dec_suffix = dec_name + dec_len + opname_len + 2;
5935
5936   fname = GET_MODE_NAME (fmode);
5937   tname = GET_MODE_NAME (tmode);
5938
5939   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5940     {
5941       libfunc_name = dec_name;
5942       suffix = dec_suffix;
5943     }
5944   else
5945     {
5946       libfunc_name = nondec_name;
5947       suffix = nondec_suffix;
5948     }
5949
5950   p = suffix;
5951   for (q = fname; *q; p++, q++)
5952     *p = TOLOWER (*q);
5953   for (q = tname; *q; p++, q++)
5954     *p = TOLOWER (*q);
5955
5956   *p++ = '2';
5957   *p = '\0';
5958
5959   set_conv_libfunc (tab, tmode, fmode,
5960                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5961 }
5962
5963 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5964    truncation or extension and interclass or intraclass.  */
5965
5966 void
5967 gen_trunc_conv_libfunc (convert_optab tab,
5968                          const char *opname,
5969                          enum machine_mode tmode,
5970                          enum machine_mode fmode)
5971 {
5972   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5973     return;
5974   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5975     return;
5976   if (tmode == fmode)
5977     return;
5978
5979   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5980       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5981      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5982
5983   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5984     return;
5985
5986   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5987        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5988       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5989     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5990 }
5991
5992 /* Pick proper libcall for extend_optab.  We need to chose if we do
5993    truncation or extension and interclass or intraclass.  */
5994
5995 void
5996 gen_extend_conv_libfunc (convert_optab tab,
5997                          const char *opname ATTRIBUTE_UNUSED,
5998                          enum machine_mode tmode,
5999                          enum machine_mode fmode)
6000 {
6001   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
6002     return;
6003   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
6004     return;
6005   if (tmode == fmode)
6006     return;
6007
6008   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
6009       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
6010      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6011
6012   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
6013     return;
6014
6015   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
6016        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
6017       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
6018     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6019 }
6020
6021 /* Pick proper libcall for fract_optab.  We need to chose if we do
6022    interclass or intraclass.  */
6023
6024 void
6025 gen_fract_conv_libfunc (convert_optab tab,
6026                         const char *opname,
6027                         enum machine_mode tmode,
6028                         enum machine_mode fmode)
6029 {
6030   if (tmode == fmode)
6031     return;
6032   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
6033     return;
6034
6035   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6036     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6037   else
6038     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6039 }
6040
6041 /* Pick proper libcall for fractuns_optab.  */
6042
6043 void
6044 gen_fractuns_conv_libfunc (convert_optab tab,
6045                            const char *opname,
6046                            enum machine_mode tmode,
6047                            enum machine_mode fmode)
6048 {
6049   if (tmode == fmode)
6050     return;
6051   /* One mode must be a fixed-point mode, and the other must be an integer
6052      mode. */
6053   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6054         || (ALL_FIXED_POINT_MODE_P (fmode)
6055             && GET_MODE_CLASS (tmode) == MODE_INT)))
6056     return;
6057
6058   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6059 }
6060
6061 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6062    interclass or intraclass.  */
6063
6064 void
6065 gen_satfract_conv_libfunc (convert_optab tab,
6066                            const char *opname,
6067                            enum machine_mode tmode,
6068                            enum machine_mode fmode)
6069 {
6070   if (tmode == fmode)
6071     return;
6072   /* TMODE must be a fixed-point mode.  */
6073   if (!ALL_FIXED_POINT_MODE_P (tmode))
6074     return;
6075
6076   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6077     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6078   else
6079     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6080 }
6081
6082 /* Pick proper libcall for satfractuns_optab.  */
6083
6084 void
6085 gen_satfractuns_conv_libfunc (convert_optab tab,
6086                               const char *opname,
6087                               enum machine_mode tmode,
6088                               enum machine_mode fmode)
6089 {
6090   if (tmode == fmode)
6091     return;
6092   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6093   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6094     return;
6095
6096   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6097 }
6098
6099 /* A table of previously-created libfuncs, hashed by name.  */
6100 static GTY ((param_is (union tree_node))) htab_t libfunc_decls;
6101
6102 /* Hashtable callbacks for libfunc_decls.  */
6103
6104 static hashval_t
6105 libfunc_decl_hash (const void *entry)
6106 {
6107   return IDENTIFIER_HASH_VALUE (DECL_NAME ((const_tree) entry));
6108 }
6109
6110 static int
6111 libfunc_decl_eq (const void *entry1, const void *entry2)
6112 {
6113   return DECL_NAME ((const_tree) entry1) == (const_tree) entry2;
6114 }
6115
6116 /* Build a decl for a libfunc named NAME. */
6117
6118 tree
6119 build_libfunc_function (const char *name)
6120 {
6121   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6122                           get_identifier (name),
6123                           build_function_type (integer_type_node, NULL_TREE));
6124   /* ??? We don't have any type information except for this is
6125      a function.  Pretend this is "int foo()".  */
6126   DECL_ARTIFICIAL (decl) = 1;
6127   DECL_EXTERNAL (decl) = 1;
6128   TREE_PUBLIC (decl) = 1;
6129   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6130
6131   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6132      are the flags assigned by targetm.encode_section_info.  */
6133   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6134
6135   return decl;
6136 }
6137
6138 rtx
6139 init_one_libfunc (const char *name)
6140 {
6141   tree id, decl;
6142   void **slot;
6143   hashval_t hash;
6144
6145   if (libfunc_decls == NULL)
6146     libfunc_decls = htab_create_ggc (37, libfunc_decl_hash,
6147                                      libfunc_decl_eq, NULL);
6148
6149   /* See if we have already created a libfunc decl for this function.  */
6150   id = get_identifier (name);
6151   hash = IDENTIFIER_HASH_VALUE (id);
6152   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, INSERT);
6153   decl = (tree) *slot;
6154   if (decl == NULL)
6155     {
6156       /* Create a new decl, so that it can be passed to
6157          targetm.encode_section_info.  */
6158       decl = build_libfunc_function (name);
6159       *slot = decl;
6160     }
6161   return XEXP (DECL_RTL (decl), 0);
6162 }
6163
6164 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6165
6166 rtx
6167 set_user_assembler_libfunc (const char *name, const char *asmspec)
6168 {
6169   tree id, decl;
6170   void **slot;
6171   hashval_t hash;
6172
6173   id = get_identifier (name);
6174   hash = IDENTIFIER_HASH_VALUE (id);
6175   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, NO_INSERT);
6176   gcc_assert (slot);
6177   decl = (tree) *slot;
6178   set_user_assembler_name (decl, asmspec);
6179   return XEXP (DECL_RTL (decl), 0);
6180 }
6181
6182 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6183    MODE to NAME, which should be either 0 or a string constant.  */
6184 void
6185 set_optab_libfunc (optab op, enum machine_mode mode, const char *name)
6186 {
6187   rtx val;
6188   struct libfunc_entry e;
6189   struct libfunc_entry **slot;
6190
6191   e.op = op;
6192   e.mode1 = mode;
6193   e.mode2 = VOIDmode;
6194
6195   if (name)
6196     val = init_one_libfunc (name);
6197   else
6198     val = 0;
6199   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6200   if (*slot == NULL)
6201     *slot = ggc_alloc<libfunc_entry> ();
6202   (*slot)->op = op;
6203   (*slot)->mode1 = mode;
6204   (*slot)->mode2 = VOIDmode;
6205   (*slot)->libfunc = val;
6206 }
6207
6208 /* Call this to reset the function entry for one conversion optab
6209    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6210    either 0 or a string constant.  */
6211 void
6212 set_conv_libfunc (convert_optab optab, enum machine_mode tmode,
6213                   enum machine_mode fmode, const char *name)
6214 {
6215   rtx val;
6216   struct libfunc_entry e;
6217   struct libfunc_entry **slot;
6218
6219   e.op = optab;
6220   e.mode1 = tmode;
6221   e.mode2 = fmode;
6222
6223   if (name)
6224     val = init_one_libfunc (name);
6225   else
6226     val = 0;
6227   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6228   if (*slot == NULL)
6229     *slot = ggc_alloc<libfunc_entry> ();
6230   (*slot)->op = optab;
6231   (*slot)->mode1 = tmode;
6232   (*slot)->mode2 = fmode;
6233   (*slot)->libfunc = val;
6234 }
6235
6236 /* Call this to initialize the contents of the optabs
6237    appropriately for the current target machine.  */
6238
6239 void
6240 init_optabs (void)
6241 {
6242   if (libfunc_hash)
6243     htab_empty (libfunc_hash);
6244   else
6245     libfunc_hash = htab_create_ggc (10, hash_libfunc, eq_libfunc, NULL);
6246
6247   /* Fill in the optabs with the insns we support.  */
6248   init_all_optabs (this_fn_optabs);
6249
6250   /* The ffs function operates on `int'.  Fall back on it if we do not
6251      have a libgcc2 function for that width.  */
6252   if (INT_TYPE_SIZE < BITS_PER_WORD)
6253     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6254                        "ffs");
6255
6256   /* Explicitly initialize the bswap libfuncs since we need them to be
6257      valid for things other than word_mode.  */
6258   if (targetm.libfunc_gnu_prefix)
6259     {
6260       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6261       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6262     }
6263   else
6264     {
6265       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6266       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6267     }
6268
6269   /* Use cabs for double complex abs, since systems generally have cabs.
6270      Don't define any libcall for float complex, so that cabs will be used.  */
6271   if (complex_double_type_node)
6272     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6273                        "cabs");
6274
6275   abort_libfunc = init_one_libfunc ("abort");
6276   memcpy_libfunc = init_one_libfunc ("memcpy");
6277   memmove_libfunc = init_one_libfunc ("memmove");
6278   memcmp_libfunc = init_one_libfunc ("memcmp");
6279   memset_libfunc = init_one_libfunc ("memset");
6280   setbits_libfunc = init_one_libfunc ("__setbits");
6281
6282 #ifndef DONT_USE_BUILTIN_SETJMP
6283   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6284   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6285 #else
6286   setjmp_libfunc = init_one_libfunc ("setjmp");
6287   longjmp_libfunc = init_one_libfunc ("longjmp");
6288 #endif
6289   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6290   unwind_sjlj_unregister_libfunc
6291     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6292
6293   /* For function entry/exit instrumentation.  */
6294   profile_function_entry_libfunc
6295     = init_one_libfunc ("__cyg_profile_func_enter");
6296   profile_function_exit_libfunc
6297     = init_one_libfunc ("__cyg_profile_func_exit");
6298
6299   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6300
6301   /* Allow the target to add more libcalls or rename some, etc.  */
6302   targetm.init_libfuncs ();
6303 }
6304
6305 /* Use the current target and options to initialize
6306    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6307
6308 void
6309 init_tree_optimization_optabs (tree optnode)
6310 {
6311   /* Quick exit if we have already computed optabs for this target.  */
6312   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6313     return;
6314
6315   /* Forget any previous information and set up for the current target.  */
6316   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6317   struct target_optabs *tmp_optabs = (struct target_optabs *)
6318     TREE_OPTIMIZATION_OPTABS (optnode);
6319   if (tmp_optabs)
6320     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6321   else
6322     tmp_optabs = ggc_alloc<target_optabs> ();
6323
6324   /* Generate a new set of optabs into tmp_optabs.  */
6325   init_all_optabs (tmp_optabs);
6326
6327   /* If the optabs changed, record it.  */
6328   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6329     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6330   else
6331     {
6332       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6333       ggc_free (tmp_optabs);
6334     }
6335 }
6336
6337 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6338    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6339
6340 static void
6341 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6342 {
6343   enum machine_mode mode;
6344   char buf[64];
6345   size_t len = strlen (base);
6346   int i;
6347
6348   gcc_assert (max <= 8);
6349   gcc_assert (len + 3 < sizeof (buf));
6350
6351   memcpy (buf, base, len);
6352   buf[len] = '_';
6353   buf[len + 1] = '0';
6354   buf[len + 2] = '\0';
6355
6356   mode = QImode;
6357   for (i = 1; i <= max; i *= 2)
6358     {
6359       buf[len + 1] = '0' + i;
6360       set_optab_libfunc (tab, mode, buf);
6361       mode = GET_MODE_2XWIDER_MODE (mode);
6362     }
6363 }
6364
6365 void
6366 init_sync_libfuncs (int max)
6367 {
6368   if (!flag_sync_libcalls)
6369     return;
6370
6371   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6372                         "__sync_val_compare_and_swap", max);
6373   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6374                         "__sync_lock_test_and_set", max);
6375
6376   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6377   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6378   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6379   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6380   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6381   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6382
6383   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6384   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6385   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6386   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6387   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6388   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6389 }
6390
6391 /* Print information about the current contents of the optabs on
6392    STDERR.  */
6393
6394 DEBUG_FUNCTION void
6395 debug_optab_libfuncs (void)
6396 {
6397   int i, j, k;
6398
6399   /* Dump the arithmetic optabs.  */
6400   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6401     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6402       {
6403         rtx l = optab_libfunc ((optab) i, (enum machine_mode) j);
6404         if (l)
6405           {
6406             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6407             fprintf (stderr, "%s\t%s:\t%s\n",
6408                      GET_RTX_NAME (optab_to_code ((optab) i)),
6409                      GET_MODE_NAME (j),
6410                      XSTR (l, 0));
6411           }
6412       }
6413
6414   /* Dump the conversion optabs.  */
6415   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6416     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6417       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6418         {
6419           rtx l = convert_optab_libfunc ((optab) i, (enum machine_mode) j,
6420                                          (enum machine_mode) k);
6421           if (l)
6422             {
6423               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6424               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6425                        GET_RTX_NAME (optab_to_code ((optab) i)),
6426                        GET_MODE_NAME (j),
6427                        GET_MODE_NAME (k),
6428                        XSTR (l, 0));
6429             }
6430         }
6431 }
6432
6433 \f
6434 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6435    CODE.  Return 0 on failure.  */
6436
6437 rtx
6438 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6439 {
6440   enum machine_mode mode = GET_MODE (op1);
6441   enum insn_code icode;
6442   rtx insn;
6443   rtx trap_rtx;
6444
6445   if (mode == VOIDmode)
6446     return 0;
6447
6448   icode = optab_handler (ctrap_optab, mode);
6449   if (icode == CODE_FOR_nothing)
6450     return 0;
6451
6452   /* Some targets only accept a zero trap code.  */
6453   if (!insn_operand_matches (icode, 3, tcode))
6454     return 0;
6455
6456   do_pending_stack_adjust ();
6457   start_sequence ();
6458   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6459                     &trap_rtx, &mode);
6460   if (!trap_rtx)
6461     insn = NULL_RTX;
6462   else
6463     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6464                             tcode);
6465
6466   /* If that failed, then give up.  */
6467   if (insn == 0)
6468     {
6469       end_sequence ();
6470       return 0;
6471     }
6472
6473   emit_insn (insn);
6474   insn = get_insns ();
6475   end_sequence ();
6476   return insn;
6477 }
6478
6479 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6480    or unsigned operation code.  */
6481
6482 static enum rtx_code
6483 get_rtx_code (enum tree_code tcode, bool unsignedp)
6484 {
6485   enum rtx_code code;
6486   switch (tcode)
6487     {
6488     case EQ_EXPR:
6489       code = EQ;
6490       break;
6491     case NE_EXPR:
6492       code = NE;
6493       break;
6494     case LT_EXPR:
6495       code = unsignedp ? LTU : LT;
6496       break;
6497     case LE_EXPR:
6498       code = unsignedp ? LEU : LE;
6499       break;
6500     case GT_EXPR:
6501       code = unsignedp ? GTU : GT;
6502       break;
6503     case GE_EXPR:
6504       code = unsignedp ? GEU : GE;
6505       break;
6506
6507     case UNORDERED_EXPR:
6508       code = UNORDERED;
6509       break;
6510     case ORDERED_EXPR:
6511       code = ORDERED;
6512       break;
6513     case UNLT_EXPR:
6514       code = UNLT;
6515       break;
6516     case UNLE_EXPR:
6517       code = UNLE;
6518       break;
6519     case UNGT_EXPR:
6520       code = UNGT;
6521       break;
6522     case UNGE_EXPR:
6523       code = UNGE;
6524       break;
6525     case UNEQ_EXPR:
6526       code = UNEQ;
6527       break;
6528     case LTGT_EXPR:
6529       code = LTGT;
6530       break;
6531
6532     default:
6533       gcc_unreachable ();
6534     }
6535   return code;
6536 }
6537
6538 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6539    unsigned operators. Do not generate compare instruction.  */
6540
6541 static rtx
6542 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6543                     bool unsignedp, enum insn_code icode)
6544 {
6545   struct expand_operand ops[2];
6546   rtx rtx_op0, rtx_op1;
6547   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6548
6549   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6550
6551   /* Expand operands.  */
6552   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6553                          EXPAND_STACK_PARM);
6554   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6555                          EXPAND_STACK_PARM);
6556
6557   create_input_operand (&ops[0], rtx_op0, GET_MODE (rtx_op0));
6558   create_input_operand (&ops[1], rtx_op1, GET_MODE (rtx_op1));
6559   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6560     gcc_unreachable ();
6561   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6562 }
6563
6564 /* Return true if VEC_PERM_EXPR can be expanded using SIMD extensions
6565    of the CPU.  SEL may be NULL, which stands for an unknown constant.  */
6566
6567 bool
6568 can_vec_perm_p (enum machine_mode mode, bool variable,
6569                 const unsigned char *sel)
6570 {
6571   enum machine_mode qimode;
6572
6573   /* If the target doesn't implement a vector mode for the vector type,
6574      then no operations are supported.  */
6575   if (!VECTOR_MODE_P (mode))
6576     return false;
6577
6578   if (!variable)
6579     {
6580       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6581           && (sel == NULL
6582               || targetm.vectorize.vec_perm_const_ok == NULL
6583               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6584         return true;
6585     }
6586
6587   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6588     return true;
6589
6590   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6591   if (GET_MODE_INNER (mode) == QImode)
6592     return false;
6593   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6594   if (!VECTOR_MODE_P (qimode))
6595     return false;
6596
6597   /* ??? For completeness, we ought to check the QImode version of
6598       vec_perm_const_optab.  But all users of this implicit lowering
6599       feature implement the variable vec_perm_optab.  */
6600   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6601     return false;
6602
6603   /* In order to support the lowering of variable permutations,
6604      we need to support shifts and adds.  */
6605   if (variable)
6606     {
6607       if (GET_MODE_UNIT_SIZE (mode) > 2
6608           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6609           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6610         return false;
6611       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6612         return false;
6613     }
6614
6615   return true;
6616 }
6617
6618 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6619
6620 static rtx
6621 expand_vec_perm_1 (enum insn_code icode, rtx target,
6622                    rtx v0, rtx v1, rtx sel)
6623 {
6624   enum machine_mode tmode = GET_MODE (target);
6625   enum machine_mode smode = GET_MODE (sel);
6626   struct expand_operand ops[4];
6627
6628   create_output_operand (&ops[0], target, tmode);
6629   create_input_operand (&ops[3], sel, smode);
6630
6631   /* Make an effort to preserve v0 == v1.  The target expander is able to
6632      rely on this to determine if we're permuting a single input operand.  */
6633   if (rtx_equal_p (v0, v1))
6634     {
6635       if (!insn_operand_matches (icode, 1, v0))
6636         v0 = force_reg (tmode, v0);
6637       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6638       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6639
6640       create_fixed_operand (&ops[1], v0);
6641       create_fixed_operand (&ops[2], v0);
6642     }
6643   else
6644     {
6645       create_input_operand (&ops[1], v0, tmode);
6646       create_input_operand (&ops[2], v1, tmode);
6647     }
6648
6649   if (maybe_expand_insn (icode, 4, ops))
6650     return ops[0].value;
6651   return NULL_RTX;
6652 }
6653
6654 /* Generate instructions for vec_perm optab given its mode
6655    and three operands.  */
6656
6657 rtx
6658 expand_vec_perm (enum machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6659 {
6660   enum insn_code icode;
6661   enum machine_mode qimode;
6662   unsigned int i, w, e, u;
6663   rtx tmp, sel_qi = NULL;
6664   rtvec vec;
6665
6666   if (!target || GET_MODE (target) != mode)
6667     target = gen_reg_rtx (mode);
6668
6669   w = GET_MODE_SIZE (mode);
6670   e = GET_MODE_NUNITS (mode);
6671   u = GET_MODE_UNIT_SIZE (mode);
6672
6673   /* Set QIMODE to a different vector mode with byte elements.
6674      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6675   qimode = VOIDmode;
6676   if (GET_MODE_INNER (mode) != QImode)
6677     {
6678       qimode = mode_for_vector (QImode, w);
6679       if (!VECTOR_MODE_P (qimode))
6680         qimode = VOIDmode;
6681     }
6682
6683   /* If the input is a constant, expand it specially.  */
6684   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
6685   if (GET_CODE (sel) == CONST_VECTOR)
6686     {
6687       icode = direct_optab_handler (vec_perm_const_optab, mode);
6688       if (icode != CODE_FOR_nothing)
6689         {
6690           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6691           if (tmp)
6692             return tmp;
6693         }
6694
6695       /* Fall back to a constant byte-based permutation.  */
6696       if (qimode != VOIDmode)
6697         {
6698           vec = rtvec_alloc (w);
6699           for (i = 0; i < e; ++i)
6700             {
6701               unsigned int j, this_e;
6702
6703               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
6704               this_e &= 2 * e - 1;
6705               this_e *= u;
6706
6707               for (j = 0; j < u; ++j)
6708                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
6709             }
6710           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
6711
6712           icode = direct_optab_handler (vec_perm_const_optab, qimode);
6713           if (icode != CODE_FOR_nothing)
6714             {
6715               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6716               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6717                                        gen_lowpart (qimode, v1), sel_qi);
6718               if (tmp)
6719                 return gen_lowpart (mode, tmp);
6720             }
6721         }
6722     }
6723
6724   /* Otherwise expand as a fully variable permuation.  */
6725   icode = direct_optab_handler (vec_perm_optab, mode);
6726   if (icode != CODE_FOR_nothing)
6727     {
6728       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6729       if (tmp)
6730         return tmp;
6731     }
6732
6733   /* As a special case to aid several targets, lower the element-based
6734      permutation to a byte-based permutation and try again.  */
6735   if (qimode == VOIDmode)
6736     return NULL_RTX;
6737   icode = direct_optab_handler (vec_perm_optab, qimode);
6738   if (icode == CODE_FOR_nothing)
6739     return NULL_RTX;
6740
6741   if (sel_qi == NULL)
6742     {
6743       /* Multiply each element by its byte size.  */
6744       enum machine_mode selmode = GET_MODE (sel);
6745       if (u == 2)
6746         sel = expand_simple_binop (selmode, PLUS, sel, sel,
6747                                    sel, 0, OPTAB_DIRECT);
6748       else
6749         sel = expand_simple_binop (selmode, ASHIFT, sel,
6750                                    GEN_INT (exact_log2 (u)),
6751                                    sel, 0, OPTAB_DIRECT);
6752       gcc_assert (sel != NULL);
6753
6754       /* Broadcast the low byte each element into each of its bytes.  */
6755       vec = rtvec_alloc (w);
6756       for (i = 0; i < w; ++i)
6757         {
6758           int this_e = i / u * u;
6759           if (BYTES_BIG_ENDIAN)
6760             this_e += u - 1;
6761           RTVEC_ELT (vec, i) = GEN_INT (this_e);
6762         }
6763       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6764       sel = gen_lowpart (qimode, sel);
6765       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
6766       gcc_assert (sel != NULL);
6767
6768       /* Add the byte offset to each byte element.  */
6769       /* Note that the definition of the indices here is memory ordering,
6770          so there should be no difference between big and little endian.  */
6771       vec = rtvec_alloc (w);
6772       for (i = 0; i < w; ++i)
6773         RTVEC_ELT (vec, i) = GEN_INT (i % u);
6774       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6775       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6776                                     sel, 0, OPTAB_DIRECT);
6777       gcc_assert (sel_qi != NULL);
6778     }
6779
6780   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6781   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6782                            gen_lowpart (qimode, v1), sel_qi);
6783   if (tmp)
6784     tmp = gen_lowpart (mode, tmp);
6785   return tmp;
6786 }
6787
6788 /* Return insn code for a conditional operator with a comparison in
6789    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6790
6791 static inline enum insn_code
6792 get_vcond_icode (enum machine_mode vmode, enum machine_mode cmode, bool uns)
6793 {
6794   enum insn_code icode = CODE_FOR_nothing;
6795   if (uns)
6796     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6797   else
6798     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6799   return icode;
6800 }
6801
6802 /* Return TRUE iff, appropriate vector insns are available
6803    for vector cond expr with vector type VALUE_TYPE and a comparison
6804    with operand vector types in CMP_OP_TYPE.  */
6805
6806 bool
6807 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6808 {
6809   enum machine_mode value_mode = TYPE_MODE (value_type);
6810   enum machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6811   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6812       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6813       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6814                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6815     return false;
6816   return true;
6817 }
6818
/* Generate insns for a VEC_COND_EXPR, given its TYPE and its
   three operands.

   VEC_COND_TYPE is the type of the result.  OP0 is the condition: either
   a comparison tree, or a non-comparison value that is treated as
   "OP0 < 0".  OP1 and OP2 are expanded and handed to the pattern as its
   operands 1 and 2.  TARGET is the suggested place for the result.

   Returns the rtx holding the result, or 0 if there is no vcond/vcondu
   pattern for the (result mode, comparison mode) pair.  */

rtx
expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
                      rtx target)
{
  struct expand_operand ops[6];
  enum insn_code icode;
  rtx comparison, rtx_op1, rtx_op2;
  enum machine_mode mode = TYPE_MODE (vec_cond_type);
  enum machine_mode cmp_op_mode;
  bool unsignedp;
  tree op0a, op0b;
  enum tree_code tcode;

  /* Split the condition into a comparison code and its two operands.  */
  if (COMPARISON_CLASS_P (op0))
    {
      op0a = TREE_OPERAND (op0, 0);
      op0b = TREE_OPERAND (op0, 1);
      tcode = TREE_CODE (op0);
    }
  else
    {
      /* Fake op0 < 0.  This is only done for a signed OP0 type.  */
      gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
      op0a = op0;
      op0b = build_zero_cst (TREE_TYPE (op0));
      tcode = LT_EXPR;
    }
  /* Signedness and mode are taken from the first comparison operand.  */
  unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
  cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));


  /* Same checks as expand_vec_cond_expr_p: result and comparison modes
     must match in size and in number of units.  */
  gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
              && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));

  icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
  if (icode == CODE_FOR_nothing)
    return 0;

  comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
  rtx_op1 = expand_normal (op1);
  rtx_op2 = expand_normal (op2);

  /* Pattern operands: 0 = result, 1 and 2 = the two values, 3 = the
     comparison rtx itself, 4 and 5 = the comparison's two operands.  */
  create_output_operand (&ops[0], target, mode);
  create_input_operand (&ops[1], rtx_op1, mode);
  create_input_operand (&ops[2], rtx_op2, mode);
  create_fixed_operand (&ops[3], comparison);
  create_fixed_operand (&ops[4], XEXP (comparison, 0));
  create_fixed_operand (&ops[5], XEXP (comparison, 1));
  expand_insn (icode, 6, ops);
  return ops[0].value;
}
6873
6874 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6875    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6876    2 for even/odd widening, and 3 for hi/lo widening.  */
6877
6878 int
6879 can_mult_highpart_p (enum machine_mode mode, bool uns_p)
6880 {
6881   optab op;
6882   unsigned char *sel;
6883   unsigned i, nunits;
6884
6885   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6886   if (optab_handler (op, mode) != CODE_FOR_nothing)
6887     return 1;
6888
6889   /* If the mode is an integral vector, synth from widening operations.  */
6890   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6891     return 0;
6892
6893   nunits = GET_MODE_NUNITS (mode);
6894   sel = XALLOCAVEC (unsigned char, nunits);
6895
6896   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6897   if (optab_handler (op, mode) != CODE_FOR_nothing)
6898     {
6899       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6900       if (optab_handler (op, mode) != CODE_FOR_nothing)
6901         {
6902           for (i = 0; i < nunits; ++i)
6903             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6904           if (can_vec_perm_p (mode, false, sel))
6905             return 2;
6906         }
6907     }
6908
6909   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6910   if (optab_handler (op, mode) != CODE_FOR_nothing)
6911     {
6912       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6913       if (optab_handler (op, mode) != CODE_FOR_nothing)
6914         {
6915           for (i = 0; i < nunits; ++i)
6916             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6917           if (can_vec_perm_p (mode, false, sel))
6918             return 3;
6919         }
6920     }
6921
6922   return 0;
6923 }
6924
/* Expand a highpart multiply of OP0 and OP1 in MODE, using the unsigned
   optabs when UNS_P is true.  TARGET is the suggested place for the
   result.  The strategy is the one reported by can_mult_highpart_p;
   NULL_RTX is returned when that function reports 0.  */

rtx
expand_mult_highpart (enum machine_mode mode, rtx op0, rtx op1,
                      rtx target, bool uns_p)
{
  struct expand_operand eops[3];
  enum insn_code icode;
  int method, i, nunits;
  enum machine_mode wmode;
  rtx m1, m2, perm;
  optab tab1, tab2;
  rtvec v;

  method = can_mult_highpart_p (mode, uns_p);
  switch (method)
    {
    case 0:
      /* Neither a direct pattern nor a synthesis is available.  */
      return NULL_RTX;
    case 1:
      /* Direct highpart multiply.  */
      tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
      return expand_binop (mode, tab1, op0, op1, target, uns_p,
                           OPTAB_LIB_WIDEN);
    case 2:
      /* Even/odd widening multiplies.  */
      tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
      tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
      break;
    case 3:
      /* Lo/hi widening multiplies; the two are swapped on big-endian
         targets.  */
      tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
      tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
      if (BYTES_BIG_ENDIAN)
        {
          optab t = tab1;
          tab1 = tab2;
          tab2 = t;
        }
      break;
    default:
      gcc_unreachable ();
    }

  /* The wide mode is taken from the output operand of the first pattern;
     it must have half as many units as MODE and the same total size.  */
  icode = optab_handler (tab1, mode);
  nunits = GET_MODE_NUNITS (mode);
  wmode = insn_data[icode].operand[0].mode;
  gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
  gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));

  /* First widening multiply; view its result in MODE.  */
  create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
  create_input_operand (&eops[1], op0, mode);
  create_input_operand (&eops[2], op1, mode);
  expand_insn (icode, 3, eops);
  m1 = gen_lowpart (mode, eops[0].value);

  /* Second widening multiply, likewise.  */
  create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
  create_input_operand (&eops[1], op0, mode);
  create_input_operand (&eops[2], op1, mode);
  expand_insn (optab_handler (tab2, mode), 3, eops);
  m2 = gen_lowpart (mode, eops[0].value);

  /* Build the constant selector that picks elements out of M1 and M2.
     These are the same index formulas that can_mult_highpart_p checked
     with can_vec_perm_p for the corresponding method.  */
  v = rtvec_alloc (nunits);
  if (method == 2)
    {
      for (i = 0; i < nunits; ++i)
        RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
                                    + ((i & 1) ? nunits : 0));
    }
  else
    {
      for (i = 0; i < nunits; ++i)
        RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
    }
  perm = gen_rtx_CONST_VECTOR (mode, v);

  return expand_vec_perm (mode, m1, m2, perm, target);
}
7000
7001 /* Return true if target supports vector masked load/store for mode.  */
7002 bool
7003 can_vec_mask_load_store_p (enum machine_mode mode, bool is_load)
7004 {
7005   optab op = is_load ? maskload_optab : maskstore_optab;
7006   enum machine_mode vmode;
7007   unsigned int vector_sizes;
7008
7009   /* If mode is vector mode, check it directly.  */
7010   if (VECTOR_MODE_P (mode))
7011     return optab_handler (op, mode) != CODE_FOR_nothing;
7012
7013   /* Otherwise, return true if there is some vector mode with
7014      the mask load/store supported.  */
7015
7016   /* See if there is any chance the mask load or store might be
7017      vectorized.  If not, punt.  */
7018   vmode = targetm.vectorize.preferred_simd_mode (mode);
7019   if (!VECTOR_MODE_P (vmode))
7020     return false;
7021
7022   if (optab_handler (op, vmode) != CODE_FOR_nothing)
7023     return true;
7024
7025   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
7026   while (vector_sizes != 0)
7027     {
7028       unsigned int cur = 1 << floor_log2 (vector_sizes);
7029       vector_sizes &= ~cur;
7030       if (cur <= GET_MODE_SIZE (mode))
7031         continue;
7032       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
7033       if (VECTOR_MODE_P (vmode)
7034           && optab_handler (op, vmode) != CODE_FOR_nothing)
7035         return true;
7036     }
7037   return false;
7038 }
7039 \f
7040 /* Return true if there is a compare_and_swap pattern.  */
7041
7042 bool
7043 can_compare_and_swap_p (enum machine_mode mode, bool allow_libcall)
7044 {
7045   enum insn_code icode;
7046
7047   /* Check for __atomic_compare_and_swap.  */
7048   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7049   if (icode != CODE_FOR_nothing)
7050     return true;
7051
7052   /* Check for __sync_compare_and_swap.  */
7053   icode = optab_handler (sync_compare_and_swap_optab, mode);
7054   if (icode != CODE_FOR_nothing)
7055     return true;
7056   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7057     return true;
7058
7059   /* No inline compare and swap.  */
7060   return false;
7061 }
7062
7063 /* Return true if an atomic exchange can be performed.  */
7064
7065 bool
7066 can_atomic_exchange_p (enum machine_mode mode, bool allow_libcall)
7067 {
7068   enum insn_code icode;
7069
7070   /* Check for __atomic_exchange.  */
7071   icode = direct_optab_handler (atomic_exchange_optab, mode);
7072   if (icode != CODE_FOR_nothing)
7073     return true;
7074
7075   /* Don't check __sync_test_and_set, as on some platforms that
7076      has reduced functionality.  Targets that really do support
7077      a proper exchange should simply be updated to the __atomics.  */
7078
7079   return can_compare_and_swap_p (mode, allow_libcall);
7080 }
7081
7082
7083 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7084    pattern.  */
7085
7086 static void
7087 find_cc_set (rtx x, const_rtx pat, void *data)
7088 {
7089   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7090       && GET_CODE (pat) == SET)
7091     {
7092       rtx *p_cc_reg = (rtx *) data;
7093       gcc_assert (!*p_cc_reg);
7094       *p_cc_reg = x;
7095     }
7096 }
7097
/* This is a helper function for the other atomic operations.  This function
   emits a loop that contains SEQ that iterates until a compare-and-swap
   operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
   a set of instructions that takes a value from OLD_REG as an input and
   produces a value in NEW_REG as an output; it may be null, in which case
   nothing is emitted between the load and the compare-and-swap.  Before
   SEQ, OLD_REG will be set to the current contents of MEM.  After SEQ, a
   compare-and-swap will attempt to update MEM with NEW_REG.  The function
   returns true when the loop was generated successfully, and false when
   no compare-and-swap could be expanded.  */

static bool
expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
{
  enum machine_mode mode = GET_MODE (mem);
  rtx_code_label *label;
  rtx cmp_reg, success, oldval;

  /* The loop we want to generate looks like

        cmp_reg = mem;
      label:
        old_reg = cmp_reg;
        seq;
        (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
        if (!success)
          goto label;

     Note that we only do the plain load from memory once.  Subsequent
     iterations use the value loaded by the compare-and-swap pattern.  */

  label = gen_label_rtx ();
  cmp_reg = gen_reg_rtx (mode);

  emit_move_insn (cmp_reg, mem);
  emit_label (label);
  emit_move_insn (old_reg, cmp_reg);
  if (seq)
    emit_insn (seq);

  /* Let the expander choose where the success flag lives, but ask for
     the old value to be placed in CMP_REG.  */
  success = NULL_RTX;
  oldval = cmp_reg;
  if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
                                       new_reg, false, MEMMODEL_SEQ_CST,
                                       MEMMODEL_RELAXED))
    return false;

  /* The expander may have put the old value somewhere else; copy it back
     so the next iteration sees it in CMP_REG.  */
  if (oldval != cmp_reg)
    emit_move_insn (cmp_reg, oldval);

  /* Loop back when SUCCESS is zero.  Mark this jump predicted not taken.  */
  emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
                           GET_MODE (success), 1, label, 0);
  return true;
}
7151
7152
7153 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7154    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7155    using TARGET if possible.  */
7156
7157 static rtx
7158 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7159 {
7160   enum machine_mode mode = GET_MODE (mem);
7161   enum insn_code icode;
7162
7163   /* If the target supports the exchange directly, great.  */
7164   icode = direct_optab_handler (atomic_exchange_optab, mode);
7165   if (icode != CODE_FOR_nothing)
7166     {
7167       struct expand_operand ops[4];
7168
7169       create_output_operand (&ops[0], target, mode);
7170       create_fixed_operand (&ops[1], mem);
7171       create_input_operand (&ops[2], val, mode);
7172       create_integer_operand (&ops[3], model);
7173       if (maybe_expand_insn (icode, 4, ops))
7174         return ops[0].value;
7175     }
7176
7177   return NULL_RTX;
7178 }
7179
/* This function tries to implement an atomic exchange operation using
   __sync_lock_test_and_set.  VAL is written to *MEM using memory model MODEL.
   The previous contents of *MEM are returned, using TARGET if possible.
   Since this instruction is an acquire barrier only, stronger memory
   models may require additional barriers to be emitted.  NULL_RTX is
   returned, and nothing is left emitted, when neither the pattern nor a
   suitable library function can be used.  */

static rtx
maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
                                   enum memmodel model)
{
  enum machine_mode mode = GET_MODE (mem);
  enum insn_code icode;
  /* Remember where we started so a speculatively emitted barrier can be
     removed again on failure.  */
  rtx_insn *last_insn = get_last_insn ();

  icode = optab_handler (sync_lock_test_and_set_optab, mode);

  /* Legacy sync_lock_test_and_set is an acquire barrier.  If the memory
     model is stronger than acquire, add a release barrier before the
     instruction.  The barrier is emitted before we know whether the
     exchange itself can be emitted; it is deleted at the end of this
     function if not.  */

  if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST
      || (model & MEMMODEL_MASK) == MEMMODEL_RELEASE
      || (model & MEMMODEL_MASK) == MEMMODEL_ACQ_REL)
    expand_mem_thread_fence (model);

  if (icode != CODE_FOR_nothing)
    {
      struct expand_operand ops[3];
      create_output_operand (&ops[0], target, mode);
      create_fixed_operand (&ops[1], mem);
      create_input_operand (&ops[2], val, mode);
      if (maybe_expand_insn (icode, 3, ops))
        return ops[0].value;
    }

  /* If an external test-and-set libcall is provided, use that instead of
     any external compare-and-swap that we might get from the compare-and-
     swap-loop expansion later.  */
  if (!can_compare_and_swap_p (mode, false))
    {
      rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
      if (libfunc != NULL)
        {
          rtx addr;

          addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
          return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
                                          mode, 2, addr, ptr_mode,
                                          val, mode);
        }
    }

  /* If the test_and_set can't be emitted, eliminate any barrier that might
     have been emitted.  */
  delete_insns_since (last_insn);
  return NULL_RTX;
}
7237
7238 /* This function tries to implement an atomic exchange operation using a
7239    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7240    *MEM are returned, using TARGET if possible.  No memory model is required
7241    since a compare_and_swap loop is seq-cst.  */
7242
7243 static rtx
7244 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7245 {
7246   enum machine_mode mode = GET_MODE (mem);
7247
7248   if (can_compare_and_swap_p (mode, true))
7249     {
7250       if (!target || !register_operand (target, mode))
7251         target = gen_reg_rtx (mode);
7252       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7253         return target;
7254     }
7255
7256   return NULL_RTX;
7257 }
7258
7259 /* This function tries to implement an atomic test-and-set operation
7260    using the atomic_test_and_set instruction pattern.  A boolean value
7261    is returned from the operation, using TARGET if possible.  */
7262
7263 #ifndef HAVE_atomic_test_and_set
7264 #define HAVE_atomic_test_and_set 0
7265 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7266 #endif
7267
7268 static rtx
7269 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7270 {
7271   enum machine_mode pat_bool_mode;
7272   struct expand_operand ops[3];
7273
7274   if (!HAVE_atomic_test_and_set)
7275     return NULL_RTX;
7276
7277   /* While we always get QImode from __atomic_test_and_set, we get
7278      other memory modes from __sync_lock_test_and_set.  Note that we
7279      use no endian adjustment here.  This matches the 4.6 behavior
7280      in the Sparc backend.  */
7281   gcc_checking_assert
7282     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7283   if (GET_MODE (mem) != QImode)
7284     mem = adjust_address_nv (mem, QImode, 0);
7285
7286   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7287   create_output_operand (&ops[0], target, pat_bool_mode);
7288   create_fixed_operand (&ops[1], mem);
7289   create_integer_operand (&ops[2], model);
7290
7291   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7292     return ops[0].value;
7293   return NULL_RTX;
7294 }
7295
7296 /* This function expands the legacy _sync_lock test_and_set operation which is
7297    generally an atomic exchange.  Some limited targets only allow the
7298    constant 1 to be stored.  This is an ACQUIRE operation.
7299
7300    TARGET is an optional place to stick the return value.
7301    MEM is where VAL is stored.  */
7302
7303 rtx
7304 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7305 {
7306   rtx ret;
7307
7308   /* Try an atomic_exchange first.  */
7309   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_ACQUIRE);
7310   if (ret)
7311     return ret;
7312
7313   ret = maybe_emit_sync_lock_test_and_set (target, mem, val, MEMMODEL_ACQUIRE);
7314   if (ret)
7315     return ret;
7316
7317   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7318   if (ret)
7319     return ret;
7320
7321   /* If there are no other options, try atomic_test_and_set if the value
7322      being stored is 1.  */
7323   if (val == const1_rtx)
7324     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_ACQUIRE);
7325
7326   return ret;
7327 }
7328
/* This function expands the atomic test_and_set operation:
   atomically store a boolean TRUE into MEM and return the previous value.

   MODEL is the memory model variant to use.
   TARGET is an optional place to stick the return value.

   The strategies are tried in this order: the atomic_test_and_set
   pattern, an atomic exchange, a compare-and-swap loop, the legacy
   lock_test_and_set, and finally a plain load followed by a store.  */

rtx
expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
{
  enum machine_mode mode = GET_MODE (mem);
  rtx ret, trueval, subtarget;

  ret = maybe_emit_atomic_test_and_set (target, mem, model);
  if (ret)
    return ret;

  /* Be binary compatible with non-default settings of trueval, and different
     cpu revisions.  E.g. one revision may have atomic-test-and-set, but
     another only has atomic-exchange.  */
  if (targetm.atomic_test_and_set_trueval == 1)
    {
      trueval = const1_rtx;
      subtarget = target ? target : gen_reg_rtx (mode);
    }
  else
    {
      /* The raw old value still has to be turned into a boolean at the
         end, so collect it in a fresh register rather than in TARGET.  */
      trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
      subtarget = gen_reg_rtx (mode);
    }

  /* Try the atomic-exchange optab...  */
  ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);

  /* ... then an atomic-compare-and-swap loop ... */
  if (!ret)
    ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);

  /* ... before trying the vaguely defined legacy lock_test_and_set. */
  if (!ret)
    ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);

  /* Recall that the legacy lock_test_and_set optab was allowed to do magic
     things with the value 1.  Thus we try again without trueval.  */
  if (!ret && targetm.atomic_test_and_set_trueval != 1)
    ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);

  /* Failing all else, assume a single threaded environment and simply
     perform the operation.  */
  if (!ret)
    {
      /* If the result is ignored skip the move to target.  */
      if (subtarget != const0_rtx)
        emit_move_insn (subtarget, mem);

      emit_move_insn (mem, trueval);
      ret = subtarget;
    }

  /* Recall that we have to return a boolean value; rectify if trueval
     is not exactly one.  */
  if (targetm.atomic_test_and_set_trueval != 1)
    ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);

  return ret;
}
7394
7395 /* This function expands the atomic exchange operation:
7396    atomically store VAL in MEM and return the previous value in MEM.
7397
7398    MEMMODEL is the memory model variant to use.
7399    TARGET is an optional place to stick the return value.  */
7400
7401 rtx
7402 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7403 {
7404   rtx ret;
7405
7406   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7407
7408   /* Next try a compare-and-swap loop for the exchange.  */
7409   if (!ret)
7410     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7411
7412   return ret;
7413 }
7414
/* This function expands the atomic compare exchange operation:

   *PTARGET_BOOL is an optional place to store the boolean success/failure.
   *PTARGET_OVAL is an optional place to store the old value from memory.
   Both target parameters may be NULL to indicate that we do not care about
   that return value.  Both target parameters are updated on success to
   the actual location of the corresponding result.

   MEM is the memory operated on; EXPECTED and DESIRED are the value to
   compare against and the value to store.  IS_WEAK, SUCC_MODEL and
   FAIL_MODEL are handed to the atomic_compare_and_swap pattern as its
   operands 5, 6 and 7; the __sync fallbacks below do not use them.

   The return value of the function is true for success.  */

bool
expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
                                rtx mem, rtx expected, rtx desired,
                                bool is_weak, enum memmodel succ_model,
                                enum memmodel fail_model)
{
  enum machine_mode mode = GET_MODE (mem);
  struct expand_operand ops[8];
  enum insn_code icode;
  rtx target_oval, target_bool = NULL_RTX;
  rtx libfunc;

  /* Load expected into a register for the compare and swap.  */
  if (MEM_P (expected))
    expected = copy_to_reg (expected);

  /* Make sure we always have some place to put the return oldval.
     Further, make sure that place is distinct from the input expected,
     just in case we need that path down below.  */
  if (ptarget_oval == NULL
      || (target_oval = *ptarget_oval) == NULL
      || reg_overlap_mentioned_p (expected, target_oval))
    target_oval = gen_reg_rtx (mode);

  /* First choice: the atomic_compare_and_swap pattern.  */
  icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
  if (icode != CODE_FOR_nothing)
    {
      enum machine_mode bool_mode = insn_data[icode].operand[0].mode;

      /* Make sure we always have a place for the bool operand.  */
      if (ptarget_bool == NULL
          || (target_bool = *ptarget_bool) == NULL
          || GET_MODE (target_bool) != bool_mode)
        target_bool = gen_reg_rtx (bool_mode);

      /* Emit the compare_and_swap.  */
      create_output_operand (&ops[0], target_bool, bool_mode);
      create_output_operand (&ops[1], target_oval, mode);
      create_fixed_operand (&ops[2], mem);
      create_input_operand (&ops[3], expected, mode);
      create_input_operand (&ops[4], desired, mode);
      create_integer_operand (&ops[5], is_weak);
      create_integer_operand (&ops[6], succ_model);
      create_integer_operand (&ops[7], fail_model);
      if (maybe_expand_insn (icode, 8, ops))
        {
          /* Return success/failure.  */
          target_bool = ops[0].value;
          target_oval = ops[1].value;
          goto success;
        }
    }

  /* Otherwise fall back to the original __sync_val_compare_and_swap
     which is always seq-cst.  */
  icode = optab_handler (sync_compare_and_swap_optab, mode);
  if (icode != CODE_FOR_nothing)
    {
      rtx cc_reg;

      create_output_operand (&ops[0], target_oval, mode);
      create_fixed_operand (&ops[1], mem);
      create_input_operand (&ops[2], expected, mode);
      create_input_operand (&ops[3], desired, mode);
      if (!maybe_expand_insn (icode, 4, ops))
        return false;

      target_oval = ops[0].value;

      /* If the caller isn't interested in the boolean return value,
         skip the computation of it.  */
      if (ptarget_bool == NULL)
        goto success;

      /* Otherwise, work out if the compare-and-swap succeeded.  If the
         insn just emitted sets a condition-code register, derive the
         boolean from that; otherwise compare the old value with
         EXPECTED.  */
      cc_reg = NULL_RTX;
      if (have_insn_for (COMPARE, CCmode))
        note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
      if (cc_reg)
        {
          target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
                                               const0_rtx, VOIDmode, 0, 1);
          goto success;
        }
      goto success_bool_from_val;
    }

  /* Also check for library support for __sync_val_compare_and_swap.  */
  libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
  if (libfunc != NULL)
    {
      rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
      target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
                                             mode, 3, addr, ptr_mode,
                                             expected, mode, desired, mode);

      /* Compute the boolean return value only if requested.  */
      if (ptarget_bool)
        goto success_bool_from_val;
      else
        goto success;
    }

  /* Failure.  */
  return false;

  /* The swap succeeded exactly when the old value equals EXPECTED.  */
 success_bool_from_val:
   target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
                                        expected, VOIDmode, 1, 1);
 success:
  /* Make sure that the oval output winds up where the caller asked.  */
  if (ptarget_oval)
    *ptarget_oval = target_oval;
  if (ptarget_bool)
    *ptarget_bool = target_bool;
  return true;
}
7544
7545 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7546
7547 static void
7548 expand_asm_memory_barrier (void)
7549 {
7550   rtx asm_op, clob;
7551
7552   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7553                                  rtvec_alloc (0), rtvec_alloc (0),
7554                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7555   MEM_VOLATILE_P (asm_op) = 1;
7556
7557   clob = gen_rtx_SCRATCH (VOIDmode);
7558   clob = gen_rtx_MEM (BLKmode, clob);
7559   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7560
7561   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7562 }
7563
7564 /* This routine will either emit the mem_thread_fence pattern or issue a
7565    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7566
7567 #ifndef HAVE_mem_thread_fence
7568 # define HAVE_mem_thread_fence 0
7569 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7570 #endif
7571 #ifndef HAVE_memory_barrier
7572 # define HAVE_memory_barrier 0
7573 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7574 #endif
7575
7576 void
7577 expand_mem_thread_fence (enum memmodel model)
7578 {
7579   if (HAVE_mem_thread_fence)
7580     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7581   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7582     {
7583       if (HAVE_memory_barrier)
7584         emit_insn (gen_memory_barrier ());
7585       else if (synchronize_libfunc != NULL_RTX)
7586         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7587       else
7588         expand_asm_memory_barrier ();
7589     }
7590 }
7591
7592 /* This routine will either emit the mem_signal_fence pattern or issue a
7593    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7594
7595 #ifndef HAVE_mem_signal_fence
7596 # define HAVE_mem_signal_fence 0
7597 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7598 #endif
7599
7600 void
7601 expand_mem_signal_fence (enum memmodel model)
7602 {
7603   if (HAVE_mem_signal_fence)
7604     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7605   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7606     {
7607       /* By default targets are coherent between a thread and the signal
7608          handler running on the same thread.  Thus this really becomes a
7609          compiler barrier, in that stores must not be sunk past
7610          (or raised above) a given point.  */
7611       expand_asm_memory_barrier ();
7612     }
7613 }
7614
7615 /* This function expands the atomic load operation:
7616    return the atomically loaded value in MEM.
7617
7618    MEMMODEL is the memory model variant to use.
7619    TARGET is an option place to stick the return value.  */
7620
7621 rtx
7622 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7623 {
7624   enum machine_mode mode = GET_MODE (mem);
7625   enum insn_code icode;
7626
7627   /* If the target supports the load directly, great.  */
7628   icode = direct_optab_handler (atomic_load_optab, mode);
7629   if (icode != CODE_FOR_nothing)
7630     {
7631       struct expand_operand ops[3];
7632
7633       create_output_operand (&ops[0], target, mode);
7634       create_fixed_operand (&ops[1], mem);
7635       create_integer_operand (&ops[2], model);
7636       if (maybe_expand_insn (icode, 3, ops))
7637         return ops[0].value;
7638     }
7639
7640   /* If the size of the object is greater than word size on this target,
7641      then we assume that a load will not be atomic.  */
7642   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7643     {
7644       /* Issue val = compare_and_swap (mem, 0, 0).
7645          This may cause the occasional harmless store of 0 when the value is
7646          already 0, but it seems to be OK according to the standards guys.  */
7647       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7648                                           const0_rtx, false, model, model))
7649         return target;
7650       else
7651       /* Otherwise there is no atomic load, leave the library call.  */
7652         return NULL_RTX;
7653     }
7654
7655   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7656   if (!target || target == const0_rtx)
7657     target = gen_reg_rtx (mode);
7658
7659   /* For SEQ_CST, emit a barrier before the load.  */
7660   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7661     expand_mem_thread_fence (model);
7662
7663   emit_move_insn (target, mem);
7664
7665   /* Emit the appropriate barrier after the load.  */
7666   expand_mem_thread_fence (model);
7667
7668   return target;
7669 }
7670
7671 /* This function expands the atomic store operation:
7672    Atomically store VAL in MEM.
7673    MEMMODEL is the memory model variant to use.
7674    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7675    function returns const0_rtx if a pattern was emitted.  */
7676
7677 rtx
7678 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7679 {
7680   enum machine_mode mode = GET_MODE (mem);
7681   enum insn_code icode;
7682   struct expand_operand ops[3];
7683
7684   /* If the target supports the store directly, great.  */
7685   icode = direct_optab_handler (atomic_store_optab, mode);
7686   if (icode != CODE_FOR_nothing)
7687     {
7688       create_fixed_operand (&ops[0], mem);
7689       create_input_operand (&ops[1], val, mode);
7690       create_integer_operand (&ops[2], model);
7691       if (maybe_expand_insn (icode, 3, ops))
7692         return const0_rtx;
7693     }
7694
7695   /* If using __sync_lock_release is a viable alternative, try it.  */
7696   if (use_release)
7697     {
7698       icode = direct_optab_handler (sync_lock_release_optab, mode);
7699       if (icode != CODE_FOR_nothing)
7700         {
7701           create_fixed_operand (&ops[0], mem);
7702           create_input_operand (&ops[1], const0_rtx, mode);
7703           if (maybe_expand_insn (icode, 2, ops))
7704             {
7705               /* lock_release is only a release barrier.  */
7706               if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7707                 expand_mem_thread_fence (model);
7708               return const0_rtx;
7709             }
7710         }
7711     }
7712
7713   /* If the size of the object is greater than word size on this target,
7714      a default store will not be atomic, Try a mem_exchange and throw away
7715      the result.  If that doesn't work, don't do anything.  */
7716   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7717     {
7718       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7719       if (!target)
7720         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7721       if (target)
7722         return const0_rtx;
7723       else
7724         return NULL_RTX;
7725     }
7726
7727   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7728   expand_mem_thread_fence (model);
7729
7730   emit_move_insn (mem, val);
7731
7732   /* For SEQ_CST, also emit a barrier after the store.  */
7733   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7734     expand_mem_thread_fence (model);
7735
7736   return const0_rtx;
7737 }
7738
7739
7740 /* Structure containing the pointers and values required to process the
7741    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7742
7743 struct atomic_op_functions
7744 {
7745   direct_optab mem_fetch_before;
7746   direct_optab mem_fetch_after;
7747   direct_optab mem_no_result;
7748   optab fetch_before;
7749   optab fetch_after;
7750   direct_optab no_result;
7751   enum rtx_code reverse_code;
7752 };
7753
7754
7755 /* Fill in structure pointed to by OP with the various optab entries for an
7756    operation of type CODE.  */
7757
7758 static void
7759 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7760 {
7761   gcc_assert (op!= NULL);
7762
7763   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7764      in the source code during compilation, and the optab entries are not
7765      computable until runtime.  Fill in the values at runtime.  */
7766   switch (code)
7767     {
7768     case PLUS:
7769       op->mem_fetch_before = atomic_fetch_add_optab;
7770       op->mem_fetch_after = atomic_add_fetch_optab;
7771       op->mem_no_result = atomic_add_optab;
7772       op->fetch_before = sync_old_add_optab;
7773       op->fetch_after = sync_new_add_optab;
7774       op->no_result = sync_add_optab;
7775       op->reverse_code = MINUS;
7776       break;
7777     case MINUS:
7778       op->mem_fetch_before = atomic_fetch_sub_optab;
7779       op->mem_fetch_after = atomic_sub_fetch_optab;
7780       op->mem_no_result = atomic_sub_optab;
7781       op->fetch_before = sync_old_sub_optab;
7782       op->fetch_after = sync_new_sub_optab;
7783       op->no_result = sync_sub_optab;
7784       op->reverse_code = PLUS;
7785       break;
7786     case XOR:
7787       op->mem_fetch_before = atomic_fetch_xor_optab;
7788       op->mem_fetch_after = atomic_xor_fetch_optab;
7789       op->mem_no_result = atomic_xor_optab;
7790       op->fetch_before = sync_old_xor_optab;
7791       op->fetch_after = sync_new_xor_optab;
7792       op->no_result = sync_xor_optab;
7793       op->reverse_code = XOR;
7794       break;
7795     case AND:
7796       op->mem_fetch_before = atomic_fetch_and_optab;
7797       op->mem_fetch_after = atomic_and_fetch_optab;
7798       op->mem_no_result = atomic_and_optab;
7799       op->fetch_before = sync_old_and_optab;
7800       op->fetch_after = sync_new_and_optab;
7801       op->no_result = sync_and_optab;
7802       op->reverse_code = UNKNOWN;
7803       break;
7804     case IOR:
7805       op->mem_fetch_before = atomic_fetch_or_optab;
7806       op->mem_fetch_after = atomic_or_fetch_optab;
7807       op->mem_no_result = atomic_or_optab;
7808       op->fetch_before = sync_old_ior_optab;
7809       op->fetch_after = sync_new_ior_optab;
7810       op->no_result = sync_ior_optab;
7811       op->reverse_code = UNKNOWN;
7812       break;
7813     case NOT:
7814       op->mem_fetch_before = atomic_fetch_nand_optab;
7815       op->mem_fetch_after = atomic_nand_fetch_optab;
7816       op->mem_no_result = atomic_nand_optab;
7817       op->fetch_before = sync_old_nand_optab;
7818       op->fetch_after = sync_new_nand_optab;
7819       op->no_result = sync_nand_optab;
7820       op->reverse_code = UNKNOWN;
7821       break;
7822     default:
7823       gcc_unreachable ();
7824     }
7825 }
7826
7827 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7828    using memory order MODEL.  If AFTER is true the operation needs to return
7829    the value of *MEM after the operation, otherwise the previous value.
7830    TARGET is an optional place to place the result.  The result is unused if
7831    it is const0_rtx.
7832    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7833
7834 static rtx
7835 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7836                          enum memmodel model, bool after)
7837 {
7838   /* If the value is prefetched, or not used, it may be possible to replace
7839      the sequence with a native exchange operation.  */
7840   if (!after || target == const0_rtx)
7841     {
7842       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7843       if (code == AND && val == const0_rtx)
7844         {
7845           if (target == const0_rtx)
7846             target = gen_reg_rtx (GET_MODE (mem));
7847           return maybe_emit_atomic_exchange (target, mem, val, model);
7848         }
7849
7850       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7851       if (code == IOR && val == constm1_rtx)
7852         {
7853           if (target == const0_rtx)
7854             target = gen_reg_rtx (GET_MODE (mem));
7855           return maybe_emit_atomic_exchange (target, mem, val, model);
7856         }
7857     }
7858
7859   return NULL_RTX;
7860 }
7861
7862 /* Try to emit an instruction for a specific operation varaition.
7863    OPTAB contains the OP functions.
7864    TARGET is an optional place to return the result. const0_rtx means unused.
7865    MEM is the memory location to operate on.
7866    VAL is the value to use in the operation.
7867    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7868    MODEL is the memory model, if used.
7869    AFTER is true if the returned result is the value after the operation.  */
7870
7871 static rtx
7872 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7873                rtx val, bool use_memmodel, enum memmodel model, bool after)
7874 {
7875   enum machine_mode mode = GET_MODE (mem);
7876   struct expand_operand ops[4];
7877   enum insn_code icode;
7878   int op_counter = 0;
7879   int num_ops;
7880
7881   /* Check to see if there is a result returned.  */
7882   if (target == const0_rtx)
7883     {
7884       if (use_memmodel)
7885         {
7886           icode = direct_optab_handler (optab->mem_no_result, mode);
7887           create_integer_operand (&ops[2], model);
7888           num_ops = 3;
7889         }
7890       else
7891         {
7892           icode = direct_optab_handler (optab->no_result, mode);
7893           num_ops = 2;
7894         }
7895     }
7896   /* Otherwise, we need to generate a result.  */
7897   else
7898     {
7899       if (use_memmodel)
7900         {
7901           icode = direct_optab_handler (after ? optab->mem_fetch_after
7902                                         : optab->mem_fetch_before, mode);
7903           create_integer_operand (&ops[3], model);
7904           num_ops = 4;
7905         }
7906       else
7907         {
7908           icode = optab_handler (after ? optab->fetch_after
7909                                  : optab->fetch_before, mode);
7910           num_ops = 3;
7911         }
7912       create_output_operand (&ops[op_counter++], target, mode);
7913     }
7914   if (icode == CODE_FOR_nothing)
7915     return NULL_RTX;
7916
7917   create_fixed_operand (&ops[op_counter++], mem);
7918   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7919   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7920
7921   if (maybe_expand_insn (icode, num_ops, ops))
7922     return (target == const0_rtx ? const0_rtx : ops[0].value);
7923
7924   return NULL_RTX;
7925 }
7926
7927
7928 /* This function expands an atomic fetch_OP or OP_fetch operation:
7929    TARGET is an option place to stick the return value.  const0_rtx indicates
7930    the result is unused.
7931    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7932    CODE is the operation being performed (OP)
7933    MEMMODEL is the memory model variant to use.
7934    AFTER is true to return the result of the operation (OP_fetch).
7935    AFTER is false to return the value before the operation (fetch_OP).
7936
7937    This function will *only* generate instructions if there is a direct
7938    optab. No compare and swap loops or libcalls will be generated. */
7939
7940 static rtx
7941 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7942                                     enum rtx_code code, enum memmodel model,
7943                                     bool after)
7944 {
7945   enum machine_mode mode = GET_MODE (mem);
7946   struct atomic_op_functions optab;
7947   rtx result;
7948   bool unused_result = (target == const0_rtx);
7949
7950   get_atomic_op_for_code (&optab, code);
7951
7952   /* Check to see if there are any better instructions.  */
7953   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7954   if (result)
7955     return result;
7956
7957   /* Check for the case where the result isn't used and try those patterns.  */
7958   if (unused_result)
7959     {
7960       /* Try the memory model variant first.  */
7961       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7962       if (result)
7963         return result;
7964
7965       /* Next try the old style withuot a memory model.  */
7966       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7967       if (result)
7968         return result;
7969
7970       /* There is no no-result pattern, so try patterns with a result.  */
7971       target = NULL_RTX;
7972     }
7973
7974   /* Try the __atomic version.  */
7975   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7976   if (result)
7977     return result;
7978
7979   /* Try the older __sync version.  */
7980   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7981   if (result)
7982     return result;
7983
7984   /* If the fetch value can be calculated from the other variation of fetch,
7985      try that operation.  */
7986   if (after || unused_result || optab.reverse_code != UNKNOWN)
7987     {
7988       /* Try the __atomic version, then the older __sync version.  */
7989       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7990       if (!result)
7991         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7992
7993       if (result)
7994         {
7995           /* If the result isn't used, no need to do compensation code.  */
7996           if (unused_result)
7997             return result;
7998
7999           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
8000              Fetch_before == after REVERSE_OP val.  */
8001           if (!after)
8002             code = optab.reverse_code;
8003           if (code == NOT)
8004             {
8005               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
8006                                             true, OPTAB_LIB_WIDEN);
8007               result = expand_simple_unop (mode, NOT, result, target, true);
8008             }
8009           else
8010             result = expand_simple_binop (mode, code, result, val, target,
8011                                           true, OPTAB_LIB_WIDEN);
8012           return result;
8013         }
8014     }
8015
8016   /* No direct opcode can be generated.  */
8017   return NULL_RTX;
8018 }
8019
8020
8021
8022 /* This function expands an atomic fetch_OP or OP_fetch operation:
8023    TARGET is an option place to stick the return value.  const0_rtx indicates
8024    the result is unused.
8025    atomically fetch MEM, perform the operation with VAL and return it to MEM.
8026    CODE is the operation being performed (OP)
8027    MEMMODEL is the memory model variant to use.
8028    AFTER is true to return the result of the operation (OP_fetch).
8029    AFTER is false to return the value before the operation (fetch_OP).  */
8030 rtx
8031 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
8032                         enum memmodel model, bool after)
8033 {
8034   enum machine_mode mode = GET_MODE (mem);
8035   rtx result;
8036   bool unused_result = (target == const0_rtx);
8037
8038   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
8039                                                after);
8040
8041   if (result)
8042     return result;
8043
8044   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
8045   if (code == PLUS || code == MINUS)
8046     {
8047       rtx tmp;
8048       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8049
8050       start_sequence ();
8051       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8052       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8053                                                    model, after);
8054       if (result)
8055         {
8056           /* PLUS worked so emit the insns and return.  */
8057           tmp = get_insns ();
8058           end_sequence ();
8059           emit_insn (tmp);
8060           return result;
8061         }
8062
8063       /* PLUS did not work, so throw away the negation code and continue.  */
8064       end_sequence ();
8065     }
8066
8067   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8068   if (!can_compare_and_swap_p (mode, false))
8069     {
8070       rtx libfunc;
8071       bool fixup = false;
8072       enum rtx_code orig_code = code;
8073       struct atomic_op_functions optab;
8074
8075       get_atomic_op_for_code (&optab, code);
8076       libfunc = optab_libfunc (after ? optab.fetch_after
8077                                : optab.fetch_before, mode);
8078       if (libfunc == NULL
8079           && (after || unused_result || optab.reverse_code != UNKNOWN))
8080         {
8081           fixup = true;
8082           if (!after)
8083             code = optab.reverse_code;
8084           libfunc = optab_libfunc (after ? optab.fetch_before
8085                                    : optab.fetch_after, mode);
8086         }
8087       if (libfunc != NULL)
8088         {
8089           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8090           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8091                                             2, addr, ptr_mode, val, mode);
8092
8093           if (!unused_result && fixup)
8094             result = expand_simple_binop (mode, code, result, val, target,
8095                                           true, OPTAB_LIB_WIDEN);
8096           return result;
8097         }
8098
8099       /* We need the original code for any further attempts.  */
8100       code = orig_code;
8101     }
8102
8103   /* If nothing else has succeeded, default to a compare and swap loop.  */
8104   if (can_compare_and_swap_p (mode, true))
8105     {
8106       rtx_insn *insn;
8107       rtx t0 = gen_reg_rtx (mode), t1;
8108
8109       start_sequence ();
8110
8111       /* If the result is used, get a register for it.  */
8112       if (!unused_result)
8113         {
8114           if (!target || !register_operand (target, mode))
8115             target = gen_reg_rtx (mode);
8116           /* If fetch_before, copy the value now.  */
8117           if (!after)
8118             emit_move_insn (target, t0);
8119         }
8120       else
8121         target = const0_rtx;
8122
8123       t1 = t0;
8124       if (code == NOT)
8125         {
8126           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8127                                     true, OPTAB_LIB_WIDEN);
8128           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8129         }
8130       else
8131         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8132                                   OPTAB_LIB_WIDEN);
8133
8134       /* For after, copy the value now.  */
8135       if (!unused_result && after)
8136         emit_move_insn (target, t1);
8137       insn = get_insns ();
8138       end_sequence ();
8139
8140       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8141         return target;
8142     }
8143
8144   return NULL_RTX;
8145 }
8146 \f
8147 /* Return true if OPERAND is suitable for operand number OPNO of
8148    instruction ICODE.  */
8149
8150 bool
8151 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8152 {
8153   return (!insn_data[(int) icode].operand[opno].predicate
8154           || (insn_data[(int) icode].operand[opno].predicate
8155               (operand, insn_data[(int) icode].operand[opno].mode)));
8156 }
8157 \f
8158 /* TARGET is a target of a multiword operation that we are going to
8159    implement as a series of word-mode operations.  Return true if
8160    TARGET is suitable for this purpose.  */
8161
8162 bool
8163 valid_multiword_target_p (rtx target)
8164 {
8165   enum machine_mode mode;
8166   int i;
8167
8168   mode = GET_MODE (target);
8169   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8170     if (!validate_subreg (word_mode, mode, target, i))
8171       return false;
8172   return true;
8173 }
8174
8175 /* Like maybe_legitimize_operand, but do not change the code of the
8176    current rtx value.  */
8177
8178 static bool
8179 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8180                                     struct expand_operand *op)
8181 {
8182   /* See if the operand matches in its current form.  */
8183   if (insn_operand_matches (icode, opno, op->value))
8184     return true;
8185
8186   /* If the operand is a memory whose address has no side effects,
8187      try forcing the address into a non-virtual pseudo register.
8188      The check for side effects is important because copy_to_mode_reg
8189      cannot handle things like auto-modified addresses.  */
8190   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8191     {
8192       rtx addr, mem;
8193
8194       mem = op->value;
8195       addr = XEXP (mem, 0);
8196       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8197           && !side_effects_p (addr))
8198         {
8199           rtx_insn *last;
8200           enum machine_mode mode;
8201
8202           last = get_last_insn ();
8203           mode = get_address_mode (mem);
8204           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8205           if (insn_operand_matches (icode, opno, mem))
8206             {
8207               op->value = mem;
8208               return true;
8209             }
8210           delete_insns_since (last);
8211         }
8212     }
8213
8214   return false;
8215 }
8216
8217 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8218    on success, storing the new operand value back in OP.  */
8219
8220 static bool
8221 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8222                           struct expand_operand *op)
8223 {
8224   enum machine_mode mode, imode;
8225   bool old_volatile_ok, result;
8226
8227   mode = op->mode;
8228   switch (op->type)
8229     {
8230     case EXPAND_FIXED:
8231       old_volatile_ok = volatile_ok;
8232       volatile_ok = true;
8233       result = maybe_legitimize_operand_same_code (icode, opno, op);
8234       volatile_ok = old_volatile_ok;
8235       return result;
8236
8237     case EXPAND_OUTPUT:
8238       gcc_assert (mode != VOIDmode);
8239       if (op->value
8240           && op->value != const0_rtx
8241           && GET_MODE (op->value) == mode
8242           && maybe_legitimize_operand_same_code (icode, opno, op))
8243         return true;
8244
8245       op->value = gen_reg_rtx (mode);
8246       break;
8247
8248     case EXPAND_INPUT:
8249     input:
8250       gcc_assert (mode != VOIDmode);
8251       gcc_assert (GET_MODE (op->value) == VOIDmode
8252                   || GET_MODE (op->value) == mode);
8253       if (maybe_legitimize_operand_same_code (icode, opno, op))
8254         return true;
8255
8256       op->value = copy_to_mode_reg (mode, op->value);
8257       break;
8258
8259     case EXPAND_CONVERT_TO:
8260       gcc_assert (mode != VOIDmode);
8261       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8262       goto input;
8263
8264     case EXPAND_CONVERT_FROM:
8265       if (GET_MODE (op->value) != VOIDmode)
8266         mode = GET_MODE (op->value);
8267       else
8268         /* The caller must tell us what mode this value has.  */
8269         gcc_assert (mode != VOIDmode);
8270
8271       imode = insn_data[(int) icode].operand[opno].mode;
8272       if (imode != VOIDmode && imode != mode)
8273         {
8274           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
8275           mode = imode;
8276         }
8277       goto input;
8278
8279     case EXPAND_ADDRESS:
8280       gcc_assert (mode != VOIDmode);
8281       op->value = convert_memory_address (mode, op->value);
8282       goto input;
8283
8284     case EXPAND_INTEGER:
8285       mode = insn_data[(int) icode].operand[opno].mode;
8286       if (mode != VOIDmode && const_int_operand (op->value, mode))
8287         goto input;
8288       break;
8289     }
8290   return insn_operand_matches (icode, opno, op->value);
8291 }
8292
8293 /* Make OP describe an input operand that should have the same value
8294    as VALUE, after any mode conversion that the target might request.
8295    TYPE is the type of VALUE.  */
8296
8297 void
8298 create_convert_operand_from_type (struct expand_operand *op,
8299                                   rtx value, tree type)
8300 {
8301   create_convert_operand_from (op, value, TYPE_MODE (type),
8302                                TYPE_UNSIGNED (type));
8303 }
8304
8305 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8306    of instruction ICODE.  Return true on success, leaving the new operand
8307    values in the OPS themselves.  Emit no code on failure.  */
8308
8309 bool
8310 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8311                            unsigned int nops, struct expand_operand *ops)
8312 {
8313   rtx_insn *last;
8314   unsigned int i;
8315
8316   last = get_last_insn ();
8317   for (i = 0; i < nops; i++)
8318     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8319       {
8320         delete_insns_since (last);
8321         return false;
8322       }
8323   return true;
8324 }
8325
8326 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8327    as its operands.  Return the instruction pattern on success,
8328    and emit any necessary set-up code.  Return null and emit no
8329    code on failure.  */
8330
8331 rtx
8332 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8333                 struct expand_operand *ops)
8334 {
8335   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8336   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8337     return NULL_RTX;
8338
8339   switch (nops)
8340     {
8341     case 1:
8342       return GEN_FCN (icode) (ops[0].value);
8343     case 2:
8344       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8345     case 3:
8346       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8347     case 4:
8348       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8349                               ops[3].value);
8350     case 5:
8351       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8352                               ops[3].value, ops[4].value);
8353     case 6:
8354       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8355                               ops[3].value, ops[4].value, ops[5].value);
8356     case 7:
8357       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8358                               ops[3].value, ops[4].value, ops[5].value,
8359                               ops[6].value);
8360     case 8:
8361       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8362                               ops[3].value, ops[4].value, ops[5].value,
8363                               ops[6].value, ops[7].value);
8364     case 9:
8365       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8366                               ops[3].value, ops[4].value, ops[5].value,
8367                               ops[6].value, ops[7].value, ops[8].value);
8368     }
8369   gcc_unreachable ();
8370 }
8371
8372 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8373    as its operands.  Return true on success and emit no code on failure.  */
8374
8375 bool
8376 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8377                    struct expand_operand *ops)
8378 {
8379   rtx pat = maybe_gen_insn (icode, nops, ops);
8380   if (pat)
8381     {
8382       emit_insn (pat);
8383       return true;
8384     }
8385   return false;
8386 }
8387
8388 /* Like maybe_expand_insn, but for jumps.  */
8389
8390 bool
8391 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8392                         struct expand_operand *ops)
8393 {
8394   rtx pat = maybe_gen_insn (icode, nops, ops);
8395   if (pat)
8396     {
8397       emit_jump_insn (pat);
8398       return true;
8399     }
8400   return false;
8401 }
8402
8403 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8404    as its operands.  */
8405
8406 void
8407 expand_insn (enum insn_code icode, unsigned int nops,
8408              struct expand_operand *ops)
8409 {
8410   if (!maybe_expand_insn (icode, nops, ops))
8411     gcc_unreachable ();
8412 }
8413
8414 /* Like expand_insn, but for jumps.  */
8415
8416 void
8417 expand_jump_insn (enum insn_code icode, unsigned int nops,
8418                   struct expand_operand *ops)
8419 {
8420   if (!maybe_expand_jump_insn (icode, nops, ops))
8421     gcc_unreachable ();
8422 }
8423
/* Reduce conditional compilation elsewhere: when the target lacks an
   insv, extv or extzv pattern, define the corresponding HAVE_ macro to 0
   and map its insn code to CODE_FOR_nothing.  */
#ifndef HAVE_insv
# define HAVE_insv 0
# define CODE_FOR_insv CODE_FOR_nothing
#endif
#ifndef HAVE_extv
# define HAVE_extv 0
# define CODE_FOR_extv CODE_FOR_nothing
#endif
#ifndef HAVE_extzv
# define HAVE_extzv 0
# define CODE_FOR_extzv CODE_FOR_nothing
#endif
8437
/* Enumerates the possible types of structure operand to an
   extraction_insn.  */
enum extraction_type
{
  /* The structure is a misaligned memory.  */
  ET_unaligned_mem,

  /* The structure is a register.  */
  ET_reg
};
8441
8442 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8443    insertion or extraction of type TYPE on a structure of mode MODE.
8444    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8445    operand number of the structure (the first sign_extract or zero_extract
8446    operand) and FIELD_OP is the operand number of the field (the other
8447    side of the set from the sign_extract or zero_extract).  */
8448
8449 static bool
8450 get_traditional_extraction_insn (extraction_insn *insn,
8451                                  enum extraction_type type,
8452                                  enum machine_mode mode,
8453                                  enum insn_code icode,
8454                                  int struct_op, int field_op)
8455 {
8456   const struct insn_data_d *data = &insn_data[icode];
8457
8458   enum machine_mode struct_mode = data->operand[struct_op].mode;
8459   if (struct_mode == VOIDmode)
8460     struct_mode = word_mode;
8461   if (mode != struct_mode)
8462     return false;
8463
8464   enum machine_mode field_mode = data->operand[field_op].mode;
8465   if (field_mode == VOIDmode)
8466     field_mode = word_mode;
8467
8468   enum machine_mode pos_mode = data->operand[struct_op + 2].mode;
8469   if (pos_mode == VOIDmode)
8470     pos_mode = word_mode;
8471
8472   insn->icode = icode;
8473   insn->field_mode = field_mode;
8474   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8475   insn->pos_mode = pos_mode;
8476   return true;
8477 }
8478
8479 /* Return true if an optab exists to perform an insertion or extraction
8480    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8481
8482    REG_OPTAB is the optab to use for register structures and
8483    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8484    POS_OP is the operand number of the bit position.  */
8485
8486 static bool
8487 get_optab_extraction_insn (struct extraction_insn *insn,
8488                            enum extraction_type type,
8489                            enum machine_mode mode, direct_optab reg_optab,
8490                            direct_optab misalign_optab, int pos_op)
8491 {
8492   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8493   enum insn_code icode = direct_optab_handler (optab, mode);
8494   if (icode == CODE_FOR_nothing)
8495     return false;
8496
8497   const struct insn_data_d *data = &insn_data[icode];
8498
8499   insn->icode = icode;
8500   insn->field_mode = mode;
8501   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8502   insn->pos_mode = data->operand[pos_op].mode;
8503   if (insn->pos_mode == VOIDmode)
8504     insn->pos_mode = word_mode;
8505   return true;
8506 }
8507
8508 /* Return true if an instruction exists to perform an insertion or
8509    extraction (PATTERN says which) of type TYPE in mode MODE.
8510    Describe the instruction in *INSN if so.  */
8511
8512 static bool
8513 get_extraction_insn (extraction_insn *insn,
8514                      enum extraction_pattern pattern,
8515                      enum extraction_type type,
8516                      enum machine_mode mode)
8517 {
8518   switch (pattern)
8519     {
8520     case EP_insv:
8521       if (HAVE_insv
8522           && get_traditional_extraction_insn (insn, type, mode,
8523                                               CODE_FOR_insv, 0, 3))
8524         return true;
8525       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8526                                         insvmisalign_optab, 2);
8527
8528     case EP_extv:
8529       if (HAVE_extv
8530           && get_traditional_extraction_insn (insn, type, mode,
8531                                               CODE_FOR_extv, 1, 0))
8532         return true;
8533       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8534                                         extvmisalign_optab, 3);
8535
8536     case EP_extzv:
8537       if (HAVE_extzv
8538           && get_traditional_extraction_insn (insn, type, mode,
8539                                               CODE_FOR_extzv, 1, 0))
8540         return true;
8541       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8542                                         extzvmisalign_optab, 3);
8543
8544     default:
8545       gcc_unreachable ();
8546     }
8547 }
8548
8549 /* Return true if an instruction exists to access a field of mode
8550    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8551    Describe the "best" such instruction in *INSN if so.  PATTERN and
8552    TYPE describe the type of insertion or extraction we want to perform.
8553
8554    For an insertion, the number of significant structure bits includes
8555    all bits of the target.  For an extraction, it need only include the
8556    most significant bit of the field.  Larger widths are acceptable
8557    in both cases.  */
8558
8559 static bool
8560 get_best_extraction_insn (extraction_insn *insn,
8561                           enum extraction_pattern pattern,
8562                           enum extraction_type type,
8563                           unsigned HOST_WIDE_INT struct_bits,
8564                           enum machine_mode field_mode)
8565 {
8566   enum machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8567   while (mode != VOIDmode)
8568     {
8569       if (get_extraction_insn (insn, pattern, type, mode))
8570         {
8571           while (mode != VOIDmode
8572                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8573                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8574                                                     field_mode))
8575             {
8576               get_extraction_insn (insn, pattern, type, mode);
8577               mode = GET_MODE_WIDER_MODE (mode);
8578             }
8579           return true;
8580         }
8581       mode = GET_MODE_WIDER_MODE (mode);
8582     }
8583   return false;
8584 }
8585
8586 /* Return true if an instruction exists to access a field of mode
8587    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8588    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8589    the type of insertion or extraction we want to perform.
8590
8591    For an insertion, the number of significant structure bits includes
8592    all bits of the target.  For an extraction, it need only include the
8593    most significant bit of the field.  Larger widths are acceptable
8594    in both cases.  */
8595
8596 bool
8597 get_best_reg_extraction_insn (extraction_insn *insn,
8598                               enum extraction_pattern pattern,
8599                               unsigned HOST_WIDE_INT struct_bits,
8600                               enum machine_mode field_mode)
8601 {
8602   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8603                                    field_mode);
8604 }
8605
8606 /* Return true if an instruction exists to access a field of BITSIZE
8607    bits starting BITNUM bits into a memory structure.  Describe the
8608    "best" such instruction in *INSN if so.  PATTERN describes the type
8609    of insertion or extraction we want to perform and FIELDMODE is the
8610    natural mode of the extracted field.
8611
8612    The instructions considered here only access bytes that overlap
8613    the bitfield; they do not touch any surrounding bytes.  */
8614
8615 bool
8616 get_best_mem_extraction_insn (extraction_insn *insn,
8617                               enum extraction_pattern pattern,
8618                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8619                               enum machine_mode field_mode)
8620 {
8621   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8622                                         + bitsize
8623                                         + BITS_PER_UNIT - 1);
8624   struct_bits -= struct_bits % BITS_PER_UNIT;
8625   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8626                                    struct_bits, field_mode);
8627 }
8628
8629 #include "gt-optabs.h"